diff --git "a/wandb/run-20220327_210229-2wif55w7/files/wandb-summary.json" "b/wandb/run-20220327_210229-2wif55w7/files/wandb-summary.json" --- "a/wandb/run-20220327_210229-2wif55w7/files/wandb-summary.json" +++ "b/wandb/run-20220327_210229-2wif55w7/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.3698, "train/learning_rate": 4.057803468208092e-06, "train/epoch": 8.97, "train/global_step": 2000, "_runtime": 46489, "_timestamp": 1648461438, "_step": 2003, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 48.0, 197.0, 392.0, 279.0, 69.0, 14.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9832725524902344, -3.574183464050293, -3.1650943756103516, -2.7560055255889893, -2.346916437149048, -1.9378273487091064, -1.5287384986877441, -1.1196494102478027, -0.7105603218078613, -0.3014712929725647, 0.10761773586273193, 0.5167067050933838, 0.9257957935333252, 1.3348848819732666, 1.743973731994629, 2.1530628204345703, 2.5621519088745117, 2.971240997314453, 3.3803300857543945, 3.789418935775757, 4.198508262634277, 4.607597351074219, 5.016685962677002, 5.425775051116943, 5.834864139556885, 6.243953227996826, 6.653042316436768, 7.062130928039551, 7.471220016479492, 7.880309104919434, 8.289398193359375, 8.698487281799316, 9.107576370239258, 9.5166654586792, 9.92575454711914, 10.334843635559082, 10.743932723999023, 11.153021812438965, 11.562110900878906, 11.971199035644531, 12.380289077758789, 12.78937816619873, 13.198467254638672, 13.607556343078613, 14.016645431518555, 14.425734519958496, 14.834823608398438, 15.243911743164062, 15.653000831604004, 16.062089920043945, 16.47117805480957, 16.880268096923828, 17.289356231689453, 17.69844627380371, 18.107534408569336, 18.516624450683594, 18.92571258544922, 19.334800720214844, 19.7438907623291, 20.152978897094727, 20.562068939208984, 20.97115707397461, 21.380247116088867, 21.789335250854492, 22.19842529296875]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 4.0, 7.0, 12.0, 28.0, 24.0, 32.0, 18.0, 27.0, 24.0, 35.0, 41.0, 45.0, 42.0, 50.0, 42.0, 52.0, 39.0, 55.0, 59.0, 44.0, 28.0, 32.0, 36.0, 39.0, 22.0, 24.0, 26.0, 19.0, 22.0, 12.0, 10.0, 9.0, 7.0, 9.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.747800827026367, -3.639263391494751, -3.5307259559631348, -3.4221882820129395, -3.3136508464813232, -3.205113410949707, -3.096575975418091, -2.9880385398864746, -2.8795008659362793, -2.770963430404663, -2.662425994873047, -2.5538883209228516, -2.4453508853912354, -2.336813449859619, -2.228276014328003, -2.1197385787963867, -2.0112011432647705, -1.9026637077331543, -1.7941261529922485, -1.6855887174606323, -1.5770511627197266, -1.4685137271881104, -1.3599762916564941, -1.251438856124878, -1.1429013013839722, -1.034363865852356, -0.9258263111114502, -0.817288875579834, -0.708751380443573, -0.600213885307312, -0.4916764497756958, -0.3831389546394348, -0.27460145950317383, -0.16606397926807404, -0.05752649903297424, 0.051010966300964355, 0.15954846143722534, 0.26808595657348633, 0.37662339210510254, 0.4851608872413635, 0.5936983823776245, 0.7022358775138855, 0.8107733726501465, 0.9193108081817627, 1.027848243713379, 1.1363857984542847, 1.2449232339859009, 1.3534607887268066, 1.4619982242584229, 1.570535659790039, 1.6790732145309448, 1.787610650062561, 1.8961482048034668, 2.004685640335083, 2.113223075866699, 2.2217605113983154, 2.3302979469299316, 2.438835382461548, 2.547372817993164, 2.6559104919433594, 2.7644479274749756, 2.872985363006592, 2.981522798538208, 3.090060234069824, 3.1985979080200195]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 16.0, 20.0, 50.0, 88.0, 163.0, 378.0, 776.0, 1933.0, 5110.0, 14025.0, 42551.0, 144545.0, 489544.0, 1258242.0, 1385800.0, 595714.0, 175795.0, 51415.0, 17565.0, 6426.0, 2394.0, 936.0, 414.0, 184.0, 76.0, 56.0, 29.0, 12.0, 6.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.21875, -7.04302978515625, -6.8673095703125, -6.69158935546875, -6.515869140625, -6.34014892578125, -6.1644287109375, -5.98870849609375, -5.81298828125, -5.63726806640625, -5.4615478515625, -5.28582763671875, -5.110107421875, -4.93438720703125, -4.7586669921875, -4.58294677734375, -4.4072265625, -4.23150634765625, -4.0557861328125, -3.88006591796875, -3.704345703125, -3.52862548828125, -3.3529052734375, -3.17718505859375, -3.00146484375, -2.82574462890625, -2.6500244140625, -2.47430419921875, -2.298583984375, -2.12286376953125, -1.9471435546875, -1.77142333984375, -1.595703125, -1.41998291015625, -1.2442626953125, -1.06854248046875, -0.892822265625, -0.71710205078125, -0.5413818359375, -0.36566162109375, -0.18994140625, -0.01422119140625, 0.1614990234375, 0.33721923828125, 0.512939453125, 0.68865966796875, 0.8643798828125, 1.04010009765625, 1.2158203125, 1.39154052734375, 1.5672607421875, 1.74298095703125, 1.918701171875, 2.09442138671875, 2.2701416015625, 2.44586181640625, 2.62158203125, 2.79730224609375, 2.9730224609375, 3.14874267578125, 3.324462890625, 3.50018310546875, 3.6759033203125, 3.85162353515625, 4.02734375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 9.0, 17.0, 15.0, 24.0, 24.0, 25.0, 37.0, 43.0, 46.0, 47.0, 58.0, 55.0, 62.0, 66.0, 65.0, 52.0, 51.0, 45.0, 48.0, 48.0, 26.0, 26.0, 25.0, 26.0, 16.0, 15.0, 9.0, 3.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.984375, -7.78228759765625, -7.5802001953125, -7.37811279296875, -7.176025390625, -6.97393798828125, -6.7718505859375, -6.56976318359375, -6.36767578125, -6.16558837890625, -5.9635009765625, -5.76141357421875, -5.559326171875, -5.35723876953125, -5.1551513671875, -4.95306396484375, -4.7509765625, -4.54888916015625, -4.3468017578125, -4.14471435546875, -3.942626953125, -3.74053955078125, -3.5384521484375, -3.33636474609375, -3.13427734375, -2.93218994140625, -2.7301025390625, -2.52801513671875, -2.325927734375, -2.12384033203125, -1.9217529296875, -1.71966552734375, -1.517578125, -1.31549072265625, -1.1134033203125, -0.91131591796875, -0.709228515625, -0.50714111328125, -0.3050537109375, -0.10296630859375, 0.09912109375, 0.30120849609375, 0.5032958984375, 0.70538330078125, 0.907470703125, 1.10955810546875, 1.3116455078125, 1.51373291015625, 1.7158203125, 1.91790771484375, 2.1199951171875, 2.32208251953125, 2.524169921875, 2.72625732421875, 2.9283447265625, 3.13043212890625, 3.33251953125, 3.53460693359375, 3.7366943359375, 3.93878173828125, 4.140869140625, 4.34295654296875, 4.5450439453125, 4.74713134765625, 4.94921875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 13.0, 8.0, 32.0, 94.0, 241.0, 815.0, 3980324.0, 211775.0, 612.0, 199.0, 71.0, 33.0, 16.0, 12.0, 12.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-188.25, -183.6533203125, -179.056640625, -174.4599609375, -169.86328125, -165.2666015625, -160.669921875, -156.0732421875, -151.4765625, -146.8798828125, -142.283203125, -137.6865234375, -133.08984375, -128.4931640625, -123.896484375, -119.2998046875, -114.703125, -110.1064453125, -105.509765625, -100.9130859375, -96.31640625, -91.7197265625, -87.123046875, -82.5263671875, -77.9296875, -73.3330078125, -68.736328125, -64.1396484375, -59.54296875, -54.9462890625, -50.349609375, -45.7529296875, -41.15625, -36.5595703125, -31.962890625, -27.3662109375, -22.76953125, -18.1728515625, -13.576171875, -8.9794921875, -4.3828125, 0.2138671875, 4.810546875, 9.4072265625, 14.00390625, 18.6005859375, 23.197265625, 27.7939453125, 32.390625, 36.9873046875, 41.583984375, 46.1806640625, 50.77734375, 55.3740234375, 59.970703125, 64.5673828125, 69.1640625, 73.7607421875, 78.357421875, 82.9541015625, 87.55078125, 92.1474609375, 96.744140625, 101.3408203125, 105.9375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 17.0, 20.0, 46.0, 117.0, 271.0, 514.0, 1081.0, 1080.0, 470.0, 235.0, 97.0, 46.0, 26.0, 12.0, 6.0, 10.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.96484375, -5.811798095703125, -5.65875244140625, -5.505706787109375, -5.3526611328125, -5.199615478515625, -5.04656982421875, -4.893524169921875, -4.740478515625, -4.587432861328125, -4.43438720703125, -4.281341552734375, -4.1282958984375, -3.975250244140625, -3.82220458984375, -3.669158935546875, -3.51611328125, -3.363067626953125, -3.21002197265625, -3.056976318359375, -2.9039306640625, -2.750885009765625, -2.59783935546875, -2.444793701171875, -2.291748046875, -2.138702392578125, -1.98565673828125, -1.832611083984375, -1.6795654296875, -1.526519775390625, -1.37347412109375, -1.220428466796875, -1.0673828125, -0.914337158203125, -0.76129150390625, -0.608245849609375, -0.4552001953125, -0.302154541015625, -0.14910888671875, 0.003936767578125, 0.156982421875, 0.310028076171875, 0.46307373046875, 0.616119384765625, 0.7691650390625, 0.922210693359375, 1.07525634765625, 1.228302001953125, 1.38134765625, 1.534393310546875, 1.68743896484375, 1.840484619140625, 1.9935302734375, 2.146575927734375, 2.29962158203125, 2.452667236328125, 2.605712890625, 2.758758544921875, 2.91180419921875, 3.064849853515625, 3.2178955078125, 3.370941162109375, 3.52398681640625, 3.677032470703125, 3.830078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 11.0, 11.0, 20.0, 42.0, 62.0, 75.0, 99.0, 95.0, 124.0, 125.0, 106.0, 82.0, 64.0, 42.0, 21.0, 13.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.221722602844238, -4.9310784339904785, -4.6404337882995605, -4.349789619445801, -4.059144973754883, -3.768500804901123, -3.477856397628784, -3.1872119903564453, -2.8965675830841064, -2.6059231758117676, -2.3152787685394287, -2.02463436126709, -1.7339900732040405, -1.4433456659317017, -1.1527013778686523, -0.8620569705963135, -0.5714125633239746, -0.28076818585395813, 0.00987619161605835, 0.30052053928375244, 0.5911649465560913, 0.8818093538284302, 1.1724536418914795, 1.4630980491638184, 1.7537424564361572, 2.044386863708496, 2.335031270980835, 2.625675678253174, 2.9163198471069336, 3.2069644927978516, 3.4976086616516113, 3.78825306892395, 4.078897476196289, 4.369541645050049, 4.660186290740967, 4.950830459594727, 5.2414751052856445, 5.532119274139404, 5.822763442993164, 6.113408088684082, 6.404052734375, 6.69469690322876, 6.985341548919678, 7.2759857177734375, 7.5666303634643555, 7.857274532318115, 8.147918701171875, 8.438563346862793, 8.729207992553711, 9.019852638244629, 9.31049633026123, 9.601140975952148, 9.891785621643066, 10.182430267333984, 10.473073959350586, 10.763718605041504, 11.054362297058105, 11.345006942749023, 11.635650634765625, 11.926295280456543, 12.216939926147461, 12.507584571838379, 12.79822826385498, 13.088872909545898, 13.379517555236816]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 6.0, 8.0, 10.0, 9.0, 22.0, 12.0, 18.0, 10.0, 27.0, 29.0, 35.0, 37.0, 30.0, 44.0, 49.0, 39.0, 51.0, 48.0, 37.0, 39.0, 33.0, 47.0, 31.0, 34.0, 35.0, 24.0, 31.0, 24.0, 39.0, 27.0, 17.0, 18.0, 12.0, 13.0, 11.0, 10.0, 6.0, 8.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.194772720336914, -3.067945718765259, -2.9411187171936035, -2.8142917156219482, -2.687464714050293, -2.560637950897217, -2.4338109493255615, -2.3069839477539062, -2.180156946182251, -2.0533299446105957, -1.9265029430389404, -1.7996760606765747, -1.6728490591049194, -1.5460220575332642, -1.4191951751708984, -1.2923681735992432, -1.165541172027588, -1.0387141704559326, -0.9118872284889221, -0.7850602865219116, -0.6582332849502563, -0.5314062833786011, -0.4045793414115906, -0.2777523994445801, -0.1509253978729248, -0.02409842610359192, 0.10272854566574097, 0.22955551743507385, 0.35638248920440674, 0.483209490776062, 0.6100364327430725, 0.736863374710083, 0.8636908531188965, 0.9905178546905518, 1.117344856262207, 1.2441717386245728, 1.370998740196228, 1.4978257417678833, 1.624652624130249, 1.7514796257019043, 1.8783066272735596, 2.005133628845215, 2.13196063041687, 2.2587876319885254, 2.3856143951416016, 2.512441635131836, 2.639268398284912, 2.7660953998565674, 2.8929224014282227, 3.019749402999878, 3.146576404571533, 3.2734034061431885, 3.4002304077148438, 3.52705717086792, 3.653884172439575, 3.7807111740112305, 3.9075381755828857, 4.034365177154541, 4.161191940307617, 4.288019180297852, 4.414845943450928, 4.541673183441162, 4.668499946594238, 4.795327186584473, 4.922153949737549]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 10.0, 14.0, 22.0, 34.0, 44.0, 65.0, 101.0, 130.0, 235.0, 398.0, 609.0, 1052.0, 2234.0, 6450.0, 28349.0, 155012.0, 495831.0, 285383.0, 54792.0, 11040.0, 3370.0, 1417.0, 699.0, 410.0, 272.0, 171.0, 118.0, 91.0, 48.0, 44.0, 34.0, 15.0, 19.0, 3.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0595703125, -1.025054931640625, -0.99053955078125, -0.956024169921875, -0.9215087890625, -0.886993408203125, -0.85247802734375, -0.817962646484375, -0.783447265625, -0.748931884765625, -0.71441650390625, -0.679901123046875, -0.6453857421875, -0.610870361328125, -0.57635498046875, -0.541839599609375, -0.50732421875, -0.472808837890625, -0.43829345703125, -0.403778076171875, -0.3692626953125, -0.334747314453125, -0.30023193359375, -0.265716552734375, -0.231201171875, -0.196685791015625, -0.16217041015625, -0.127655029296875, -0.0931396484375, -0.058624267578125, -0.02410888671875, 0.010406494140625, 0.044921875, 0.079437255859375, 0.11395263671875, 0.148468017578125, 0.1829833984375, 0.217498779296875, 0.25201416015625, 0.286529541015625, 0.321044921875, 0.355560302734375, 0.39007568359375, 0.424591064453125, 0.4591064453125, 0.493621826171875, 0.52813720703125, 0.562652587890625, 0.59716796875, 0.631683349609375, 0.66619873046875, 0.700714111328125, 0.7352294921875, 0.769744873046875, 0.80426025390625, 0.838775634765625, 0.873291015625, 0.907806396484375, 0.94232177734375, 0.976837158203125, 1.0113525390625, 1.045867919921875, 1.08038330078125, 1.114898681640625, 1.1494140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 13.0, 9.0, 12.0, 12.0, 16.0, 17.0, 17.0, 23.0, 29.0, 38.0, 45.0, 46.0, 50.0, 45.0, 55.0, 49.0, 55.0, 40.0, 41.0, 51.0, 51.0, 42.0, 46.0, 27.0, 38.0, 27.0, 29.0, 17.0, 18.0, 8.0, 10.0, 6.0, 5.0, 1.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.2364501953125, -4.105712890625, -3.9749755859375, -3.84423828125, -3.7135009765625, -3.582763671875, -3.4520263671875, -3.3212890625, -3.1905517578125, -3.059814453125, -2.9290771484375, -2.79833984375, -2.6676025390625, -2.536865234375, -2.4061279296875, -2.275390625, -2.1446533203125, -2.013916015625, -1.8831787109375, -1.75244140625, -1.6217041015625, -1.490966796875, -1.3602294921875, -1.2294921875, -1.0987548828125, -0.968017578125, -0.8372802734375, -0.70654296875, -0.5758056640625, -0.445068359375, -0.3143310546875, -0.18359375, -0.0528564453125, 0.077880859375, 0.2086181640625, 0.33935546875, 0.4700927734375, 0.600830078125, 0.7315673828125, 0.8623046875, 0.9930419921875, 1.123779296875, 1.2545166015625, 1.38525390625, 1.5159912109375, 1.646728515625, 1.7774658203125, 1.908203125, 2.0389404296875, 2.169677734375, 2.3004150390625, 2.43115234375, 2.5618896484375, 2.692626953125, 2.8233642578125, 2.9541015625, 3.0848388671875, 3.215576171875, 3.3463134765625, 3.47705078125, 3.6077880859375, 3.738525390625, 3.8692626953125, 4.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 4.0, 2.0, 8.0, 3.0, 20.0, 23.0, 26.0, 46.0, 81.0, 154.0, 254.0, 468.0, 919.0, 1838.0, 3672.0, 7899.0, 16312.0, 33685.0, 67700.0, 125364.0, 193979.0, 220915.0, 169733.0, 101201.0, 52926.0, 26090.0, 12943.0, 6088.0, 2979.0, 1478.0, 722.0, 428.0, 224.0, 138.0, 79.0, 38.0, 35.0, 30.0, 14.0, 10.0, 4.0, 8.0, 6.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.3701171875, -0.3590087890625, -0.347900390625, -0.3367919921875, -0.32568359375, -0.3145751953125, -0.303466796875, -0.2923583984375, -0.28125, -0.2701416015625, -0.259033203125, -0.2479248046875, -0.23681640625, -0.2257080078125, -0.214599609375, -0.2034912109375, -0.1923828125, -0.1812744140625, -0.170166015625, -0.1590576171875, -0.14794921875, -0.1368408203125, -0.125732421875, -0.1146240234375, -0.103515625, -0.0924072265625, -0.081298828125, -0.0701904296875, -0.05908203125, -0.0479736328125, -0.036865234375, -0.0257568359375, -0.0146484375, -0.0035400390625, 0.007568359375, 0.0186767578125, 0.02978515625, 0.0408935546875, 0.052001953125, 0.0631103515625, 0.07421875, 0.0853271484375, 0.096435546875, 0.1075439453125, 0.11865234375, 0.1297607421875, 0.140869140625, 0.1519775390625, 0.1630859375, 0.1741943359375, 0.185302734375, 0.1964111328125, 0.20751953125, 0.2186279296875, 0.229736328125, 0.2408447265625, 0.251953125, 0.2630615234375, 0.274169921875, 0.2852783203125, 0.29638671875, 0.3074951171875, 0.318603515625, 0.3297119140625, 0.3408203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 8.0, 7.0, 11.0, 14.0, 19.0, 20.0, 28.0, 29.0, 39.0, 45.0, 46.0, 34.0, 41.0, 50.0, 34.0, 59.0, 56.0, 61.0, 49.0, 44.0, 40.0, 35.0, 37.0, 30.0, 31.0, 18.0, 20.0, 18.0, 8.0, 16.0, 9.0, 17.0, 5.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.96038818359375, -7.7098388671875, -7.45928955078125, -7.208740234375, -6.95819091796875, -6.7076416015625, -6.45709228515625, -6.20654296875, -5.95599365234375, -5.7054443359375, -5.45489501953125, -5.204345703125, -4.95379638671875, -4.7032470703125, -4.45269775390625, -4.2021484375, -3.95159912109375, -3.7010498046875, -3.45050048828125, -3.199951171875, -2.94940185546875, -2.6988525390625, -2.44830322265625, -2.19775390625, -1.94720458984375, -1.6966552734375, -1.44610595703125, -1.195556640625, -0.94500732421875, -0.6944580078125, -0.44390869140625, -0.193359375, 0.05718994140625, 0.3077392578125, 0.55828857421875, 0.808837890625, 1.05938720703125, 1.3099365234375, 1.56048583984375, 1.81103515625, 2.06158447265625, 2.3121337890625, 2.56268310546875, 2.813232421875, 3.06378173828125, 3.3143310546875, 3.56488037109375, 3.8154296875, 4.06597900390625, 4.3165283203125, 4.56707763671875, 4.817626953125, 5.06817626953125, 5.3187255859375, 5.56927490234375, 5.81982421875, 6.07037353515625, 6.3209228515625, 6.57147216796875, 6.822021484375, 7.07257080078125, 7.3231201171875, 7.57366943359375, 7.82421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 12.0, 17.0, 25.0, 39.0, 62.0, 85.0, 159.0, 355.0, 664.0, 1451.0, 3368.0, 8278.0, 23301.0, 79817.0, 260619.0, 398191.0, 190468.0, 54204.0, 16533.0, 6057.0, 2466.0, 1129.0, 527.0, 311.0, 172.0, 81.0, 53.0, 34.0, 28.0, 20.0, 5.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059295654296875, -0.05746269226074219, -0.055629730224609375, -0.05379676818847656, -0.05196380615234375, -0.05013084411621094, -0.048297882080078125, -0.04646492004394531, -0.0446319580078125, -0.04279899597167969, -0.040966033935546875, -0.03913307189941406, -0.03730010986328125, -0.03546714782714844, -0.033634185791015625, -0.03180122375488281, -0.02996826171875, -0.028135299682617188, -0.026302337646484375, -0.024469375610351562, -0.02263641357421875, -0.020803451538085938, -0.018970489501953125, -0.017137527465820312, -0.0153045654296875, -0.013471603393554688, -0.011638641357421875, -0.009805679321289062, -0.00797271728515625, -0.0061397552490234375, -0.004306793212890625, -0.0024738311767578125, -0.000640869140625, 0.0011920928955078125, 0.003025054931640625, 0.0048580169677734375, 0.00669097900390625, 0.008523941040039062, 0.010356903076171875, 0.012189865112304688, 0.0140228271484375, 0.015855789184570312, 0.017688751220703125, 0.019521713256835938, 0.02135467529296875, 0.023187637329101562, 0.025020599365234375, 0.026853561401367188, 0.0286865234375, 0.030519485473632812, 0.032352447509765625, 0.03418540954589844, 0.03601837158203125, 0.03785133361816406, 0.039684295654296875, 0.04151725769042969, 0.0433502197265625, 0.04518318176269531, 0.047016143798828125, 0.04884910583496094, 0.05068206787109375, 0.05251502990722656, 0.054347991943359375, 0.05618095397949219, 0.058013916015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 20.0, 33.0, 31.0, 61.0, 59.0, 86.0, 101.0, 85.0, 110.0, 102.0, 72.0, 58.0, 38.0, 36.0, 30.0, 22.0, 12.0, 7.0, 7.0, 5.0, 1.0, 2.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.849931716918945e-05, -7.619522511959076e-05, -7.389113306999207e-05, -7.158704102039337e-05, -6.928294897079468e-05, -6.697885692119598e-05, -6.467476487159729e-05, -6.23706728219986e-05, -6.00665807723999e-05, -5.776248872280121e-05, -5.5458396673202515e-05, -5.315430462360382e-05, -5.085021257400513e-05, -4.854612052440643e-05, -4.624202847480774e-05, -4.3937936425209045e-05, -4.163384437561035e-05, -3.932975232601166e-05, -3.7025660276412964e-05, -3.472156822681427e-05, -3.2417476177215576e-05, -3.0113384127616882e-05, -2.780929207801819e-05, -2.5505200028419495e-05, -2.32011079788208e-05, -2.0897015929222107e-05, -1.8592923879623413e-05, -1.628883183002472e-05, -1.3984739780426025e-05, -1.1680647730827332e-05, -9.376555681228638e-06, -7.072463631629944e-06, -4.76837158203125e-06, -2.464279532432556e-06, -1.601874828338623e-07, 2.1439045667648315e-06, 4.447996616363525e-06, 6.752088665962219e-06, 9.056180715560913e-06, 1.1360272765159607e-05, 1.36643648147583e-05, 1.5968456864356995e-05, 1.827254891395569e-05, 2.0576640963554382e-05, 2.2880733013153076e-05, 2.518482506275177e-05, 2.7488917112350464e-05, 2.9793009161949158e-05, 3.209710121154785e-05, 3.4401193261146545e-05, 3.670528531074524e-05, 3.900937736034393e-05, 4.131346940994263e-05, 4.361756145954132e-05, 4.5921653509140015e-05, 4.822574555873871e-05, 5.05298376083374e-05, 5.2833929657936096e-05, 5.513802170753479e-05, 5.7442113757133484e-05, 5.974620580673218e-05, 6.205029785633087e-05, 6.435438990592957e-05, 6.665848195552826e-05, 6.896257400512695e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 13.0, 9.0, 10.0, 14.0, 13.0, 20.0, 24.0, 23.0, 45.0, 49.0, 54.0, 112.0, 169.0, 318.0, 752.0, 2433.0, 11592.0, 119073.0, 688188.0, 202802.0, 17817.0, 3086.0, 916.0, 397.0, 181.0, 111.0, 81.0, 60.0, 39.0, 35.0, 24.0, 16.0, 14.0, 10.0, 16.0, 9.0, 7.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.10467529296875, -0.1013631820678711, -0.09805107116699219, -0.09473896026611328, -0.09142684936523438, -0.08811473846435547, -0.08480262756347656, -0.08149051666259766, -0.07817840576171875, -0.07486629486083984, -0.07155418395996094, -0.06824207305908203, -0.06492996215820312, -0.06161785125732422, -0.05830574035644531, -0.054993629455566406, -0.0516815185546875, -0.048369407653808594, -0.04505729675292969, -0.04174518585205078, -0.038433074951171875, -0.03512096405029297, -0.03180885314941406, -0.028496742248535156, -0.02518463134765625, -0.021872520446777344, -0.018560409545898438, -0.015248298645019531, -0.011936187744140625, -0.008624076843261719, -0.0053119659423828125, -0.0019998550415039062, 0.001312255859375, 0.004624366760253906, 0.007936477661132812, 0.011248588562011719, 0.014560699462890625, 0.01787281036376953, 0.021184921264648438, 0.024497032165527344, 0.02780914306640625, 0.031121253967285156, 0.03443336486816406, 0.03774547576904297, 0.041057586669921875, 0.04436969757080078, 0.04768180847167969, 0.050993919372558594, 0.0543060302734375, 0.057618141174316406, 0.06093025207519531, 0.06424236297607422, 0.06755447387695312, 0.07086658477783203, 0.07417869567871094, 0.07749080657958984, 0.08080291748046875, 0.08411502838134766, 0.08742713928222656, 0.09073925018310547, 0.09405136108398438, 0.09736347198486328, 0.10067558288574219, 0.1039876937866211, 0.1072998046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 7.0, 7.0, 10.0, 13.0, 19.0, 20.0, 24.0, 29.0, 25.0, 41.0, 36.0, 50.0, 55.0, 61.0, 58.0, 62.0, 65.0, 59.0, 41.0, 38.0, 42.0, 51.0, 24.0, 36.0, 17.0, 21.0, 11.0, 18.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01386260986328125, -0.01343393325805664, -0.013005256652832031, -0.012576580047607422, -0.012147903442382812, -0.011719226837158203, -0.011290550231933594, -0.010861873626708984, -0.010433197021484375, -0.010004520416259766, -0.009575843811035156, -0.009147167205810547, -0.008718490600585938, -0.008289813995361328, -0.007861137390136719, -0.007432460784912109, -0.0070037841796875, -0.006575107574462891, -0.006146430969238281, -0.005717754364013672, -0.0052890777587890625, -0.004860401153564453, -0.004431724548339844, -0.004003047943115234, -0.003574371337890625, -0.0031456947326660156, -0.0027170181274414062, -0.002288341522216797, -0.0018596649169921875, -0.0014309883117675781, -0.0010023117065429688, -0.0005736351013183594, -0.00014495849609375, 0.0002837181091308594, 0.0007123947143554688, 0.0011410713195800781, 0.0015697479248046875, 0.001998424530029297, 0.0024271011352539062, 0.0028557777404785156, 0.003284454345703125, 0.0037131309509277344, 0.004141807556152344, 0.004570484161376953, 0.0049991607666015625, 0.005427837371826172, 0.005856513977050781, 0.006285190582275391, 0.0067138671875, 0.007142543792724609, 0.007571220397949219, 0.007999897003173828, 0.008428573608398438, 0.008857250213623047, 0.009285926818847656, 0.009714603424072266, 0.010143280029296875, 0.010571956634521484, 0.011000633239746094, 0.011429309844970703, 0.011857986450195312, 0.012286663055419922, 0.012715339660644531, 0.01314401626586914, 0.01357269287109375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 6.0, 21.0, 80.0, 186.0, 300.0, 253.0, 128.0, 28.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.939656972885132, -3.3574652671813965, -2.7752737998962402, -2.193082094192505, -1.6108903884887695, -1.0286986827850342, -0.44650721549987793, 0.13568472862243652, 0.7178761959075928, 1.3000679016113281, 1.882259488105774, 2.4644510746002197, 3.046642780303955, 3.6288344860076904, 4.211026191711426, 4.793217658996582, 5.375409126281738, 5.9576005935668945, 6.539792537689209, 7.121984004974365, 7.70417594909668, 8.286367416381836, 8.868558883666992, 9.450750350952148, 10.032942771911621, 10.615134239196777, 11.197325706481934, 11.779518127441406, 12.361709594726562, 12.943901062011719, 13.526092529296875, 14.108283996582031, 14.69047737121582, 15.272668838500977, 15.854860305786133, 16.43705177307129, 17.019243240356445, 17.601436614990234, 18.18362808227539, 18.765819549560547, 19.348011016845703, 19.93020248413086, 20.512393951416016, 21.094585418701172, 21.676776885986328, 22.258968353271484, 22.84115982055664, 23.42335319519043, 24.005542755126953, 24.58773422241211, 25.169925689697266, 25.752117156982422, 26.334308624267578, 26.916500091552734, 27.49869155883789, 28.08088493347168, 28.663076400756836, 29.245267868041992, 29.82745933532715, 30.409650802612305, 30.99184226989746, 31.57403564453125, 32.156227111816406, 32.73841857910156, 33.32061004638672]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 7.0, 10.0, 15.0, 17.0, 9.0, 27.0, 21.0, 37.0, 31.0, 45.0, 50.0, 37.0, 48.0, 50.0, 51.0, 43.0, 41.0, 46.0, 30.0, 42.0, 44.0, 39.0, 36.0, 33.0, 33.0, 28.0, 25.0, 12.0, 17.0, 16.0, 9.0, 11.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.5944013595581055, -3.4812874794006348, -3.368173599243164, -3.2550597190856934, -3.1419458389282227, -3.028831958770752, -2.9157183170318604, -2.8026044368743896, -2.689490556716919, -2.5763766765594482, -2.4632627964019775, -2.350148916244507, -2.2370352745056152, -2.1239213943481445, -2.010807514190674, -1.8976936340332031, -1.7845797538757324, -1.6714658737182617, -1.558351993560791, -1.4452382326126099, -1.3321243524551392, -1.2190104722976685, -1.1058967113494873, -0.9927828311920166, -0.8796689510345459, -0.7665550708770752, -0.6534412503242493, -0.5403274297714233, -0.42721354961395264, -0.31409966945648193, -0.200985848903656, -0.08787202835083008, 0.025242090225219727, 0.13835594058036804, 0.25146979093551636, 0.3645836412906647, 0.477697491645813, 0.5908113718032837, 0.7039251923561096, 0.8170390129089355, 0.9301528930664062, 1.043266773223877, 1.1563806533813477, 1.2694944143295288, 1.3826082944869995, 1.4957221746444702, 1.6088359355926514, 1.721949815750122, 1.8350636959075928, 1.9481775760650635, 2.061291456222534, 2.174405336380005, 2.2875189781188965, 2.400632858276367, 2.513746738433838, 2.6268606185913086, 2.7399744987487793, 2.85308837890625, 2.9662022590637207, 3.0793161392211914, 3.192430019378662, 3.305543899536133, 3.4186575412750244, 3.531771421432495, 3.644885301589966]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 8.0, 8.0, 12.0, 26.0, 35.0, 74.0, 85.0, 178.0, 280.0, 453.0, 744.0, 1389.0, 2479.0, 4200.0, 6982.0, 12547.0, 21282.0, 37298.0, 62309.0, 100772.0, 149799.0, 186360.0, 165873.0, 116339.0, 73352.0, 44447.0, 25962.0, 15084.0, 8524.0, 4909.0, 2820.0, 1661.0, 910.0, 555.0, 330.0, 203.0, 111.0, 51.0, 47.0, 25.0, 13.0, 8.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2470703125, -1.2035675048828125, -1.160064697265625, -1.1165618896484375, -1.07305908203125, -1.0295562744140625, -0.986053466796875, -0.9425506591796875, -0.8990478515625, -0.8555450439453125, -0.812042236328125, -0.7685394287109375, -0.72503662109375, -0.6815338134765625, -0.638031005859375, -0.5945281982421875, -0.551025390625, -0.5075225830078125, -0.464019775390625, -0.4205169677734375, -0.37701416015625, -0.3335113525390625, -0.290008544921875, -0.2465057373046875, -0.2030029296875, -0.1595001220703125, -0.115997314453125, -0.0724945068359375, -0.02899169921875, 0.0145111083984375, 0.058013916015625, 0.1015167236328125, 0.14501953125, 0.1885223388671875, 0.232025146484375, 0.2755279541015625, 0.31903076171875, 0.3625335693359375, 0.406036376953125, 0.4495391845703125, 0.4930419921875, 0.5365447998046875, 0.580047607421875, 0.6235504150390625, 0.66705322265625, 0.7105560302734375, 0.754058837890625, 0.7975616455078125, 0.841064453125, 0.8845672607421875, 0.928070068359375, 0.9715728759765625, 1.01507568359375, 1.0585784912109375, 1.102081298828125, 1.1455841064453125, 1.1890869140625, 1.2325897216796875, 1.276092529296875, 1.3195953369140625, 1.36309814453125, 1.4066009521484375, 1.450103759765625, 1.4936065673828125, 1.537109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 2.0, 6.0, 6.0, 9.0, 17.0, 10.0, 20.0, 18.0, 16.0, 19.0, 22.0, 29.0, 37.0, 34.0, 40.0, 36.0, 42.0, 35.0, 52.0, 47.0, 52.0, 49.0, 30.0, 34.0, 39.0, 45.0, 41.0, 24.0, 22.0, 28.0, 27.0, 19.0, 11.0, 15.0, 14.0, 10.0, 5.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.152099609375, -12.67919921875, -12.206298828125, -11.7333984375, -11.260498046875, -10.78759765625, -10.314697265625, -9.841796875, -9.368896484375, -8.89599609375, -8.423095703125, -7.9501953125, -7.477294921875, -7.00439453125, -6.531494140625, -6.05859375, -5.585693359375, -5.11279296875, -4.639892578125, -4.1669921875, -3.694091796875, -3.22119140625, -2.748291015625, -2.275390625, -1.802490234375, -1.32958984375, -0.856689453125, -0.3837890625, 0.089111328125, 0.56201171875, 1.034912109375, 1.5078125, 1.980712890625, 2.45361328125, 2.926513671875, 3.3994140625, 3.872314453125, 4.34521484375, 4.818115234375, 5.291015625, 5.763916015625, 6.23681640625, 6.709716796875, 7.1826171875, 7.655517578125, 8.12841796875, 8.601318359375, 9.07421875, 9.547119140625, 10.02001953125, 10.492919921875, 10.9658203125, 11.438720703125, 11.91162109375, 12.384521484375, 12.857421875, 13.330322265625, 13.80322265625, 14.276123046875, 14.7490234375, 15.221923828125, 15.69482421875, 16.167724609375, 16.640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 13.0, 13.0, 19.0, 20.0, 26.0, 28.0, 35.0, 36.0, 48.0, 86.0, 94.0, 133.0, 139.0, 215.0, 377.0, 742.0, 2933.0, 41602.0, 735100.0, 253538.0, 10386.0, 1408.0, 485.0, 293.0, 181.0, 119.0, 79.0, 78.0, 75.0, 43.0, 43.0, 29.0, 25.0, 24.0, 13.0, 19.0, 17.0, 10.0, 6.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.296875, -8.0181884765625, -7.739501953125, -7.4608154296875, -7.18212890625, -6.9034423828125, -6.624755859375, -6.3460693359375, -6.0673828125, -5.7886962890625, -5.510009765625, -5.2313232421875, -4.95263671875, -4.6739501953125, -4.395263671875, -4.1165771484375, -3.837890625, -3.5592041015625, -3.280517578125, -3.0018310546875, -2.72314453125, -2.4444580078125, -2.165771484375, -1.8870849609375, -1.6083984375, -1.3297119140625, -1.051025390625, -0.7723388671875, -0.49365234375, -0.2149658203125, 0.063720703125, 0.3424072265625, 0.62109375, 0.8997802734375, 1.178466796875, 1.4571533203125, 1.73583984375, 2.0145263671875, 2.293212890625, 2.5718994140625, 2.8505859375, 3.1292724609375, 3.407958984375, 3.6866455078125, 3.96533203125, 4.2440185546875, 4.522705078125, 4.8013916015625, 5.080078125, 5.3587646484375, 5.637451171875, 5.9161376953125, 6.19482421875, 6.4735107421875, 6.752197265625, 7.0308837890625, 7.3095703125, 7.5882568359375, 7.866943359375, 8.1456298828125, 8.42431640625, 8.7030029296875, 8.981689453125, 9.2603759765625, 9.5390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 4.0, 8.0, 9.0, 12.0, 9.0, 15.0, 24.0, 36.0, 25.0, 23.0, 41.0, 46.0, 40.0, 50.0, 50.0, 60.0, 55.0, 46.0, 58.0, 48.0, 49.0, 43.0, 45.0, 37.0, 30.0, 25.0, 22.0, 20.0, 12.0, 12.0, 6.0, 10.0, 3.0, 8.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5703125, -14.0638427734375, -13.557373046875, -13.0509033203125, -12.54443359375, -12.0379638671875, -11.531494140625, -11.0250244140625, -10.5185546875, -10.0120849609375, -9.505615234375, -8.9991455078125, -8.49267578125, -7.9862060546875, -7.479736328125, -6.9732666015625, -6.466796875, -5.9603271484375, -5.453857421875, -4.9473876953125, -4.44091796875, -3.9344482421875, -3.427978515625, -2.9215087890625, -2.4150390625, -1.9085693359375, -1.402099609375, -0.8956298828125, -0.38916015625, 0.1173095703125, 0.623779296875, 1.1302490234375, 1.63671875, 2.1431884765625, 2.649658203125, 3.1561279296875, 3.66259765625, 4.1690673828125, 4.675537109375, 5.1820068359375, 5.6884765625, 6.1949462890625, 6.701416015625, 7.2078857421875, 7.71435546875, 8.2208251953125, 8.727294921875, 9.2337646484375, 9.740234375, 10.2467041015625, 10.753173828125, 11.2596435546875, 11.76611328125, 12.2725830078125, 12.779052734375, 13.2855224609375, 13.7919921875, 14.2984619140625, 14.804931640625, 15.3114013671875, 15.81787109375, 16.3243408203125, 16.830810546875, 17.3372802734375, 17.84375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 5.0, 18.0, 26.0, 42.0, 116.0, 360.0, 2112.0, 204656.0, 836049.0, 4450.0, 420.0, 152.0, 68.0, 23.0, 18.0, 4.0, 7.0, 10.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.41107177734375, -4.2596435546875, -4.10821533203125, -3.956787109375, -3.80535888671875, -3.6539306640625, -3.50250244140625, -3.35107421875, -3.19964599609375, -3.0482177734375, -2.89678955078125, -2.745361328125, -2.59393310546875, -2.4425048828125, -2.29107666015625, -2.1396484375, -1.98822021484375, -1.8367919921875, -1.68536376953125, -1.533935546875, -1.38250732421875, -1.2310791015625, -1.07965087890625, -0.92822265625, -0.77679443359375, -0.6253662109375, -0.47393798828125, -0.322509765625, -0.17108154296875, -0.0196533203125, 0.13177490234375, 0.283203125, 0.43463134765625, 0.5860595703125, 0.73748779296875, 0.888916015625, 1.04034423828125, 1.1917724609375, 1.34320068359375, 1.49462890625, 1.64605712890625, 1.7974853515625, 1.94891357421875, 2.100341796875, 2.25177001953125, 2.4031982421875, 2.55462646484375, 2.7060546875, 2.85748291015625, 3.0089111328125, 3.16033935546875, 3.311767578125, 3.46319580078125, 3.6146240234375, 3.76605224609375, 3.91748046875, 4.06890869140625, 4.2203369140625, 4.37176513671875, 4.523193359375, 4.67462158203125, 4.8260498046875, 4.97747802734375, 5.12890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 8.0, 12.0, 27.0, 46.0, 76.0, 117.0, 156.0, 161.0, 168.0, 107.0, 58.0, 38.0, 12.0, 7.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001703500747680664, -0.00015920214354991913, -0.00014805421233177185, -0.00013690628111362457, -0.0001257583498954773, -0.00011461041867733002, -0.00010346248745918274, -9.231455624103546e-05, -8.116662502288818e-05, -7.00186938047409e-05, -5.887076258659363e-05, -4.772283136844635e-05, -3.657490015029907e-05, -2.5426968932151794e-05, -1.4279037714004517e-05, -3.1311064958572388e-06, 8.016824722290039e-06, 1.9164755940437317e-05, 3.0312687158584595e-05, 4.146061837673187e-05, 5.260854959487915e-05, 6.375648081302643e-05, 7.49044120311737e-05, 8.605234324932098e-05, 9.720027446746826e-05, 0.00010834820568561554, 0.00011949613690376282, 0.0001306440681219101, 0.00014179199934005737, 0.00015293993055820465, 0.00016408786177635193, 0.0001752357929944992, 0.00018638372421264648, 0.00019753165543079376, 0.00020867958664894104, 0.00021982751786708832, 0.0002309754490852356, 0.00024212338030338287, 0.00025327131152153015, 0.00026441924273967743, 0.0002755671739578247, 0.000286715105175972, 0.00029786303639411926, 0.00030901096761226654, 0.0003201588988304138, 0.0003313068300485611, 0.0003424547612667084, 0.00035360269248485565, 0.00036475062370300293, 0.0003758985549211502, 0.0003870464861392975, 0.00039819441735744476, 0.00040934234857559204, 0.0004204902797937393, 0.0004316382110118866, 0.0004427861422300339, 0.00045393407344818115, 0.00046508200466632843, 0.0004762299358844757, 0.000487377867102623, 0.0004985257983207703, 0.0005096737295389175, 0.0005208216607570648, 0.0005319695919752121, 0.0005431175231933594]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 8.0, 9.0, 6.0, 20.0, 21.0, 26.0, 38.0, 48.0, 88.0, 125.0, 241.0, 531.0, 1405.0, 5451.0, 39788.0, 601109.0, 371386.0, 22372.0, 3826.0, 1093.0, 427.0, 203.0, 99.0, 72.0, 59.0, 27.0, 20.0, 14.0, 14.0, 3.0, 7.0, 4.0, 1.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.171875, -2.1129913330078125, -2.054107666015625, -1.9952239990234375, -1.93634033203125, -1.8774566650390625, -1.818572998046875, -1.7596893310546875, -1.7008056640625, -1.6419219970703125, -1.583038330078125, -1.5241546630859375, -1.46527099609375, -1.4063873291015625, -1.347503662109375, -1.2886199951171875, -1.229736328125, -1.1708526611328125, -1.111968994140625, -1.0530853271484375, -0.99420166015625, -0.9353179931640625, -0.876434326171875, -0.8175506591796875, -0.7586669921875, -0.6997833251953125, -0.640899658203125, -0.5820159912109375, -0.52313232421875, -0.4642486572265625, -0.405364990234375, -0.3464813232421875, -0.28759765625, -0.2287139892578125, -0.169830322265625, -0.1109466552734375, -0.05206298828125, 0.0068206787109375, 0.065704345703125, 0.1245880126953125, 0.1834716796875, 0.2423553466796875, 0.301239013671875, 0.3601226806640625, 0.41900634765625, 0.4778900146484375, 0.536773681640625, 0.5956573486328125, 0.654541015625, 0.7134246826171875, 0.772308349609375, 0.8311920166015625, 0.89007568359375, 0.9489593505859375, 1.007843017578125, 1.0667266845703125, 1.1256103515625, 1.1844940185546875, 1.243377685546875, 1.3022613525390625, 1.36114501953125, 1.4200286865234375, 1.478912353515625, 1.5377960205078125, 1.5966796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 4.0, 6.0, 10.0, 13.0, 20.0, 23.0, 32.0, 46.0, 50.0, 72.0, 113.0, 101.0, 120.0, 106.0, 69.0, 54.0, 53.0, 37.0, 22.0, 13.0, 9.0, 7.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66064453125, -0.6432762145996094, -0.6259078979492188, -0.6085395812988281, -0.5911712646484375, -0.5738029479980469, -0.5564346313476562, -0.5390663146972656, -0.521697998046875, -0.5043296813964844, -0.48696136474609375, -0.4695930480957031, -0.4522247314453125, -0.4348564147949219, -0.41748809814453125, -0.4001197814941406, -0.38275146484375, -0.3653831481933594, -0.34801483154296875, -0.3306465148925781, -0.3132781982421875, -0.2959098815917969, -0.27854156494140625, -0.2611732482910156, -0.243804931640625, -0.22643661499023438, -0.20906829833984375, -0.19169998168945312, -0.1743316650390625, -0.15696334838867188, -0.13959503173828125, -0.12222671508789062, -0.1048583984375, -0.08749008178710938, -0.07012176513671875, -0.052753448486328125, -0.0353851318359375, -0.018016815185546875, -0.00064849853515625, 0.016719818115234375, 0.034088134765625, 0.051456451416015625, 0.06882476806640625, 0.08619308471679688, 0.1035614013671875, 0.12092971801757812, 0.13829803466796875, 0.15566635131835938, 0.17303466796875, 0.19040298461914062, 0.20777130126953125, 0.22513961791992188, 0.2425079345703125, 0.2598762512207031, 0.27724456787109375, 0.2946128845214844, 0.311981201171875, 0.3293495178222656, 0.34671783447265625, 0.3640861511230469, 0.3814544677734375, 0.3988227844238281, 0.41619110107421875, 0.4335594177246094, 0.450927734375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [34.0, 390.0, 538.0, 55.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.862199783325195, -2.5998141765594482, -0.33742856979370117, 1.924957275390625, 4.187342643737793, 6.449728012084961, 8.712114334106445, 10.974499702453613, 13.236885070800781, 15.49927043914795, 17.761655807495117, 20.0240421295166, 22.286426544189453, 24.548812866210938, 26.811199188232422, 29.073585510253906, 31.335969924926758, 33.59835433959961, 35.860740661621094, 38.12312698364258, 40.38551330566406, 42.64789581298828, 44.91028594970703, 47.17266845703125, 49.435054779052734, 51.69744110107422, 53.9598274230957, 56.22221374511719, 58.484596252441406, 60.74698257446289, 63.009368896484375, 65.2717514038086, 67.53414154052734, 69.79652404785156, 72.05891418457031, 74.32129669189453, 76.58368682861328, 78.8460693359375, 81.10845947265625, 83.37084197998047, 85.63322448730469, 87.8956069946289, 90.15799713134766, 92.42037963867188, 94.68276977539062, 96.94515228271484, 99.20753479003906, 101.46992492675781, 103.73231506347656, 105.99469757080078, 108.25708770751953, 110.51947021484375, 112.7818603515625, 115.04424285888672, 117.30662536621094, 119.56901550292969, 121.8313980102539, 124.09378051757812, 126.35617065429688, 128.61856079101562, 130.8809356689453, 133.14332580566406, 135.4057159423828, 137.6680908203125, 139.93048095703125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 1.0, 3.0, 5.0, 0.0, 4.0, 8.0, 9.0, 14.0, 12.0, 17.0, 17.0, 10.0, 21.0, 24.0, 32.0, 30.0, 26.0, 29.0, 29.0, 37.0, 31.0, 37.0, 44.0, 37.0, 40.0, 41.0, 40.0, 37.0, 31.0, 26.0, 35.0, 29.0, 35.0, 33.0, 27.0, 19.0, 16.0, 10.0, 17.0, 17.0, 11.0, 9.0, 11.0, 6.0, 4.0, 7.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-19.045766830444336, -18.42285919189453, -17.79995346069336, -17.177045822143555, -16.55413818359375, -15.931232452392578, -15.308324813842773, -14.685418128967285, -14.062511444091797, -13.439604759216309, -12.81669807434082, -12.193790435791016, -11.570883750915527, -10.947977066040039, -10.325069427490234, -9.702162742614746, -9.079256057739258, -8.45634937286377, -7.833442211151123, -7.210535049438477, -6.587628364562988, -5.9647216796875, -5.3418145179748535, -4.718907356262207, -4.096000671386719, -3.4730937480926514, -2.850186824798584, -2.2272799015045166, -1.6043729782104492, -0.9814660549163818, -0.35855913162231445, 0.26434803009033203, 0.8872566223144531, 1.5101635456085205, 2.133070468902588, 2.7559773921966553, 3.3788843154907227, 4.001791000366211, 4.624698162078857, 5.247605323791504, 5.870512008666992, 6.4934186935424805, 7.116325855255127, 7.739233016967773, 8.362139701843262, 8.98504638671875, 9.607954025268555, 10.230860710144043, 10.853767395019531, 11.47667407989502, 12.099580764770508, 12.722488403320312, 13.3453950881958, 13.968301773071289, 14.591209411621094, 15.214116096496582, 15.83702278137207, 16.459930419921875, 17.082836151123047, 17.70574378967285, 18.328651428222656, 18.951557159423828, 19.574464797973633, 20.197372436523438, 20.82027816772461]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 5.0, 10.0, 13.0, 18.0, 21.0, 31.0, 51.0, 62.0, 92.0, 157.0, 291.0, 639.0, 1507.0, 3489.0, 9277.0, 29386.0, 110256.0, 480342.0, 1417413.0, 1481870.0, 498426.0, 115312.0, 30100.0, 9341.0, 3347.0, 1304.0, 649.0, 306.0, 200.0, 117.0, 75.0, 40.0, 32.0, 24.0, 25.0, 8.0, 12.0, 5.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.66796875, -5.506103515625, -5.34423828125, -5.182373046875, -5.0205078125, -4.858642578125, -4.69677734375, -4.534912109375, -4.373046875, -4.211181640625, -4.04931640625, -3.887451171875, -3.7255859375, -3.563720703125, -3.40185546875, -3.239990234375, -3.078125, -2.916259765625, -2.75439453125, -2.592529296875, -2.4306640625, -2.268798828125, -2.10693359375, -1.945068359375, -1.783203125, -1.621337890625, -1.45947265625, -1.297607421875, -1.1357421875, -0.973876953125, -0.81201171875, -0.650146484375, -0.48828125, -0.326416015625, -0.16455078125, -0.002685546875, 0.1591796875, 0.321044921875, 0.48291015625, 0.644775390625, 0.806640625, 0.968505859375, 1.13037109375, 1.292236328125, 1.4541015625, 1.615966796875, 1.77783203125, 1.939697265625, 2.1015625, 2.263427734375, 2.42529296875, 2.587158203125, 2.7490234375, 2.910888671875, 3.07275390625, 3.234619140625, 3.396484375, 3.558349609375, 3.72021484375, 3.882080078125, 4.0439453125, 4.205810546875, 4.36767578125, 4.529541015625, 4.69140625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 7.0, 18.0, 23.0, 23.0, 39.0, 39.0, 51.0, 53.0, 66.0, 63.0, 81.0, 72.0, 70.0, 51.0, 45.0, 54.0, 39.0, 52.0, 31.0, 37.0, 25.0, 14.0, 16.0, 9.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.271240234375, -4.07373046875, -3.876220703125, -3.6787109375, -3.481201171875, -3.28369140625, -3.086181640625, -2.888671875, -2.691162109375, -2.49365234375, -2.296142578125, -2.0986328125, -1.901123046875, -1.70361328125, -1.506103515625, -1.30859375, -1.111083984375, -0.91357421875, -0.716064453125, -0.5185546875, -0.321044921875, -0.12353515625, 0.073974609375, 0.271484375, 0.468994140625, 0.66650390625, 0.864013671875, 1.0615234375, 1.259033203125, 1.45654296875, 1.654052734375, 1.8515625, 2.049072265625, 2.24658203125, 2.444091796875, 2.6416015625, 2.839111328125, 3.03662109375, 3.234130859375, 3.431640625, 3.629150390625, 3.82666015625, 4.024169921875, 4.2216796875, 4.419189453125, 4.61669921875, 4.814208984375, 5.01171875, 5.209228515625, 5.40673828125, 5.604248046875, 5.8017578125, 5.999267578125, 6.19677734375, 6.394287109375, 6.591796875, 6.789306640625, 6.98681640625, 7.184326171875, 7.3818359375, 7.579345703125, 7.77685546875, 7.974365234375, 8.171875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 14.0, 11.0, 24.0, 37.0, 444.0, 4193042.0, 565.0, 52.0, 28.0, 14.0, 9.0, 13.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.75, -174.1103515625, -169.470703125, -164.8310546875, -160.19140625, -155.5517578125, -150.912109375, -146.2724609375, -141.6328125, -136.9931640625, -132.353515625, -127.7138671875, -123.07421875, -118.4345703125, -113.794921875, -109.1552734375, -104.515625, -99.8759765625, -95.236328125, -90.5966796875, -85.95703125, -81.3173828125, -76.677734375, -72.0380859375, -67.3984375, -62.7587890625, -58.119140625, -53.4794921875, -48.83984375, -44.2001953125, -39.560546875, -34.9208984375, -30.28125, -25.6416015625, -21.001953125, -16.3623046875, -11.72265625, -7.0830078125, -2.443359375, 2.1962890625, 6.8359375, 11.4755859375, 16.115234375, 20.7548828125, 25.39453125, 30.0341796875, 34.673828125, 39.3134765625, 43.953125, 48.5927734375, 53.232421875, 57.8720703125, 62.51171875, 67.1513671875, 71.791015625, 76.4306640625, 81.0703125, 85.7099609375, 90.349609375, 94.9892578125, 99.62890625, 104.2685546875, 108.908203125, 113.5478515625, 118.1875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 21.0, 31.0, 83.0, 116.0, 206.0, 409.0, 731.0, 921.0, 699.0, 400.0, 206.0, 119.0, 49.0, 27.0, 27.0, 10.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.404510498046875, -5.28558349609375, -5.166656494140625, -5.0477294921875, -4.928802490234375, -4.80987548828125, -4.690948486328125, -4.572021484375, -4.453094482421875, -4.33416748046875, -4.215240478515625, -4.0963134765625, -3.977386474609375, -3.85845947265625, -3.739532470703125, -3.62060546875, -3.501678466796875, -3.38275146484375, -3.263824462890625, -3.1448974609375, -3.025970458984375, -2.90704345703125, -2.788116455078125, -2.669189453125, -2.550262451171875, -2.43133544921875, -2.312408447265625, -2.1934814453125, -2.074554443359375, -1.95562744140625, -1.836700439453125, -1.7177734375, -1.598846435546875, -1.47991943359375, -1.360992431640625, -1.2420654296875, -1.123138427734375, -1.00421142578125, -0.885284423828125, -0.766357421875, -0.647430419921875, -0.52850341796875, -0.409576416015625, -0.2906494140625, -0.171722412109375, -0.05279541015625, 0.066131591796875, 0.18505859375, 0.303985595703125, 0.42291259765625, 0.541839599609375, 0.6607666015625, 0.779693603515625, 0.89862060546875, 1.017547607421875, 1.136474609375, 1.255401611328125, 1.37432861328125, 1.493255615234375, 1.6121826171875, 1.731109619140625, 1.85003662109375, 1.968963623046875, 2.087890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 15.0, 22.0, 50.0, 42.0, 93.0, 106.0, 155.0, 151.0, 112.0, 86.0, 68.0, 48.0, 27.0, 12.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.405216693878174, -4.099130630493164, -3.793044328689575, -3.4869580268859863, -3.1808719635009766, -2.8747856616973877, -2.568699359893799, -2.262613296508789, -1.9565269947052002, -1.6504408121109009, -1.3443546295166016, -1.0382683277130127, -0.7321821451187134, -0.42609596252441406, -0.1200096607208252, 0.18607640266418457, 0.49216270446777344, 0.7982488870620728, 1.104335069656372, 1.410421371459961, 1.7165075540542603, 2.0225937366485596, 2.3286800384521484, 2.634766101837158, 2.940852403640747, 3.246938705444336, 3.5530247688293457, 3.8591110706329346, 4.165197372436523, 4.471283435821533, 4.777369499206543, 5.083456039428711, 5.389542579650879, 5.695628643035889, 6.001715183258057, 6.307801246643066, 6.613887310028076, 6.919973373413086, 7.226059913635254, 7.532145977020264, 7.838232040405273, 8.144318580627441, 8.450404167175293, 8.756490707397461, 9.062577247619629, 9.36866283416748, 9.674749374389648, 9.9808349609375, 10.286922454833984, 10.593008995056152, 10.899094581604004, 11.205181121826172, 11.51126766204834, 11.817353248596191, 12.12343978881836, 12.429525375366211, 12.735611915588379, 13.041698455810547, 13.347784042358398, 13.653870582580566, 13.959957122802734, 14.266042709350586, 14.572129249572754, 14.878215789794922, 15.184301376342773]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 6.0, 11.0, 9.0, 14.0, 19.0, 13.0, 22.0, 13.0, 27.0, 30.0, 31.0, 40.0, 25.0, 39.0, 39.0, 35.0, 33.0, 42.0, 38.0, 42.0, 34.0, 53.0, 34.0, 50.0, 21.0, 29.0, 24.0, 30.0, 27.0, 15.0, 30.0, 15.0, 26.0, 15.0, 10.0, 9.0, 4.0, 14.0, 4.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9068353176116943, -2.788784980773926, -2.6707346439361572, -2.5526843070983887, -2.434633731842041, -2.3165836334228516, -2.198533058166504, -2.0804827213287354, -1.9624323844909668, -1.8443820476531982, -1.7263317108154297, -1.6082812547683716, -1.490230917930603, -1.3721805810928345, -1.2541301250457764, -1.1360797882080078, -1.0180294513702393, -0.8999791145324707, -0.7819287180900574, -0.663878321647644, -0.5458279848098755, -0.42777764797210693, -0.3097272515296936, -0.19167685508728027, -0.07362651824951172, 0.044423848390579224, 0.16247421503067017, 0.2805245816707611, 0.39857494831085205, 0.5166252851486206, 0.6346756815910339, 0.7527260780334473, 0.8707766532897949, 0.9888269901275635, 1.106877326965332, 1.2249277830123901, 1.3429781198501587, 1.4610284566879272, 1.5790789127349854, 1.697129249572754, 1.8151795864105225, 1.933229923248291, 2.0512802600860596, 2.169330596923828, 2.287381172180176, 2.4054312705993652, 2.523481845855713, 2.6415321826934814, 2.75958251953125, 2.8776328563690186, 2.995683193206787, 3.1137335300445557, 3.231783866882324, 3.349834442138672, 3.4678847789764404, 3.585935115814209, 3.7039854526519775, 3.822035789489746, 3.9400861263275146, 4.058136463165283, 4.176187038421631, 4.29423713684082, 4.412287712097168, 4.530338287353516, 4.648388385772705]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 11.0, 19.0, 18.0, 29.0, 28.0, 57.0, 64.0, 122.0, 163.0, 214.0, 289.0, 421.0, 551.0, 739.0, 1030.0, 1427.0, 2277.0, 4210.0, 12796.0, 61923.0, 336347.0, 478877.0, 112197.0, 20584.0, 5727.0, 2617.0, 1593.0, 1159.0, 801.0, 647.0, 454.0, 330.0, 214.0, 184.0, 130.0, 85.0, 61.0, 47.0, 24.0, 32.0, 10.0, 13.0, 13.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.84912109375, -0.8218765258789062, -0.7946319580078125, -0.7673873901367188, -0.740142822265625, -0.7128982543945312, -0.6856536865234375, -0.6584091186523438, -0.63116455078125, -0.6039199829101562, -0.5766754150390625, -0.5494308471679688, -0.522186279296875, -0.49494171142578125, -0.4676971435546875, -0.44045257568359375, -0.4132080078125, -0.38596343994140625, -0.3587188720703125, -0.33147430419921875, -0.304229736328125, -0.27698516845703125, -0.2497406005859375, -0.22249603271484375, -0.19525146484375, -0.16800689697265625, -0.1407623291015625, -0.11351776123046875, -0.086273193359375, -0.05902862548828125, -0.0317840576171875, -0.00453948974609375, 0.022705078125, 0.04994964599609375, 0.0771942138671875, 0.10443878173828125, 0.131683349609375, 0.15892791748046875, 0.1861724853515625, 0.21341705322265625, 0.24066162109375, 0.26790618896484375, 0.2951507568359375, 0.32239532470703125, 0.349639892578125, 0.37688446044921875, 0.4041290283203125, 0.43137359619140625, 0.4586181640625, 0.48586273193359375, 0.5131072998046875, 0.5403518676757812, 0.567596435546875, 0.5948410034179688, 0.6220855712890625, 0.6493301391601562, 0.67657470703125, 0.7038192749023438, 0.7310638427734375, 0.7583084106445312, 0.785552978515625, 0.8127975463867188, 0.8400421142578125, 0.8672866821289062, 0.89453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 4.0, 4.0, 7.0, 13.0, 7.0, 13.0, 17.0, 19.0, 20.0, 27.0, 21.0, 28.0, 37.0, 36.0, 34.0, 34.0, 40.0, 39.0, 35.0, 44.0, 46.0, 38.0, 44.0, 45.0, 33.0, 42.0, 28.0, 26.0, 38.0, 30.0, 18.0, 14.0, 19.0, 18.0, 16.0, 11.0, 13.0, 15.0, 5.0, 5.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.34765625, -2.264862060546875, -2.18206787109375, -2.099273681640625, -2.0164794921875, -1.933685302734375, -1.85089111328125, -1.768096923828125, -1.685302734375, -1.602508544921875, -1.51971435546875, -1.436920166015625, -1.3541259765625, -1.271331787109375, -1.18853759765625, -1.105743408203125, -1.02294921875, -0.940155029296875, -0.85736083984375, -0.774566650390625, -0.6917724609375, -0.608978271484375, -0.52618408203125, -0.443389892578125, -0.360595703125, -0.277801513671875, -0.19500732421875, -0.112213134765625, -0.0294189453125, 0.053375244140625, 0.13616943359375, 0.218963623046875, 0.3017578125, 0.384552001953125, 0.46734619140625, 0.550140380859375, 0.6329345703125, 0.715728759765625, 0.79852294921875, 0.881317138671875, 0.964111328125, 1.046905517578125, 1.12969970703125, 1.212493896484375, 1.2952880859375, 1.378082275390625, 1.46087646484375, 1.543670654296875, 1.62646484375, 1.709259033203125, 1.79205322265625, 1.874847412109375, 1.9576416015625, 2.040435791015625, 2.12322998046875, 2.206024169921875, 2.288818359375, 2.371612548828125, 2.45440673828125, 2.537200927734375, 2.6199951171875, 2.702789306640625, 2.78558349609375, 2.868377685546875, 2.951171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 3.0, 8.0, 13.0, 22.0, 31.0, 35.0, 85.0, 110.0, 182.0, 361.0, 687.0, 1394.0, 2772.0, 6147.0, 12890.0, 26797.0, 54376.0, 106192.0, 181186.0, 231310.0, 191609.0, 116104.0, 60086.0, 29387.0, 13715.0, 6709.0, 3206.0, 1446.0, 778.0, 393.0, 219.0, 115.0, 76.0, 31.0, 26.0, 16.0, 5.0, 12.0, 3.0, 10.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2980079650878906, -0.28913116455078125, -0.2802543640136719, -0.2713775634765625, -0.2625007629394531, -0.25362396240234375, -0.24474716186523438, -0.235870361328125, -0.22699356079101562, -0.21811676025390625, -0.20923995971679688, -0.2003631591796875, -0.19148635864257812, -0.18260955810546875, -0.17373275756835938, -0.16485595703125, -0.15597915649414062, -0.14710235595703125, -0.13822555541992188, -0.1293487548828125, -0.12047195434570312, -0.11159515380859375, -0.10271835327148438, -0.093841552734375, -0.08496475219726562, -0.07608795166015625, -0.06721115112304688, -0.0583343505859375, -0.049457550048828125, -0.04058074951171875, -0.031703948974609375, -0.0228271484375, -0.013950347900390625, -0.00507354736328125, 0.003803253173828125, 0.0126800537109375, 0.021556854248046875, 0.03043365478515625, 0.039310455322265625, 0.048187255859375, 0.057064056396484375, 0.06594085693359375, 0.07481765747070312, 0.0836944580078125, 0.09257125854492188, 0.10144805908203125, 0.11032485961914062, 0.11920166015625, 0.12807846069335938, 0.13695526123046875, 0.14583206176757812, 0.1547088623046875, 0.16358566284179688, 0.17246246337890625, 0.18133926391601562, 0.190216064453125, 0.19909286499023438, 0.20796966552734375, 0.21684646606445312, 0.2257232666015625, 0.23460006713867188, 0.24347686767578125, 0.2523536682128906, 0.26123046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 5.0, 7.0, 9.0, 11.0, 12.0, 6.0, 11.0, 25.0, 24.0, 24.0, 24.0, 31.0, 34.0, 31.0, 37.0, 33.0, 44.0, 43.0, 55.0, 51.0, 41.0, 31.0, 39.0, 40.0, 38.0, 33.0, 37.0, 45.0, 20.0, 25.0, 32.0, 18.0, 13.0, 9.0, 13.0, 9.0, 6.0, 5.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.4530029296875, -4.300537109375, -4.1480712890625, -3.99560546875, -3.8431396484375, -3.690673828125, -3.5382080078125, -3.3857421875, -3.2332763671875, -3.080810546875, -2.9283447265625, -2.77587890625, -2.6234130859375, -2.470947265625, -2.3184814453125, -2.166015625, -2.0135498046875, -1.861083984375, -1.7086181640625, -1.55615234375, -1.4036865234375, -1.251220703125, -1.0987548828125, -0.9462890625, -0.7938232421875, -0.641357421875, -0.4888916015625, -0.33642578125, -0.1839599609375, -0.031494140625, 0.1209716796875, 0.2734375, 0.4259033203125, 0.578369140625, 0.7308349609375, 0.88330078125, 1.0357666015625, 1.188232421875, 1.3406982421875, 1.4931640625, 1.6456298828125, 1.798095703125, 1.9505615234375, 2.10302734375, 2.2554931640625, 2.407958984375, 2.5604248046875, 2.712890625, 2.8653564453125, 3.017822265625, 3.1702880859375, 3.32275390625, 3.4752197265625, 3.627685546875, 3.7801513671875, 3.9326171875, 4.0850830078125, 4.237548828125, 4.3900146484375, 4.54248046875, 4.6949462890625, 4.847412109375, 4.9998779296875, 5.15234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 3.0, 5.0, 5.0, 10.0, 18.0, 22.0, 34.0, 47.0, 79.0, 107.0, 185.0, 252.0, 419.0, 568.0, 1050.0, 1661.0, 3041.0, 6277.0, 13507.0, 32187.0, 82166.0, 195805.0, 315849.0, 225803.0, 98689.0, 38870.0, 16138.0, 7272.0, 3536.0, 1906.0, 1084.0, 688.0, 420.0, 286.0, 176.0, 134.0, 73.0, 70.0, 38.0, 30.0, 12.0, 5.0, 8.0, 8.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.038177490234375, -0.03710508346557617, -0.036032676696777344, -0.034960269927978516, -0.03388786315917969, -0.03281545639038086, -0.03174304962158203, -0.030670642852783203, -0.029598236083984375, -0.028525829315185547, -0.02745342254638672, -0.02638101577758789, -0.025308609008789062, -0.024236202239990234, -0.023163795471191406, -0.022091388702392578, -0.02101898193359375, -0.019946575164794922, -0.018874168395996094, -0.017801761627197266, -0.016729354858398438, -0.01565694808959961, -0.014584541320800781, -0.013512134552001953, -0.012439727783203125, -0.011367321014404297, -0.010294914245605469, -0.00922250747680664, -0.008150100708007812, -0.007077693939208984, -0.006005287170410156, -0.004932880401611328, -0.0038604736328125, -0.002788066864013672, -0.0017156600952148438, -0.0006432533264160156, 0.0004291534423828125, 0.0015015602111816406, 0.0025739669799804688, 0.003646373748779297, 0.004718780517578125, 0.005791187286376953, 0.006863594055175781, 0.00793600082397461, 0.009008407592773438, 0.010080814361572266, 0.011153221130371094, 0.012225627899169922, 0.01329803466796875, 0.014370441436767578, 0.015442848205566406, 0.016515254974365234, 0.017587661743164062, 0.01866006851196289, 0.01973247528076172, 0.020804882049560547, 0.021877288818359375, 0.022949695587158203, 0.02402210235595703, 0.02509450912475586, 0.026166915893554688, 0.027239322662353516, 0.028311729431152344, 0.029384136199951172, 0.03045654296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 14.0, 15.0, 20.0, 30.0, 44.0, 52.0, 58.0, 87.0, 84.0, 106.0, 103.0, 73.0, 85.0, 48.0, 36.0, 46.0, 26.0, 17.0, 19.0, 13.0, 5.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.091594696044922e-05, -5.925167351961136e-05, -5.75874000787735e-05, -5.592312663793564e-05, -5.425885319709778e-05, -5.259457975625992e-05, -5.093030631542206e-05, -4.92660328745842e-05, -4.760175943374634e-05, -4.593748599290848e-05, -4.427321255207062e-05, -4.260893911123276e-05, -4.09446656703949e-05, -3.928039222955704e-05, -3.761611878871918e-05, -3.595184534788132e-05, -3.428757190704346e-05, -3.26232984662056e-05, -3.095902502536774e-05, -2.9294751584529877e-05, -2.7630478143692017e-05, -2.5966204702854156e-05, -2.4301931262016296e-05, -2.2637657821178436e-05, -2.0973384380340576e-05, -1.9309110939502716e-05, -1.7644837498664856e-05, -1.5980564057826996e-05, -1.4316290616989136e-05, -1.2652017176151276e-05, -1.0987743735313416e-05, -9.323470294475555e-06, -7.659196853637695e-06, -5.994923412799835e-06, -4.330649971961975e-06, -2.666376531124115e-06, -1.0021030902862549e-06, 6.621703505516052e-07, 2.3264437913894653e-06, 3.9907172322273254e-06, 5.6549906730651855e-06, 7.319264113903046e-06, 8.983537554740906e-06, 1.0647810995578766e-05, 1.2312084436416626e-05, 1.3976357877254486e-05, 1.5640631318092346e-05, 1.7304904758930206e-05, 1.8969178199768066e-05, 2.0633451640605927e-05, 2.2297725081443787e-05, 2.3961998522281647e-05, 2.5626271963119507e-05, 2.7290545403957367e-05, 2.8954818844795227e-05, 3.061909228563309e-05, 3.228336572647095e-05, 3.394763916730881e-05, 3.561191260814667e-05, 3.727618604898453e-05, 3.894045948982239e-05, 4.060473293066025e-05, 4.226900637149811e-05, 4.393327981233597e-05, 4.559755325317383e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 7.0, 3.0, 3.0, 6.0, 9.0, 5.0, 15.0, 15.0, 12.0, 28.0, 24.0, 32.0, 48.0, 69.0, 106.0, 229.0, 754.0, 4758.0, 57136.0, 774193.0, 197481.0, 11200.0, 1578.0, 352.0, 153.0, 79.0, 54.0, 49.0, 27.0, 23.0, 27.0, 15.0, 7.0, 11.0, 5.0, 13.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1231689453125, -0.11951351165771484, -0.11585807800292969, -0.11220264434814453, -0.10854721069335938, -0.10489177703857422, -0.10123634338378906, -0.0975809097290039, -0.09392547607421875, -0.0902700424194336, -0.08661460876464844, -0.08295917510986328, -0.07930374145507812, -0.07564830780029297, -0.07199287414550781, -0.06833744049072266, -0.0646820068359375, -0.061026573181152344, -0.05737113952636719, -0.05371570587158203, -0.050060272216796875, -0.04640483856201172, -0.04274940490722656, -0.039093971252441406, -0.03543853759765625, -0.031783103942871094, -0.028127670288085938, -0.02447223663330078, -0.020816802978515625, -0.01716136932373047, -0.013505935668945312, -0.009850502014160156, -0.006195068359375, -0.0025396347045898438, 0.0011157989501953125, 0.004771232604980469, 0.008426666259765625, 0.012082099914550781, 0.015737533569335938, 0.019392967224121094, 0.02304840087890625, 0.026703834533691406, 0.030359268188476562, 0.03401470184326172, 0.037670135498046875, 0.04132556915283203, 0.04498100280761719, 0.048636436462402344, 0.0522918701171875, 0.055947303771972656, 0.05960273742675781, 0.06325817108154297, 0.06691360473632812, 0.07056903839111328, 0.07422447204589844, 0.0778799057006836, 0.08153533935546875, 0.0851907730102539, 0.08884620666503906, 0.09250164031982422, 0.09615707397460938, 0.09981250762939453, 0.10346794128417969, 0.10712337493896484, 0.11077880859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 5.0, 12.0, 10.0, 11.0, 15.0, 16.0, 32.0, 24.0, 33.0, 33.0, 31.0, 56.0, 58.0, 61.0, 52.0, 73.0, 73.0, 50.0, 47.0, 44.0, 32.0, 37.0, 32.0, 27.0, 24.0, 17.0, 14.0, 14.0, 11.0, 14.0, 3.0, 10.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.011566162109375, -0.011238932609558105, -0.010911703109741211, -0.010584473609924316, -0.010257244110107422, -0.009930014610290527, -0.009602785110473633, -0.009275555610656738, -0.008948326110839844, -0.00862109661102295, -0.008293867111206055, -0.00796663761138916, -0.007639408111572266, -0.007312178611755371, -0.0069849491119384766, -0.006657719612121582, -0.0063304901123046875, -0.006003260612487793, -0.0056760311126708984, -0.005348801612854004, -0.005021572113037109, -0.004694342613220215, -0.00436711311340332, -0.004039883613586426, -0.0037126541137695312, -0.0033854246139526367, -0.003058195114135742, -0.0027309656143188477, -0.002403736114501953, -0.0020765066146850586, -0.001749277114868164, -0.0014220476150512695, -0.001094818115234375, -0.0007675886154174805, -0.00044035911560058594, -0.0001131296157836914, 0.00021409988403320312, 0.0005413293838500977, 0.0008685588836669922, 0.0011957883834838867, 0.0015230178833007812, 0.0018502473831176758, 0.0021774768829345703, 0.002504706382751465, 0.0028319358825683594, 0.003159165382385254, 0.0034863948822021484, 0.003813624382019043, 0.0041408538818359375, 0.004468083381652832, 0.0047953128814697266, 0.005122542381286621, 0.005449771881103516, 0.00577700138092041, 0.006104230880737305, 0.006431460380554199, 0.006758689880371094, 0.007085919380187988, 0.007413148880004883, 0.007740378379821777, 0.008067607879638672, 0.008394837379455566, 0.008722066879272461, 0.009049296379089355, 0.00937652587890625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 32.0, 48.0, 74.0, 137.0, 197.0, 179.0, 131.0, 86.0, 61.0, 25.0, 16.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.822754383087158, -4.570793628692627, -4.3188323974609375, -4.066871643066406, -3.814910888671875, -3.5629498958587646, -3.3109889030456543, -3.059028148651123, -2.8070671558380127, -2.5551061630249023, -2.303145408630371, -2.0511844158172607, -1.79922354221344, -1.5472626686096191, -1.2953016757965088, -1.043340802192688, -0.7913799285888672, -0.5394190549850464, -0.2874581217765808, -0.035497188568115234, 0.21646368503570557, 0.46842455863952637, 0.7203855514526367, 0.9723464250564575, 1.2243072986602783, 1.4762681722640991, 1.72822904586792, 1.9801900386810303, 2.2321510314941406, 2.484111785888672, 2.7360727787017822, 2.9880337715148926, 3.2399940490722656, 3.491955041885376, 3.7439157962799072, 3.9958767890930176, 4.247837543487549, 4.499798774719238, 4.7517595291137695, 5.003720283508301, 5.255681037902832, 5.507641792297363, 5.759603023529053, 6.011563777923584, 6.263524532318115, 6.515485763549805, 6.767446517944336, 7.019407272338867, 7.271368503570557, 7.523329257965088, 7.775290489196777, 8.027251243591309, 8.27921199798584, 8.531172752380371, 8.783134460449219, 9.03509521484375, 9.287055969238281, 9.539016723632812, 9.790977478027344, 10.042938232421875, 10.294899940490723, 10.546860694885254, 10.798821449279785, 11.050782203674316, 11.302742958068848]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 9.0, 9.0, 11.0, 11.0, 7.0, 16.0, 26.0, 16.0, 17.0, 24.0, 26.0, 34.0, 41.0, 27.0, 36.0, 39.0, 41.0, 31.0, 35.0, 49.0, 43.0, 43.0, 44.0, 42.0, 41.0, 25.0, 27.0, 33.0, 26.0, 24.0, 25.0, 22.0, 16.0, 23.0, 12.0, 7.0, 6.0, 10.0, 7.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1633431911468506, -2.08503794670105, -2.006732940673828, -1.928427815437317, -1.8501226902008057, -1.7718174457550049, -1.6935123205184937, -1.6152071952819824, -1.5369020700454712, -1.45859694480896, -1.3802918195724487, -1.3019866943359375, -1.2236814498901367, -1.145376443862915, -1.0670711994171143, -0.988766074180603, -0.9104609489440918, -0.8321558237075806, -0.7538506984710693, -0.6755455136299133, -0.5972403883934021, -0.5189352631568909, -0.44063010811805725, -0.36232495307922363, -0.2840198278427124, -0.20571468770503998, -0.12740954756736755, -0.04910440742969513, 0.029200732707977295, 0.10750585794448853, 0.18581101298332214, 0.26411616802215576, 0.3424210548400879, 0.4207261800765991, 0.49903133511543274, 0.5773364901542664, 0.6556416153907776, 0.7339467406272888, 0.8122519254684448, 0.890557050704956, 0.9688621759414673, 1.0471673011779785, 1.1254724264144897, 1.203777551651001, 1.2820827960968018, 1.3603878021240234, 1.4386930465698242, 1.5169981718063354, 1.5953032970428467, 1.673608422279358, 1.7519135475158691, 1.8302186727523804, 1.9085237979888916, 1.9868290424346924, 2.065134048461914, 2.143439292907715, 2.2217445373535156, 2.3000497817993164, 2.378354787826538, 2.456660032272339, 2.5349650382995605, 2.6132702827453613, 2.691575288772583, 2.769880533218384, 2.8481855392456055]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 11.0, 14.0, 22.0, 29.0, 51.0, 54.0, 114.0, 140.0, 260.0, 401.0, 682.0, 1226.0, 2198.0, 3942.0, 7589.0, 15040.0, 32195.0, 68410.0, 140061.0, 229077.0, 240571.0, 155659.0, 78191.0, 36676.0, 17171.0, 8627.0, 4272.0, 2426.0, 1372.0, 782.0, 452.0, 296.0, 184.0, 113.0, 62.0, 49.0, 35.0, 26.0, 20.0, 14.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.7685546875, -1.71343994140625, -1.6583251953125, -1.60321044921875, -1.548095703125, -1.49298095703125, -1.4378662109375, -1.38275146484375, -1.32763671875, -1.27252197265625, -1.2174072265625, -1.16229248046875, -1.107177734375, -1.05206298828125, -0.9969482421875, -0.94183349609375, -0.88671875, -0.83160400390625, -0.7764892578125, -0.72137451171875, -0.666259765625, -0.61114501953125, -0.5560302734375, -0.50091552734375, -0.44580078125, -0.39068603515625, -0.3355712890625, -0.28045654296875, -0.225341796875, -0.17022705078125, -0.1151123046875, -0.05999755859375, -0.0048828125, 0.05023193359375, 0.1053466796875, 0.16046142578125, 0.215576171875, 0.27069091796875, 0.3258056640625, 0.38092041015625, 0.43603515625, 0.49114990234375, 0.5462646484375, 0.60137939453125, 0.656494140625, 0.71160888671875, 0.7667236328125, 0.82183837890625, 0.876953125, 0.93206787109375, 0.9871826171875, 1.04229736328125, 1.097412109375, 1.15252685546875, 1.2076416015625, 1.26275634765625, 1.31787109375, 1.37298583984375, 1.4281005859375, 1.48321533203125, 1.538330078125, 1.59344482421875, 1.6485595703125, 1.70367431640625, 1.7587890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 15.0, 7.0, 14.0, 19.0, 20.0, 25.0, 30.0, 43.0, 36.0, 36.0, 45.0, 51.0, 42.0, 59.0, 67.0, 67.0, 49.0, 48.0, 42.0, 37.0, 39.0, 34.0, 24.0, 18.0, 31.0, 18.0, 8.0, 10.0, 10.0, 10.0, 12.0, 6.0, 4.0, 3.0, 0.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.398193359375, -8.12451171875, -7.850830078125, -7.5771484375, -7.303466796875, -7.02978515625, -6.756103515625, -6.482421875, -6.208740234375, -5.93505859375, -5.661376953125, -5.3876953125, -5.114013671875, -4.84033203125, -4.566650390625, -4.29296875, -4.019287109375, -3.74560546875, -3.471923828125, -3.1982421875, -2.924560546875, -2.65087890625, -2.377197265625, -2.103515625, -1.829833984375, -1.55615234375, -1.282470703125, -1.0087890625, -0.735107421875, -0.46142578125, -0.187744140625, 0.0859375, 0.359619140625, 0.63330078125, 0.906982421875, 1.1806640625, 1.454345703125, 1.72802734375, 2.001708984375, 2.275390625, 2.549072265625, 2.82275390625, 3.096435546875, 3.3701171875, 3.643798828125, 3.91748046875, 4.191162109375, 4.46484375, 4.738525390625, 5.01220703125, 5.285888671875, 5.5595703125, 5.833251953125, 6.10693359375, 6.380615234375, 6.654296875, 6.927978515625, 7.20166015625, 7.475341796875, 7.7490234375, 8.022705078125, 8.29638671875, 8.570068359375, 8.84375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 5.0, 5.0, 6.0, 12.0, 15.0, 15.0, 17.0, 25.0, 27.0, 40.0, 40.0, 70.0, 102.0, 167.0, 401.0, 1312.0, 900233.0, 144331.0, 844.0, 306.0, 161.0, 105.0, 60.0, 48.0, 26.0, 25.0, 34.0, 15.0, 11.0, 18.0, 11.0, 7.0, 6.0, 9.0, 9.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-23.203125, -22.4970703125, -21.791015625, -21.0849609375, -20.37890625, -19.6728515625, -18.966796875, -18.2607421875, -17.5546875, -16.8486328125, -16.142578125, -15.4365234375, -14.73046875, -14.0244140625, -13.318359375, -12.6123046875, -11.90625, -11.2001953125, -10.494140625, -9.7880859375, -9.08203125, -8.3759765625, -7.669921875, -6.9638671875, -6.2578125, -5.5517578125, -4.845703125, -4.1396484375, -3.43359375, -2.7275390625, -2.021484375, -1.3154296875, -0.609375, 0.0966796875, 0.802734375, 1.5087890625, 2.21484375, 2.9208984375, 3.626953125, 4.3330078125, 5.0390625, 5.7451171875, 6.451171875, 7.1572265625, 7.86328125, 8.5693359375, 9.275390625, 9.9814453125, 10.6875, 11.3935546875, 12.099609375, 12.8056640625, 13.51171875, 14.2177734375, 14.923828125, 15.6298828125, 16.3359375, 17.0419921875, 17.748046875, 18.4541015625, 19.16015625, 19.8662109375, 20.572265625, 21.2783203125, 21.984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 5.0, 4.0, 10.0, 5.0, 12.0, 11.0, 19.0, 12.0, 30.0, 21.0, 29.0, 39.0, 47.0, 36.0, 56.0, 48.0, 58.0, 37.0, 60.0, 41.0, 65.0, 59.0, 53.0, 31.0, 25.0, 27.0, 26.0, 24.0, 22.0, 12.0, 7.0, 14.0, 11.0, 9.0, 4.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.09375, -9.7830810546875, -9.472412109375, -9.1617431640625, -8.85107421875, -8.5404052734375, -8.229736328125, -7.9190673828125, -7.6083984375, -7.2977294921875, -6.987060546875, -6.6763916015625, -6.36572265625, -6.0550537109375, -5.744384765625, -5.4337158203125, -5.123046875, -4.8123779296875, -4.501708984375, -4.1910400390625, -3.88037109375, -3.5697021484375, -3.259033203125, -2.9483642578125, -2.6376953125, -2.3270263671875, -2.016357421875, -1.7056884765625, -1.39501953125, -1.0843505859375, -0.773681640625, -0.4630126953125, -0.15234375, 0.1583251953125, 0.468994140625, 0.7796630859375, 1.09033203125, 1.4010009765625, 1.711669921875, 2.0223388671875, 2.3330078125, 2.6436767578125, 2.954345703125, 3.2650146484375, 3.57568359375, 3.8863525390625, 4.197021484375, 4.5076904296875, 4.818359375, 5.1290283203125, 5.439697265625, 5.7503662109375, 6.06103515625, 6.3717041015625, 6.682373046875, 6.9930419921875, 7.3037109375, 7.6143798828125, 7.925048828125, 8.2357177734375, 8.54638671875, 8.8570556640625, 9.167724609375, 9.4783935546875, 9.7890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 8.0, 11.0, 12.0, 27.0, 46.0, 46.0, 81.0, 185.0, 396.0, 1612.0, 11685.0, 612505.0, 411295.0, 8632.0, 1319.0, 328.0, 152.0, 81.0, 45.0, 16.0, 20.0, 9.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4765625, -2.37310791015625, -2.2696533203125, -2.16619873046875, -2.062744140625, -1.95928955078125, -1.8558349609375, -1.75238037109375, -1.64892578125, -1.54547119140625, -1.4420166015625, -1.33856201171875, -1.235107421875, -1.13165283203125, -1.0281982421875, -0.92474365234375, -0.8212890625, -0.71783447265625, -0.6143798828125, -0.51092529296875, -0.407470703125, -0.30401611328125, -0.2005615234375, -0.09710693359375, 0.00634765625, 0.10980224609375, 0.2132568359375, 0.31671142578125, 0.420166015625, 0.52362060546875, 0.6270751953125, 0.73052978515625, 0.833984375, 0.93743896484375, 1.0408935546875, 1.14434814453125, 1.247802734375, 1.35125732421875, 1.4547119140625, 1.55816650390625, 1.66162109375, 1.76507568359375, 1.8685302734375, 1.97198486328125, 2.075439453125, 2.17889404296875, 2.2823486328125, 2.38580322265625, 2.4892578125, 2.59271240234375, 2.6961669921875, 2.79962158203125, 2.903076171875, 3.00653076171875, 3.1099853515625, 3.21343994140625, 3.31689453125, 3.42034912109375, 3.5238037109375, 3.62725830078125, 3.730712890625, 3.83416748046875, 3.9376220703125, 4.04107666015625, 4.14453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 12.0, 25.0, 16.0, 55.0, 54.0, 72.0, 97.0, 118.0, 110.0, 99.0, 80.0, 72.0, 47.0, 36.0, 24.0, 18.0, 18.0, 10.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00021147727966308594, -0.00020375102758407593, -0.00019602477550506592, -0.0001882985234260559, -0.0001805722713470459, -0.0001728460192680359, -0.00016511976718902588, -0.00015739351511001587, -0.00014966726303100586, -0.00014194101095199585, -0.00013421475887298584, -0.00012648850679397583, -0.00011876225471496582, -0.00011103600263595581, -0.0001033097505569458, -9.558349847793579e-05, -8.785724639892578e-05, -8.013099431991577e-05, -7.240474224090576e-05, -6.467849016189575e-05, -5.695223808288574e-05, -4.922598600387573e-05, -4.149973392486572e-05, -3.377348184585571e-05, -2.6047229766845703e-05, -1.8320977687835693e-05, -1.0594725608825684e-05, -2.868473529815674e-06, 4.857778549194336e-06, 1.2584030628204346e-05, 2.0310282707214355e-05, 2.8036534786224365e-05, 3.5762786865234375e-05, 4.3489038944244385e-05, 5.1215291023254395e-05, 5.8941543102264404e-05, 6.666779518127441e-05, 7.439404726028442e-05, 8.212029933929443e-05, 8.984655141830444e-05, 9.757280349731445e-05, 0.00010529905557632446, 0.00011302530765533447, 0.00012075155973434448, 0.0001284778118133545, 0.0001362040638923645, 0.0001439303159713745, 0.00015165656805038452, 0.00015938282012939453, 0.00016710907220840454, 0.00017483532428741455, 0.00018256157636642456, 0.00019028782844543457, 0.00019801408052444458, 0.0002057403326034546, 0.0002134665846824646, 0.0002211928367614746, 0.00022891908884048462, 0.00023664534091949463, 0.00024437159299850464, 0.00025209784507751465, 0.00025982409715652466, 0.00026755034923553467, 0.0002752766013145447, 0.0002830028533935547]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 3.0, 6.0, 8.0, 4.0, 12.0, 19.0, 18.0, 43.0, 49.0, 74.0, 114.0, 240.0, 543.0, 1624.0, 7053.0, 82935.0, 820575.0, 123093.0, 8916.0, 1888.0, 660.0, 278.0, 137.0, 74.0, 49.0, 39.0, 24.0, 19.0, 11.0, 13.0, 1.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.443359375, -2.365936279296875, -2.28851318359375, -2.211090087890625, -2.1336669921875, -2.056243896484375, -1.97882080078125, -1.901397705078125, -1.823974609375, -1.746551513671875, -1.66912841796875, -1.591705322265625, -1.5142822265625, -1.436859130859375, -1.35943603515625, -1.282012939453125, -1.20458984375, -1.127166748046875, -1.04974365234375, -0.972320556640625, -0.8948974609375, -0.817474365234375, -0.74005126953125, -0.662628173828125, -0.585205078125, -0.507781982421875, -0.43035888671875, -0.352935791015625, -0.2755126953125, -0.198089599609375, -0.12066650390625, -0.043243408203125, 0.0341796875, 0.111602783203125, 0.18902587890625, 0.266448974609375, 0.3438720703125, 0.421295166015625, 0.49871826171875, 0.576141357421875, 0.653564453125, 0.730987548828125, 0.80841064453125, 0.885833740234375, 0.9632568359375, 1.040679931640625, 1.11810302734375, 1.195526123046875, 1.27294921875, 1.350372314453125, 1.42779541015625, 1.505218505859375, 1.5826416015625, 1.660064697265625, 1.73748779296875, 1.814910888671875, 1.892333984375, 1.969757080078125, 2.04718017578125, 2.124603271484375, 2.2020263671875, 2.279449462890625, 2.35687255859375, 2.434295654296875, 2.51171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 9.0, 8.0, 7.0, 22.0, 37.0, 53.0, 70.0, 85.0, 131.0, 132.0, 114.0, 94.0, 71.0, 46.0, 44.0, 24.0, 11.0, 13.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7392578125, -0.7151718139648438, -0.6910858154296875, -0.6669998168945312, -0.642913818359375, -0.6188278198242188, -0.5947418212890625, -0.5706558227539062, -0.54656982421875, -0.5224838256835938, -0.4983978271484375, -0.47431182861328125, -0.450225830078125, -0.42613983154296875, -0.4020538330078125, -0.37796783447265625, -0.3538818359375, -0.32979583740234375, -0.3057098388671875, -0.28162384033203125, -0.257537841796875, -0.23345184326171875, -0.2093658447265625, -0.18527984619140625, -0.16119384765625, -0.13710784912109375, -0.1130218505859375, -0.08893585205078125, -0.064849853515625, -0.04076385498046875, -0.0166778564453125, 0.00740814208984375, 0.031494140625, 0.05558013916015625, 0.0796661376953125, 0.10375213623046875, 0.127838134765625, 0.15192413330078125, 0.1760101318359375, 0.20009613037109375, 0.22418212890625, 0.24826812744140625, 0.2723541259765625, 0.29644012451171875, 0.320526123046875, 0.34461212158203125, 0.3686981201171875, 0.39278411865234375, 0.4168701171875, 0.44095611572265625, 0.4650421142578125, 0.48912811279296875, 0.513214111328125, 0.5373001098632812, 0.5613861083984375, 0.5854721069335938, 0.60955810546875, 0.6336441040039062, 0.6577301025390625, 0.6818161010742188, 0.705902099609375, 0.7299880981445312, 0.7540740966796875, 0.7781600952148438, 0.80224609375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 2.0, 9.0, 19.0, 31.0, 34.0, 33.0, 39.0, 51.0, 83.0, 100.0, 83.0, 84.0, 84.0, 65.0, 53.0, 63.0, 48.0, 44.0, 23.0, 12.0, 11.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.072953224182129, -5.83391809463501, -5.594883441925049, -5.35584831237793, -5.1168131828308105, -4.877778053283691, -4.6387434005737305, -4.399708271026611, -4.160673141479492, -3.921638250350952, -3.682603120803833, -3.443568229675293, -3.204533100128174, -2.965498208999634, -2.7264633178710938, -2.4874281883239746, -2.2483932971954346, -2.0093584060668945, -1.7703232765197754, -1.5312883853912354, -1.2922532558441162, -1.0532183647155762, -0.8141833543777466, -0.575148344039917, -0.3361133337020874, -0.097078338265419, 0.1419566571712494, 0.3809916377067566, 0.6200266480445862, 0.859061598777771, 1.0980966091156006, 1.3371316194534302, 1.5761666297912598, 1.8152016401290894, 2.054236650466919, 2.293271541595459, 2.532306671142578, 2.771341562271118, 3.010376453399658, 3.2494115829467773, 3.4884467124938965, 3.7274816036224365, 3.9665167331695557, 4.205551624298096, 4.444586753845215, 4.683621406555176, 4.922656536102295, 5.161691665649414, 5.400726318359375, 5.639761447906494, 5.878796100616455, 6.117831230163574, 6.356866359710693, 6.5959014892578125, 6.834936141967773, 7.073971271514893, 7.313006401062012, 7.552041530609131, 7.791076183319092, 8.030111312866211, 8.269145965576172, 8.50818157196045, 8.74721622467041, 8.986251831054688, 9.225286483764648]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 8.0, 6.0, 6.0, 6.0, 16.0, 18.0, 16.0, 23.0, 17.0, 23.0, 26.0, 30.0, 38.0, 40.0, 29.0, 39.0, 47.0, 50.0, 60.0, 61.0, 57.0, 39.0, 44.0, 36.0, 40.0, 28.0, 26.0, 30.0, 23.0, 24.0, 21.0, 19.0, 14.0, 7.0, 12.0, 4.0, 6.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-14.550750732421875, -14.161721229553223, -13.772692680358887, -13.383663177490234, -12.994634628295898, -12.605605125427246, -12.216575622558594, -11.827547073364258, -11.438517570495605, -11.049488067626953, -10.660459518432617, -10.271430015563965, -9.882401466369629, -9.493371963500977, -9.10434341430664, -8.715313911437988, -8.326284408569336, -7.937255382537842, -7.548226356506348, -7.159196853637695, -6.770167827606201, -6.381138801574707, -5.992109775543213, -5.603080749511719, -5.214052200317383, -4.825023174285889, -4.4359941482543945, -4.046964645385742, -3.657935619354248, -3.268906593322754, -2.8798775672912598, -2.4908483028411865, -2.1018190383911133, -1.7127898931503296, -1.323760747909546, -0.9347317218780518, -0.5457025766372681, -0.15667343139648438, 0.23235559463500977, 0.621384859085083, 1.0104138851165771, 1.3994430303573608, 1.7884721755981445, 2.1775012016296387, 2.566530227661133, 2.955559492111206, 3.3445885181427, 3.7336177825927734, 4.122646808624268, 4.511675834655762, 4.900704860687256, 5.28973388671875, 5.678763389587402, 6.0677924156188965, 6.456821441650391, 6.845850944519043, 7.234879493713379, 7.623908519744873, 8.012937545776367, 8.40196704864502, 8.790995597839355, 9.180025100708008, 9.569053649902344, 9.958083152770996, 10.347112655639648]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 8.0, 8.0, 13.0, 11.0, 16.0, 31.0, 29.0, 45.0, 42.0, 62.0, 80.0, 134.0, 235.0, 550.0, 2298.0, 13465.0, 149582.0, 1830310.0, 2004396.0, 174086.0, 14942.0, 2463.0, 664.0, 263.0, 148.0, 104.0, 74.0, 52.0, 30.0, 36.0, 25.0, 19.0, 11.0, 10.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.46875, -9.19842529296875, -8.9281005859375, -8.65777587890625, -8.387451171875, -8.11712646484375, -7.8468017578125, -7.57647705078125, -7.30615234375, -7.03582763671875, -6.7655029296875, -6.49517822265625, -6.224853515625, -5.95452880859375, -5.6842041015625, -5.41387939453125, -5.1435546875, -4.87322998046875, -4.6029052734375, -4.33258056640625, -4.062255859375, -3.79193115234375, -3.5216064453125, -3.25128173828125, -2.98095703125, -2.71063232421875, -2.4403076171875, -2.16998291015625, -1.899658203125, -1.62933349609375, -1.3590087890625, -1.08868408203125, -0.818359375, -0.54803466796875, -0.2777099609375, -0.00738525390625, 0.262939453125, 0.53326416015625, 0.8035888671875, 1.07391357421875, 1.34423828125, 1.61456298828125, 1.8848876953125, 2.15521240234375, 2.425537109375, 2.69586181640625, 2.9661865234375, 3.23651123046875, 3.5068359375, 3.77716064453125, 4.0474853515625, 4.31781005859375, 4.588134765625, 4.85845947265625, 5.1287841796875, 5.39910888671875, 5.66943359375, 5.93975830078125, 6.2100830078125, 6.48040771484375, 6.750732421875, 7.02105712890625, 7.2913818359375, 7.56170654296875, 7.83203125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 4.0, 10.0, 14.0, 14.0, 8.0, 25.0, 10.0, 29.0, 33.0, 31.0, 45.0, 39.0, 45.0, 39.0, 41.0, 40.0, 71.0, 47.0, 53.0, 40.0, 34.0, 41.0, 40.0, 37.0, 34.0, 31.0, 22.0, 19.0, 14.0, 31.0, 14.0, 10.0, 7.0, 9.0, 4.0, 3.0, 6.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.468658447265625, -3.34942626953125, -3.230194091796875, -3.1109619140625, -2.991729736328125, -2.87249755859375, -2.753265380859375, -2.634033203125, -2.514801025390625, -2.39556884765625, -2.276336669921875, -2.1571044921875, -2.037872314453125, -1.91864013671875, -1.799407958984375, -1.68017578125, -1.560943603515625, -1.44171142578125, -1.322479248046875, -1.2032470703125, -1.084014892578125, -0.96478271484375, -0.845550537109375, -0.726318359375, -0.607086181640625, -0.48785400390625, -0.368621826171875, -0.2493896484375, -0.130157470703125, -0.01092529296875, 0.108306884765625, 0.2275390625, 0.346771240234375, 0.46600341796875, 0.585235595703125, 0.7044677734375, 0.823699951171875, 0.94293212890625, 1.062164306640625, 1.181396484375, 1.300628662109375, 1.41986083984375, 1.539093017578125, 1.6583251953125, 1.777557373046875, 1.89678955078125, 2.016021728515625, 2.13525390625, 2.254486083984375, 2.37371826171875, 2.492950439453125, 2.6121826171875, 2.731414794921875, 2.85064697265625, 2.969879150390625, 3.089111328125, 3.208343505859375, 3.32757568359375, 3.446807861328125, 3.5660400390625, 3.685272216796875, 3.80450439453125, 3.923736572265625, 4.04296875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 13.0, 11.0, 27.0, 39.0, 70.0, 108.0, 238.0, 614.0, 6794.0, 4162716.0, 22257.0, 791.0, 261.0, 138.0, 75.0, 37.0, 22.0, 13.0, 13.0, 15.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.8125, -38.724609375, -37.63671875, -36.548828125, -35.4609375, -34.373046875, -33.28515625, -32.197265625, -31.109375, -30.021484375, -28.93359375, -27.845703125, -26.7578125, -25.669921875, -24.58203125, -23.494140625, -22.40625, -21.318359375, -20.23046875, -19.142578125, -18.0546875, -16.966796875, -15.87890625, -14.791015625, -13.703125, -12.615234375, -11.52734375, -10.439453125, -9.3515625, -8.263671875, -7.17578125, -6.087890625, -5.0, -3.912109375, -2.82421875, -1.736328125, -0.6484375, 0.439453125, 1.52734375, 2.615234375, 3.703125, 4.791015625, 5.87890625, 6.966796875, 8.0546875, 9.142578125, 10.23046875, 11.318359375, 12.40625, 13.494140625, 14.58203125, 15.669921875, 16.7578125, 17.845703125, 18.93359375, 20.021484375, 21.109375, 22.197265625, 23.28515625, 24.373046875, 25.4609375, 26.548828125, 27.63671875, 28.724609375, 29.8125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 3.0, 5.0, 11.0, 7.0, 6.0, 12.0, 18.0, 25.0, 33.0, 47.0, 53.0, 92.0, 146.0, 165.0, 262.0, 315.0, 453.0, 537.0, 456.0, 379.0, 319.0, 181.0, 186.0, 110.0, 63.0, 49.0, 33.0, 34.0, 23.0, 17.0, 5.0, 8.0, 8.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.1680755615234375, -2.105682373046875, -2.0432891845703125, -1.98089599609375, -1.9185028076171875, -1.856109619140625, -1.7937164306640625, -1.7313232421875, -1.6689300537109375, -1.606536865234375, -1.5441436767578125, -1.48175048828125, -1.4193572998046875, -1.356964111328125, -1.2945709228515625, -1.232177734375, -1.1697845458984375, -1.107391357421875, -1.0449981689453125, -0.98260498046875, -0.9202117919921875, -0.857818603515625, -0.7954254150390625, -0.7330322265625, -0.6706390380859375, -0.608245849609375, -0.5458526611328125, -0.48345947265625, -0.4210662841796875, -0.358673095703125, -0.2962799072265625, -0.23388671875, -0.1714935302734375, -0.109100341796875, -0.0467071533203125, 0.01568603515625, 0.0780792236328125, 0.140472412109375, 0.2028656005859375, 0.2652587890625, 0.3276519775390625, 0.390045166015625, 0.4524383544921875, 0.51483154296875, 0.5772247314453125, 0.639617919921875, 0.7020111083984375, 0.764404296875, 0.8267974853515625, 0.889190673828125, 0.9515838623046875, 1.01397705078125, 1.0763702392578125, 1.138763427734375, 1.2011566162109375, 1.2635498046875, 1.3259429931640625, 1.388336181640625, 1.4507293701171875, 1.51312255859375, 1.5755157470703125, 1.637908935546875, 1.7003021240234375, 1.7626953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 0.0, 5.0, 7.0, 11.0, 26.0, 31.0, 42.0, 72.0, 83.0, 114.0, 122.0, 105.0, 120.0, 89.0, 57.0, 48.0, 33.0, 14.0, 11.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93251633644104, -3.671781063079834, -3.411045789718628, -3.150310516357422, -2.889575242996216, -2.6288399696350098, -2.3681046962738037, -2.1073694229125977, -1.8466341495513916, -1.5858988761901855, -1.3251636028289795, -1.0644283294677734, -0.8036930561065674, -0.5429577827453613, -0.2822225093841553, -0.02148723602294922, 0.23924803733825684, 0.4999833106994629, 0.760718584060669, 1.021453857421875, 1.282189130783081, 1.542924404144287, 1.8036596775054932, 2.064394950866699, 2.3251302242279053, 2.5858654975891113, 2.8466007709503174, 3.1073360443115234, 3.3680713176727295, 3.6288065910339355, 3.8895418643951416, 4.150277137756348, 4.411011695861816, 4.671747207641602, 4.9324822425842285, 5.1932172775268555, 5.453952789306641, 5.714688301086426, 5.975423336029053, 6.23615837097168, 6.496893882751465, 6.75762939453125, 7.018364429473877, 7.279099464416504, 7.539834976196289, 7.800570487976074, 8.06130599975586, 8.322040557861328, 8.582776069641113, 8.843511581420898, 9.104246139526367, 9.364981651306152, 9.625717163085938, 9.886452674865723, 10.147188186645508, 10.407922744750977, 10.668658256530762, 10.929393768310547, 11.190128326416016, 11.4508638381958, 11.711599349975586, 11.972334861755371, 12.233070373535156, 12.493804931640625, 12.75454044342041]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 5.0, 6.0, 14.0, 13.0, 22.0, 21.0, 21.0, 26.0, 29.0, 23.0, 32.0, 38.0, 31.0, 27.0, 39.0, 46.0, 41.0, 37.0, 26.0, 50.0, 44.0, 47.0, 32.0, 40.0, 31.0, 28.0, 29.0, 33.0, 24.0, 30.0, 15.0, 12.0, 10.0, 11.0, 13.0, 11.0, 9.0, 6.0, 7.0, 5.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.7853381633758545, -3.6622438430786133, -3.539149522781372, -3.416055202484131, -3.2929606437683105, -3.1698663234710693, -3.046772003173828, -2.923677682876587, -2.8005833625793457, -2.6774890422821045, -2.5543947219848633, -2.431300163269043, -2.3082058429718018, -2.1851115226745605, -2.0620172023773193, -1.9389228820800781, -1.8158283233642578, -1.6927340030670166, -1.5696395635604858, -1.4465452432632446, -1.3234508037567139, -1.2003564834594727, -1.0772621631622314, -0.9541677832603455, -0.8310734033584595, -0.7079790234565735, -0.5848846435546875, -0.4617903232574463, -0.3386959433555603, -0.21560156345367432, -0.0925072431564331, 0.03058713674545288, 0.15368175506591797, 0.27677613496780396, 0.39987048506736755, 0.5229648351669312, 0.6460592150688171, 0.7691535949707031, 0.8922479152679443, 1.0153422355651855, 1.1384366750717163, 1.2615309953689575, 1.3846254348754883, 1.5077197551727295, 1.6308140754699707, 1.7539085149765015, 1.8770028352737427, 2.0000972747802734, 2.1231915950775146, 2.246285915374756, 2.369380235671997, 2.4924745559692383, 2.6155691146850586, 2.7386634349823, 2.861757755279541, 2.9848520755767822, 3.1079463958740234, 3.2310407161712646, 3.354135036468506, 3.477229595184326, 3.6003239154815674, 3.7234182357788086, 3.84651255607605, 3.969606876373291, 4.092701435089111]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 8.0, 12.0, 15.0, 21.0, 35.0, 53.0, 70.0, 96.0, 168.0, 254.0, 491.0, 737.0, 1283.0, 2125.0, 3975.0, 8755.0, 38424.0, 408356.0, 512041.0, 51386.0, 10115.0, 4342.0, 2339.0, 1328.0, 832.0, 483.0, 282.0, 166.0, 118.0, 78.0, 61.0, 36.0, 25.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.3331527709960938, -1.2961883544921875, -1.2592239379882812, -1.222259521484375, -1.1852951049804688, -1.1483306884765625, -1.1113662719726562, -1.07440185546875, -1.0374374389648438, -1.0004730224609375, -0.9635086059570312, -0.926544189453125, -0.8895797729492188, -0.8526153564453125, -0.8156509399414062, -0.7786865234375, -0.7417221069335938, -0.7047576904296875, -0.6677932739257812, -0.630828857421875, -0.5938644409179688, -0.5569000244140625, -0.5199356079101562, -0.48297119140625, -0.44600677490234375, -0.4090423583984375, -0.37207794189453125, -0.335113525390625, -0.29814910888671875, -0.2611846923828125, -0.22422027587890625, -0.187255859375, -0.15029144287109375, -0.1133270263671875, -0.07636260986328125, -0.039398193359375, -0.00243377685546875, 0.0345306396484375, 0.07149505615234375, 0.10845947265625, 0.14542388916015625, 0.1823883056640625, 0.21935272216796875, 0.256317138671875, 0.29328155517578125, 0.3302459716796875, 0.36721038818359375, 0.4041748046875, 0.44113922119140625, 0.4781036376953125, 0.5150680541992188, 0.552032470703125, 0.5889968872070312, 0.6259613037109375, 0.6629257202148438, 0.69989013671875, 0.7368545532226562, 0.7738189697265625, 0.8107833862304688, 0.847747802734375, 0.8847122192382812, 0.9216766357421875, 0.9586410522460938, 0.99560546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 21.0, 14.0, 24.0, 21.0, 36.0, 26.0, 34.0, 49.0, 33.0, 48.0, 47.0, 31.0, 52.0, 56.0, 51.0, 47.0, 49.0, 36.0, 37.0, 40.0, 30.0, 38.0, 29.0, 20.0, 21.0, 17.0, 16.0, 15.0, 9.0, 10.0, 8.0, 4.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3828125, -2.29443359375, -2.2060546875, -2.11767578125, -2.029296875, -1.94091796875, -1.8525390625, -1.76416015625, -1.67578125, -1.58740234375, -1.4990234375, -1.41064453125, -1.322265625, -1.23388671875, -1.1455078125, -1.05712890625, -0.96875, -0.88037109375, -0.7919921875, -0.70361328125, -0.615234375, -0.52685546875, -0.4384765625, -0.35009765625, -0.26171875, -0.17333984375, -0.0849609375, 0.00341796875, 0.091796875, 0.18017578125, 0.2685546875, 0.35693359375, 0.4453125, 0.53369140625, 0.6220703125, 0.71044921875, 0.798828125, 0.88720703125, 0.9755859375, 1.06396484375, 1.15234375, 1.24072265625, 1.3291015625, 1.41748046875, 1.505859375, 1.59423828125, 1.6826171875, 1.77099609375, 1.859375, 1.94775390625, 2.0361328125, 2.12451171875, 2.212890625, 2.30126953125, 2.3896484375, 2.47802734375, 2.56640625, 2.65478515625, 2.7431640625, 2.83154296875, 2.919921875, 3.00830078125, 3.0966796875, 3.18505859375, 3.2734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 0.0, 4.0, 4.0, 9.0, 18.0, 20.0, 33.0, 50.0, 76.0, 157.0, 256.0, 495.0, 887.0, 1849.0, 3573.0, 7503.0, 15702.0, 33672.0, 71589.0, 143527.0, 233575.0, 239498.0, 151516.0, 76512.0, 35753.0, 16600.0, 7884.0, 3766.0, 1873.0, 991.0, 504.0, 276.0, 144.0, 85.0, 49.0, 34.0, 15.0, 21.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.273193359375, -0.2651691436767578, -0.2571449279785156, -0.24912071228027344, -0.24109649658203125, -0.23307228088378906, -0.22504806518554688, -0.2170238494873047, -0.2089996337890625, -0.2009754180908203, -0.19295120239257812, -0.18492698669433594, -0.17690277099609375, -0.16887855529785156, -0.16085433959960938, -0.1528301239013672, -0.144805908203125, -0.1367816925048828, -0.12875747680664062, -0.12073326110839844, -0.11270904541015625, -0.10468482971191406, -0.09666061401367188, -0.08863639831542969, -0.0806121826171875, -0.07258796691894531, -0.06456375122070312, -0.05653953552246094, -0.04851531982421875, -0.04049110412597656, -0.032466888427734375, -0.024442672729492188, -0.01641845703125, -0.008394241333007812, -0.000370025634765625, 0.0076541900634765625, 0.01567840576171875, 0.023702621459960938, 0.031726837158203125, 0.03975105285644531, 0.0477752685546875, 0.05579948425292969, 0.06382369995117188, 0.07184791564941406, 0.07987213134765625, 0.08789634704589844, 0.09592056274414062, 0.10394477844238281, 0.111968994140625, 0.11999320983886719, 0.12801742553710938, 0.13604164123535156, 0.14406585693359375, 0.15209007263183594, 0.16011428833007812, 0.1681385040283203, 0.1761627197265625, 0.1841869354248047, 0.19221115112304688, 0.20023536682128906, 0.20825958251953125, 0.21628379821777344, 0.22430801391601562, 0.2323322296142578, 0.2403564453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 5.0, 15.0, 9.0, 8.0, 11.0, 12.0, 14.0, 20.0, 28.0, 25.0, 26.0, 38.0, 42.0, 34.0, 48.0, 39.0, 43.0, 45.0, 53.0, 46.0, 50.0, 55.0, 35.0, 33.0, 31.0, 30.0, 25.0, 21.0, 28.0, 19.0, 24.0, 12.0, 17.0, 11.0, 10.0, 3.0, 7.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -4.03887939453125, -3.8980712890625, -3.75726318359375, -3.616455078125, -3.47564697265625, -3.3348388671875, -3.19403076171875, -3.05322265625, -2.91241455078125, -2.7716064453125, -2.63079833984375, -2.489990234375, -2.34918212890625, -2.2083740234375, -2.06756591796875, -1.9267578125, -1.78594970703125, -1.6451416015625, -1.50433349609375, -1.363525390625, -1.22271728515625, -1.0819091796875, -0.94110107421875, -0.80029296875, -0.65948486328125, -0.5186767578125, -0.37786865234375, -0.237060546875, -0.09625244140625, 0.0445556640625, 0.18536376953125, 0.326171875, 0.46697998046875, 0.6077880859375, 0.74859619140625, 0.889404296875, 1.03021240234375, 1.1710205078125, 1.31182861328125, 1.45263671875, 1.59344482421875, 1.7342529296875, 1.87506103515625, 2.015869140625, 2.15667724609375, 2.2974853515625, 2.43829345703125, 2.5791015625, 2.71990966796875, 2.8607177734375, 3.00152587890625, 3.142333984375, 3.28314208984375, 3.4239501953125, 3.56475830078125, 3.70556640625, 3.84637451171875, 3.9871826171875, 4.12799072265625, 4.268798828125, 4.40960693359375, 4.5504150390625, 4.69122314453125, 4.83203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 2.0, 26.0, 16.0, 23.0, 51.0, 63.0, 93.0, 122.0, 209.0, 317.0, 570.0, 1141.0, 2631.0, 6482.0, 22083.0, 117587.0, 534160.0, 295702.0, 47923.0, 11663.0, 4101.0, 1638.0, 794.0, 402.0, 257.0, 166.0, 116.0, 67.0, 47.0, 37.0, 19.0, 17.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.061893463134765625, -0.05994415283203125, -0.057994842529296875, -0.0560455322265625, -0.054096221923828125, -0.05214691162109375, -0.050197601318359375, -0.048248291015625, -0.046298980712890625, -0.04434967041015625, -0.042400360107421875, -0.0404510498046875, -0.038501739501953125, -0.03655242919921875, -0.034603118896484375, -0.03265380859375, -0.030704498291015625, -0.02875518798828125, -0.026805877685546875, -0.0248565673828125, -0.022907257080078125, -0.02095794677734375, -0.019008636474609375, -0.017059326171875, -0.015110015869140625, -0.01316070556640625, -0.011211395263671875, -0.0092620849609375, -0.007312774658203125, -0.00536346435546875, -0.003414154052734375, -0.00146484375, 0.000484466552734375, 0.00243377685546875, 0.004383087158203125, 0.0063323974609375, 0.008281707763671875, 0.01023101806640625, 0.012180328369140625, 0.014129638671875, 0.016078948974609375, 0.01802825927734375, 0.019977569580078125, 0.0219268798828125, 0.023876190185546875, 0.02582550048828125, 0.027774810791015625, 0.02972412109375, 0.031673431396484375, 0.03362274169921875, 0.035572052001953125, 0.0375213623046875, 0.039470672607421875, 0.04141998291015625, 0.043369293212890625, 0.045318603515625, 0.047267913818359375, 0.04921722412109375, 0.051166534423828125, 0.0531158447265625, 0.055065155029296875, 0.05701446533203125, 0.058963775634765625, 0.0609130859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 12.0, 24.0, 25.0, 42.0, 69.0, 73.0, 94.0, 102.0, 116.0, 113.0, 94.0, 59.0, 51.0, 28.0, 28.0, 20.0, 8.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.898143768310547e-05, -3.737863153219223e-05, -3.577582538127899e-05, -3.417301923036575e-05, -3.2570213079452515e-05, -3.0967406928539276e-05, -2.9364600777626038e-05, -2.77617946267128e-05, -2.615898847579956e-05, -2.4556182324886322e-05, -2.2953376173973083e-05, -2.1350570023059845e-05, -1.9747763872146606e-05, -1.8144957721233368e-05, -1.654215157032013e-05, -1.4939345419406891e-05, -1.3336539268493652e-05, -1.1733733117580414e-05, -1.0130926966667175e-05, -8.528120815753937e-06, -6.925314664840698e-06, -5.32250851392746e-06, -3.719702363014221e-06, -2.1168962121009827e-06, -5.140900611877441e-07, 1.0887160897254944e-06, 2.691522240638733e-06, 4.2943283915519714e-06, 5.89713454246521e-06, 7.4999406933784485e-06, 9.102746844291687e-06, 1.0705552995204926e-05, 1.2308359146118164e-05, 1.3911165297031403e-05, 1.551397144794464e-05, 1.711677759885788e-05, 1.8719583749771118e-05, 2.0322389900684357e-05, 2.1925196051597595e-05, 2.3528002202510834e-05, 2.5130808353424072e-05, 2.673361450433731e-05, 2.833642065525055e-05, 2.9939226806163788e-05, 3.1542032957077026e-05, 3.3144839107990265e-05, 3.4747645258903503e-05, 3.635045140981674e-05, 3.795325756072998e-05, 3.955606371164322e-05, 4.115886986255646e-05, 4.2761676013469696e-05, 4.4364482164382935e-05, 4.596728831529617e-05, 4.757009446620941e-05, 4.917290061712265e-05, 5.077570676803589e-05, 5.237851291894913e-05, 5.3981319069862366e-05, 5.5584125220775604e-05, 5.718693137168884e-05, 5.878973752260208e-05, 6.039254367351532e-05, 6.199534982442856e-05, 6.35981559753418e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 13.0, 32.0, 89.0, 290.0, 1200.0, 5460.0, 432144.0, 601490.0, 6067.0, 1241.0, 338.0, 103.0, 46.0, 9.0, 9.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2315673828125, -0.2226696014404297, -0.21377182006835938, -0.20487403869628906, -0.19597625732421875, -0.18707847595214844, -0.17818069458007812, -0.1692829132080078, -0.1603851318359375, -0.1514873504638672, -0.14258956909179688, -0.13369178771972656, -0.12479400634765625, -0.11589622497558594, -0.10699844360351562, -0.09810066223144531, -0.089202880859375, -0.08030509948730469, -0.07140731811523438, -0.06250953674316406, -0.05361175537109375, -0.04471397399902344, -0.035816192626953125, -0.026918411254882812, -0.0180206298828125, -0.009122848510742188, -0.000225067138671875, 0.008672714233398438, 0.01757049560546875, 0.026468276977539062, 0.035366058349609375, 0.04426383972167969, 0.05316162109375, 0.06205940246582031, 0.07095718383789062, 0.07985496520996094, 0.08875274658203125, 0.09765052795410156, 0.10654830932617188, 0.11544609069824219, 0.1243438720703125, 0.1332416534423828, 0.14213943481445312, 0.15103721618652344, 0.15993499755859375, 0.16883277893066406, 0.17773056030273438, 0.1866283416748047, 0.195526123046875, 0.2044239044189453, 0.21332168579101562, 0.22221946716308594, 0.23111724853515625, 0.24001502990722656, 0.24891281127929688, 0.2578105926513672, 0.2667083740234375, 0.2756061553955078, 0.2845039367675781, 0.29340171813964844, 0.30229949951171875, 0.31119728088378906, 0.3200950622558594, 0.3289928436279297, 0.337890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 2.0, 9.0, 12.0, 16.0, 28.0, 42.0, 62.0, 99.0, 133.0, 162.0, 133.0, 101.0, 76.0, 48.0, 26.0, 17.0, 8.0, 8.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157318115234375, -0.015091657638549805, -0.01445150375366211, -0.013811349868774414, -0.013171195983886719, -0.012531042098999023, -0.011890888214111328, -0.011250734329223633, -0.010610580444335938, -0.009970426559448242, -0.009330272674560547, -0.008690118789672852, -0.008049964904785156, -0.007409811019897461, -0.006769657135009766, -0.00612950325012207, -0.005489349365234375, -0.00484919548034668, -0.004209041595458984, -0.003568887710571289, -0.0029287338256835938, -0.0022885799407958984, -0.0016484260559082031, -0.0010082721710205078, -0.0003681182861328125, 0.0002720355987548828, 0.0009121894836425781, 0.0015523433685302734, 0.0021924972534179688, 0.002832651138305664, 0.0034728050231933594, 0.004112958908081055, 0.00475311279296875, 0.005393266677856445, 0.006033420562744141, 0.006673574447631836, 0.007313728332519531, 0.007953882217407227, 0.008594036102294922, 0.009234189987182617, 0.009874343872070312, 0.010514497756958008, 0.011154651641845703, 0.011794805526733398, 0.012434959411621094, 0.013075113296508789, 0.013715267181396484, 0.01435542106628418, 0.014995574951171875, 0.01563572883605957, 0.016275882720947266, 0.01691603660583496, 0.017556190490722656, 0.01819634437561035, 0.018836498260498047, 0.019476652145385742, 0.020116806030273438, 0.020756959915161133, 0.021397113800048828, 0.022037267684936523, 0.02267742156982422, 0.023317575454711914, 0.02395772933959961, 0.024597883224487305, 0.025238037109375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 10.0, 15.0, 19.0, 24.0, 48.0, 46.0, 58.0, 68.0, 76.0, 88.0, 91.0, 78.0, 87.0, 68.0, 45.0, 48.0, 33.0, 24.0, 18.0, 12.0, 7.0, 5.0, 4.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4695677757263184, -2.3598077297210693, -2.250047445297241, -2.140287399291992, -2.030527353286743, -1.9207671880722046, -1.811007022857666, -1.701246976852417, -1.5914868116378784, -1.4817266464233398, -1.3719666004180908, -1.2622064352035522, -1.1524462699890137, -1.0426862239837646, -0.9329260587692261, -0.8231659531593323, -0.7134058475494385, -0.6036457419395447, -0.4938856065273285, -0.3841254711151123, -0.2743653655052185, -0.1646052598953247, -0.05484509468078613, 0.054915010929107666, 0.16467511653900146, 0.27443522214889526, 0.38419535756111145, 0.49395549297332764, 0.6037155985832214, 0.7134757041931152, 0.8232358694076538, 0.9329959750175476, 1.0427560806274414, 1.15251624584198, 1.262276291847229, 1.3720364570617676, 1.4817965030670166, 1.5915566682815552, 1.7013168334960938, 1.8110768795013428, 1.9208370447158813, 2.03059720993042, 2.140357255935669, 2.250117301940918, 2.359877586364746, 2.469637632369995, 2.579397678375244, 2.6891579627990723, 2.7989180088043213, 2.9086780548095703, 3.0184383392333984, 3.1281983852386475, 3.2379584312438965, 3.3477187156677246, 3.4574787616729736, 3.5672388076782227, 3.676999092102051, 3.7867591381073, 3.896519422531128, 4.006279468536377, 4.116039752960205, 4.225799560546875, 4.335559844970703, 4.445320129394531, 4.555079936981201]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 8.0, 10.0, 12.0, 17.0, 22.0, 27.0, 28.0, 41.0, 35.0, 43.0, 38.0, 29.0, 58.0, 50.0, 46.0, 38.0, 51.0, 60.0, 48.0, 51.0, 34.0, 30.0, 41.0, 34.0, 26.0, 23.0, 15.0, 20.0, 10.0, 12.0, 11.0, 8.0, 3.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3690061569213867, -2.2802863121032715, -2.1915667057037354, -2.10284686088562, -2.014127254486084, -1.9254074096679688, -1.8366875648498535, -1.7479678392410278, -1.6592481136322021, -1.5705283880233765, -1.4818086624145508, -1.3930888175964355, -1.3043690919876099, -1.2156493663787842, -1.126929521560669, -1.0382097959518433, -0.9494900703430176, -0.8607703447341919, -0.7720505595207214, -0.683330774307251, -0.5946110486984253, -0.5058913230895996, -0.41717153787612915, -0.3284517526626587, -0.239732027053833, -0.15101227164268494, -0.062292516231536865, 0.026427239179611206, 0.11514699459075928, 0.20386675000190735, 0.2925865054130554, 0.3813062906265259, 0.47002577781677246, 0.5587455034255981, 0.6474652886390686, 0.7361850738525391, 0.8249047994613647, 0.9136245250701904, 1.0023443698883057, 1.0910640954971313, 1.179783821105957, 1.2685035467147827, 1.3572232723236084, 1.4459431171417236, 1.5346628427505493, 1.623382568359375, 1.7121024131774902, 1.800822138786316, 1.8895418643951416, 1.9782615900039673, 2.066981315612793, 2.155701160430908, 2.2444210052490234, 2.3331406116485596, 2.421860456466675, 2.510580062866211, 2.599299907684326, 2.6880197525024414, 2.7767393589019775, 2.8654592037200928, 2.954178810119629, 3.042898654937744, 3.1316184997558594, 3.2203383445739746, 3.3090579509735107]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 11.0, 20.0, 31.0, 45.0, 67.0, 107.0, 149.0, 229.0, 427.0, 768.0, 1384.0, 2663.0, 5784.0, 12788.0, 29780.0, 72798.0, 167260.0, 294792.0, 247963.0, 121387.0, 50840.0, 21095.0, 9256.0, 4195.0, 2098.0, 1076.0, 599.0, 319.0, 186.0, 145.0, 84.0, 57.0, 37.0, 26.0, 20.0, 20.0, 11.0, 8.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.140625, -2.06878662109375, -1.9969482421875, -1.92510986328125, -1.853271484375, -1.78143310546875, -1.7095947265625, -1.63775634765625, -1.56591796875, -1.49407958984375, -1.4222412109375, -1.35040283203125, -1.278564453125, -1.20672607421875, -1.1348876953125, -1.06304931640625, -0.9912109375, -0.91937255859375, -0.8475341796875, -0.77569580078125, -0.703857421875, -0.63201904296875, -0.5601806640625, -0.48834228515625, -0.41650390625, -0.34466552734375, -0.2728271484375, -0.20098876953125, -0.129150390625, -0.05731201171875, 0.0145263671875, 0.08636474609375, 0.158203125, 0.23004150390625, 0.3018798828125, 0.37371826171875, 0.445556640625, 0.51739501953125, 0.5892333984375, 0.66107177734375, 0.73291015625, 0.80474853515625, 0.8765869140625, 0.94842529296875, 1.020263671875, 1.09210205078125, 1.1639404296875, 1.23577880859375, 1.3076171875, 1.37945556640625, 1.4512939453125, 1.52313232421875, 1.594970703125, 1.66680908203125, 1.7386474609375, 1.81048583984375, 1.88232421875, 1.95416259765625, 2.0260009765625, 2.09783935546875, 2.169677734375, 2.24151611328125, 2.3133544921875, 2.38519287109375, 2.45703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 12.0, 7.0, 11.0, 21.0, 17.0, 32.0, 28.0, 16.0, 26.0, 39.0, 29.0, 45.0, 36.0, 36.0, 45.0, 23.0, 34.0, 39.0, 35.0, 43.0, 34.0, 32.0, 32.0, 36.0, 39.0, 31.0, 24.0, 31.0, 21.0, 22.0, 12.0, 12.0, 14.0, 12.0, 14.0, 3.0, 5.0, 9.0, 8.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-4.0546875, -3.91815185546875, -3.7816162109375, -3.64508056640625, -3.508544921875, -3.37200927734375, -3.2354736328125, -3.09893798828125, -2.96240234375, -2.82586669921875, -2.6893310546875, -2.55279541015625, -2.416259765625, -2.27972412109375, -2.1431884765625, -2.00665283203125, -1.8701171875, -1.73358154296875, -1.5970458984375, -1.46051025390625, -1.323974609375, -1.18743896484375, -1.0509033203125, -0.91436767578125, -0.77783203125, -0.64129638671875, -0.5047607421875, -0.36822509765625, -0.231689453125, -0.09515380859375, 0.0413818359375, 0.17791748046875, 0.314453125, 0.45098876953125, 0.5875244140625, 0.72406005859375, 0.860595703125, 0.99713134765625, 1.1336669921875, 1.27020263671875, 1.40673828125, 1.54327392578125, 1.6798095703125, 1.81634521484375, 1.952880859375, 2.08941650390625, 2.2259521484375, 2.36248779296875, 2.4990234375, 2.63555908203125, 2.7720947265625, 2.90863037109375, 3.045166015625, 3.18170166015625, 3.3182373046875, 3.45477294921875, 3.59130859375, 3.72784423828125, 3.8643798828125, 4.00091552734375, 4.137451171875, 4.27398681640625, 4.4105224609375, 4.54705810546875, 4.68359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 9.0, 8.0, 10.0, 6.0, 11.0, 27.0, 28.0, 30.0, 37.0, 52.0, 51.0, 106.0, 131.0, 226.0, 634.0, 80643.0, 962925.0, 2621.0, 339.0, 177.0, 108.0, 87.0, 72.0, 40.0, 35.0, 27.0, 25.0, 24.0, 14.0, 6.0, 12.0, 3.0, 3.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-23.859375, -23.200927734375, -22.54248046875, -21.884033203125, -21.2255859375, -20.567138671875, -19.90869140625, -19.250244140625, -18.591796875, -17.933349609375, -17.27490234375, -16.616455078125, -15.9580078125, -15.299560546875, -14.64111328125, -13.982666015625, -13.32421875, -12.665771484375, -12.00732421875, -11.348876953125, -10.6904296875, -10.031982421875, -9.37353515625, -8.715087890625, -8.056640625, -7.398193359375, -6.73974609375, -6.081298828125, -5.4228515625, -4.764404296875, -4.10595703125, -3.447509765625, -2.7890625, -2.130615234375, -1.47216796875, -0.813720703125, -0.1552734375, 0.503173828125, 1.16162109375, 1.820068359375, 2.478515625, 3.136962890625, 3.79541015625, 4.453857421875, 5.1123046875, 5.770751953125, 6.42919921875, 7.087646484375, 7.74609375, 8.404541015625, 9.06298828125, 9.721435546875, 10.3798828125, 11.038330078125, 11.69677734375, 12.355224609375, 13.013671875, 13.672119140625, 14.33056640625, 14.989013671875, 15.6474609375, 16.305908203125, 16.96435546875, 17.622802734375, 18.28125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 5.0, 5.0, 7.0, 8.0, 11.0, 9.0, 12.0, 13.0, 14.0, 29.0, 26.0, 27.0, 39.0, 38.0, 45.0, 37.0, 31.0, 29.0, 39.0, 40.0, 55.0, 40.0, 68.0, 44.0, 48.0, 29.0, 36.0, 33.0, 30.0, 29.0, 14.0, 24.0, 17.0, 20.0, 9.0, 9.0, 4.0, 6.0, 5.0, 6.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.40234375, -5.24273681640625, -5.0831298828125, -4.92352294921875, -4.763916015625, -4.60430908203125, -4.4447021484375, -4.28509521484375, -4.12548828125, -3.96588134765625, -3.8062744140625, -3.64666748046875, -3.487060546875, -3.32745361328125, -3.1678466796875, -3.00823974609375, -2.8486328125, -2.68902587890625, -2.5294189453125, -2.36981201171875, -2.210205078125, -2.05059814453125, -1.8909912109375, -1.73138427734375, -1.57177734375, -1.41217041015625, -1.2525634765625, -1.09295654296875, -0.933349609375, -0.77374267578125, -0.6141357421875, -0.45452880859375, -0.294921875, -0.13531494140625, 0.0242919921875, 0.18389892578125, 0.343505859375, 0.50311279296875, 0.6627197265625, 0.82232666015625, 0.98193359375, 1.14154052734375, 1.3011474609375, 1.46075439453125, 1.620361328125, 1.77996826171875, 1.9395751953125, 2.09918212890625, 2.2587890625, 2.41839599609375, 2.5780029296875, 2.73760986328125, 2.897216796875, 3.05682373046875, 3.2164306640625, 3.37603759765625, 3.53564453125, 3.69525146484375, 3.8548583984375, 4.01446533203125, 4.174072265625, 4.33367919921875, 4.4932861328125, 4.65289306640625, 4.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 3.0, 4.0, 14.0, 16.0, 23.0, 34.0, 36.0, 58.0, 111.0, 168.0, 275.0, 626.0, 1770.0, 7267.0, 59375.0, 579348.0, 361691.0, 30592.0, 4634.0, 1328.0, 509.0, 258.0, 131.0, 79.0, 50.0, 29.0, 37.0, 17.0, 15.0, 7.0, 8.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.802734375, -1.74432373046875, -1.6859130859375, -1.62750244140625, -1.569091796875, -1.51068115234375, -1.4522705078125, -1.39385986328125, -1.33544921875, -1.27703857421875, -1.2186279296875, -1.16021728515625, -1.101806640625, -1.04339599609375, -0.9849853515625, -0.92657470703125, -0.8681640625, -0.80975341796875, -0.7513427734375, -0.69293212890625, -0.634521484375, -0.57611083984375, -0.5177001953125, -0.45928955078125, -0.40087890625, -0.34246826171875, -0.2840576171875, -0.22564697265625, -0.167236328125, -0.10882568359375, -0.0504150390625, 0.00799560546875, 0.06640625, 0.12481689453125, 0.1832275390625, 0.24163818359375, 0.300048828125, 0.35845947265625, 0.4168701171875, 0.47528076171875, 0.53369140625, 0.59210205078125, 0.6505126953125, 0.70892333984375, 0.767333984375, 0.82574462890625, 0.8841552734375, 0.94256591796875, 1.0009765625, 1.05938720703125, 1.1177978515625, 1.17620849609375, 1.234619140625, 1.29302978515625, 1.3514404296875, 1.40985107421875, 1.46826171875, 1.52667236328125, 1.5850830078125, 1.64349365234375, 1.701904296875, 1.76031494140625, 1.8187255859375, 1.87713623046875, 1.935546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 0.0, 1.0, 6.0, 7.0, 7.0, 10.0, 14.0, 19.0, 15.0, 24.0, 32.0, 23.0, 37.0, 53.0, 51.0, 47.0, 46.0, 62.0, 62.0, 60.0, 81.0, 49.0, 39.0, 41.0, 28.0, 29.0, 32.0, 22.0, 19.0, 17.0, 15.0, 12.0, 7.0, 7.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00015091896057128906, -0.00014655105769634247, -0.00014218315482139587, -0.00013781525194644928, -0.00013344734907150269, -0.0001290794461965561, -0.0001247115433216095, -0.0001203436404466629, -0.00011597573757171631, -0.00011160783469676971, -0.00010723993182182312, -0.00010287202894687653, -9.850412607192993e-05, -9.413622319698334e-05, -8.976832032203674e-05, -8.540041744709015e-05, -8.103251457214355e-05, -7.666461169719696e-05, -7.229670882225037e-05, -6.792880594730377e-05, -6.356090307235718e-05, -5.9193000197410583e-05, -5.482509732246399e-05, -5.0457194447517395e-05, -4.60892915725708e-05, -4.1721388697624207e-05, -3.735348582267761e-05, -3.298558294773102e-05, -2.8617680072784424e-05, -2.424977719783783e-05, -1.9881874322891235e-05, -1.551397144794464e-05, -1.1146068572998047e-05, -6.778165698051453e-06, -2.4102628231048584e-06, 1.957640051841736e-06, 6.32554292678833e-06, 1.0693445801734924e-05, 1.5061348676681519e-05, 1.9429251551628113e-05, 2.3797154426574707e-05, 2.81650573015213e-05, 3.2532960176467896e-05, 3.690086305141449e-05, 4.1268765926361084e-05, 4.563666880130768e-05, 5.000457167625427e-05, 5.437247455120087e-05, 5.874037742614746e-05, 6.310828030109406e-05, 6.747618317604065e-05, 7.184408605098724e-05, 7.621198892593384e-05, 8.057989180088043e-05, 8.494779467582703e-05, 8.931569755077362e-05, 9.368360042572021e-05, 9.805150330066681e-05, 0.0001024194061756134, 0.00010678730905056, 0.00011115521192550659, 0.00011552311480045319, 0.00011989101767539978, 0.00012425892055034637, 0.00012862682342529297]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 14.0, 18.0, 18.0, 51.0, 77.0, 151.0, 266.0, 750.0, 2634.0, 18590.0, 363951.0, 620994.0, 35400.0, 3955.0, 978.0, 320.0, 134.0, 69.0, 54.0, 37.0, 23.0, 18.0, 12.0, 7.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.328125, -2.250823974609375, -2.17352294921875, -2.096221923828125, -2.0189208984375, -1.941619873046875, -1.86431884765625, -1.787017822265625, -1.709716796875, -1.632415771484375, -1.55511474609375, -1.477813720703125, -1.4005126953125, -1.323211669921875, -1.24591064453125, -1.168609619140625, -1.09130859375, -1.014007568359375, -0.93670654296875, -0.859405517578125, -0.7821044921875, -0.704803466796875, -0.62750244140625, -0.550201416015625, -0.472900390625, -0.395599365234375, -0.31829833984375, -0.240997314453125, -0.1636962890625, -0.086395263671875, -0.00909423828125, 0.068206787109375, 0.1455078125, 0.222808837890625, 0.30010986328125, 0.377410888671875, 0.4547119140625, 0.532012939453125, 0.60931396484375, 0.686614990234375, 0.763916015625, 0.841217041015625, 0.91851806640625, 0.995819091796875, 1.0731201171875, 1.150421142578125, 1.22772216796875, 1.305023193359375, 1.38232421875, 1.459625244140625, 1.53692626953125, 1.614227294921875, 1.6915283203125, 1.768829345703125, 1.84613037109375, 1.923431396484375, 2.000732421875, 2.078033447265625, 2.15533447265625, 2.232635498046875, 2.3099365234375, 2.387237548828125, 2.46453857421875, 2.541839599609375, 2.619140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 12.0, 12.0, 25.0, 26.0, 37.0, 40.0, 57.0, 93.0, 90.0, 115.0, 104.0, 97.0, 71.0, 46.0, 24.0, 38.0, 29.0, 22.0, 15.0, 9.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.66259765625, -0.6429061889648438, -0.6232147216796875, -0.6035232543945312, -0.583831787109375, -0.5641403198242188, -0.5444488525390625, -0.5247573852539062, -0.50506591796875, -0.48537445068359375, -0.4656829833984375, -0.44599151611328125, -0.426300048828125, -0.40660858154296875, -0.3869171142578125, -0.36722564697265625, -0.3475341796875, -0.32784271240234375, -0.3081512451171875, -0.28845977783203125, -0.268768310546875, -0.24907684326171875, -0.2293853759765625, -0.20969390869140625, -0.19000244140625, -0.17031097412109375, -0.1506195068359375, -0.13092803955078125, -0.111236572265625, -0.09154510498046875, -0.0718536376953125, -0.05216217041015625, -0.032470703125, -0.01277923583984375, 0.0069122314453125, 0.02660369873046875, 0.046295166015625, 0.06598663330078125, 0.0856781005859375, 0.10536956787109375, 0.12506103515625, 0.14475250244140625, 0.1644439697265625, 0.18413543701171875, 0.203826904296875, 0.22351837158203125, 0.2432098388671875, 0.26290130615234375, 0.2825927734375, 0.30228424072265625, 0.3219757080078125, 0.34166717529296875, 0.361358642578125, 0.38105010986328125, 0.4007415771484375, 0.42043304443359375, 0.44012451171875, 0.45981597900390625, 0.4795074462890625, 0.49919891357421875, 0.518890380859375, 0.5385818481445312, 0.5582733154296875, 0.5779647827148438, 0.59765625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 14.0, 37.0, 82.0, 189.0, 242.0, 220.0, 142.0, 49.0, 19.0, 12.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.534438133239746, -3.872635841369629, -3.2108333110809326, -2.5490307807922363, -1.8872284889221191, -1.225426197052002, -0.5636236667633057, 0.09817886352539062, 0.7599811553955078, 1.4217835664749146, 2.0835859775543213, 2.7453885078430176, 3.4071907997131348, 4.068993091583252, 4.730795860290527, 5.3925981521606445, 6.054400444030762, 6.716202735900879, 7.378005027770996, 8.039807319641113, 8.701610565185547, 9.363412857055664, 10.025215148925781, 10.687017440795898, 11.348819732666016, 12.010622024536133, 12.67242431640625, 13.334226608276367, 13.996028900146484, 14.657831192016602, 15.319634437561035, 15.981436729431152, 16.643238067626953, 17.30504035949707, 17.966842651367188, 18.628644943237305, 19.290447235107422, 19.95224952697754, 20.614051818847656, 21.275856018066406, 21.93765640258789, 22.599458694458008, 23.261260986328125, 23.923063278198242, 24.58486557006836, 25.246667861938477, 25.908470153808594, 26.570274353027344, 27.23207664489746, 27.893878936767578, 28.555681228637695, 29.217483520507812, 29.87928581237793, 30.541088104248047, 31.202890396118164, 31.86469268798828, 32.52649688720703, 33.18830108642578, 33.850101470947266, 34.511905670166016, 35.1737060546875, 35.83551025390625, 36.497310638427734, 37.159114837646484, 37.82091522216797]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 13.0, 15.0, 8.0, 13.0, 14.0, 12.0, 23.0, 19.0, 30.0, 45.0, 54.0, 59.0, 46.0, 58.0, 37.0, 45.0, 42.0, 52.0, 47.0, 48.0, 42.0, 36.0, 32.0, 29.0, 26.0, 34.0, 18.0, 21.0, 10.0, 17.0, 9.0, 9.0, 9.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0], "bins": [-9.6424560546875, -9.384234428405762, -9.126012802124023, -8.867792129516602, -8.609570503234863, -8.351348876953125, -8.093127250671387, -7.834906101226807, -7.576684951782227, -7.318463325500488, -7.060242176055908, -6.80202054977417, -6.54379940032959, -6.285577774047852, -6.027356147766113, -5.769134998321533, -5.510913372039795, -5.252691745758057, -4.994470596313477, -4.736248970031738, -4.478027820587158, -4.21980619430542, -3.9615848064422607, -3.7033634185791016, -3.4451420307159424, -3.186920642852783, -2.928699254989624, -2.670477867126465, -2.4122562408447266, -2.1540350914001465, -1.8958134651184082, -1.637592077255249, -1.3793706893920898, -1.1211493015289307, -0.8629278540611267, -0.6047064065933228, -0.3464850187301636, -0.0882636308670044, 0.16995787620544434, 0.4281792640686035, 0.6864006519317627, 0.9446220397949219, 1.202843427658081, 1.4610649347305298, 1.719286322593689, 1.9775077104568481, 2.235729217529297, 2.493950605392456, 2.7521719932556152, 3.0103933811187744, 3.2686147689819336, 3.526836395263672, 3.785057544708252, 4.04327917098999, 4.30150032043457, 4.559721946716309, 4.817943572998047, 5.076165199279785, 5.334386348724365, 5.5926079750061035, 5.850829124450684, 6.109050750732422, 6.36727237701416, 6.62549352645874, 6.88371467590332]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 6.0, 13.0, 9.0, 8.0, 11.0, 33.0, 43.0, 46.0, 58.0, 105.0, 160.0, 236.0, 478.0, 1455.0, 10492.0, 166283.0, 2239553.0, 1668347.0, 97657.0, 6853.0, 1157.0, 496.0, 270.0, 154.0, 116.0, 80.0, 48.0, 34.0, 30.0, 17.0, 9.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.7239990234375, -8.432373046875, -8.1407470703125, -7.84912109375, -7.5574951171875, -7.265869140625, -6.9742431640625, -6.6826171875, -6.3909912109375, -6.099365234375, -5.8077392578125, -5.51611328125, -5.2244873046875, -4.932861328125, -4.6412353515625, -4.349609375, -4.0579833984375, -3.766357421875, -3.4747314453125, -3.18310546875, -2.8914794921875, -2.599853515625, -2.3082275390625, -2.0166015625, -1.7249755859375, -1.433349609375, -1.1417236328125, -0.85009765625, -0.5584716796875, -0.266845703125, 0.0247802734375, 0.31640625, 0.6080322265625, 0.899658203125, 1.1912841796875, 1.48291015625, 1.7745361328125, 2.066162109375, 2.3577880859375, 2.6494140625, 2.9410400390625, 3.232666015625, 3.5242919921875, 3.81591796875, 4.1075439453125, 4.399169921875, 4.6907958984375, 4.982421875, 5.2740478515625, 5.565673828125, 5.8572998046875, 6.14892578125, 6.4405517578125, 6.732177734375, 7.0238037109375, 7.3154296875, 7.6070556640625, 7.898681640625, 8.1903076171875, 8.48193359375, 8.7735595703125, 9.065185546875, 9.3568115234375, 9.6484375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 9.0, 7.0, 9.0, 17.0, 20.0, 22.0, 19.0, 27.0, 39.0, 36.0, 34.0, 53.0, 63.0, 67.0, 50.0, 68.0, 61.0, 60.0, 49.0, 40.0, 47.0, 36.0, 36.0, 25.0, 27.0, 26.0, 6.0, 11.0, 10.0, 9.0, 8.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.146728515625, -4.00048828125, -3.854248046875, -3.7080078125, -3.561767578125, -3.41552734375, -3.269287109375, -3.123046875, -2.976806640625, -2.83056640625, -2.684326171875, -2.5380859375, -2.391845703125, -2.24560546875, -2.099365234375, -1.953125, -1.806884765625, -1.66064453125, -1.514404296875, -1.3681640625, -1.221923828125, -1.07568359375, -0.929443359375, -0.783203125, -0.636962890625, -0.49072265625, -0.344482421875, -0.1982421875, -0.052001953125, 0.09423828125, 0.240478515625, 0.38671875, 0.532958984375, 0.67919921875, 0.825439453125, 0.9716796875, 1.117919921875, 1.26416015625, 1.410400390625, 1.556640625, 1.702880859375, 1.84912109375, 1.995361328125, 2.1416015625, 2.287841796875, 2.43408203125, 2.580322265625, 2.7265625, 2.872802734375, 3.01904296875, 3.165283203125, 3.3115234375, 3.457763671875, 3.60400390625, 3.750244140625, 3.896484375, 4.042724609375, 4.18896484375, 4.335205078125, 4.4814453125, 4.627685546875, 4.77392578125, 4.920166015625, 5.06640625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 8.0, 25.0, 40.0, 62.0, 108.0, 232.0, 548.0, 2325.0, 71072.0, 4023860.0, 92403.0, 2496.0, 588.0, 220.0, 117.0, 76.0, 28.0, 26.0, 14.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.6875, -20.1640625, -19.640625, -19.1171875, -18.59375, -18.0703125, -17.546875, -17.0234375, -16.5, -15.9765625, -15.453125, -14.9296875, -14.40625, -13.8828125, -13.359375, -12.8359375, -12.3125, -11.7890625, -11.265625, -10.7421875, -10.21875, -9.6953125, -9.171875, -8.6484375, -8.125, -7.6015625, -7.078125, -6.5546875, -6.03125, -5.5078125, -4.984375, -4.4609375, -3.9375, -3.4140625, -2.890625, -2.3671875, -1.84375, -1.3203125, -0.796875, -0.2734375, 0.25, 0.7734375, 1.296875, 1.8203125, 2.34375, 2.8671875, 3.390625, 3.9140625, 4.4375, 4.9609375, 5.484375, 6.0078125, 6.53125, 7.0546875, 7.578125, 8.1015625, 8.625, 9.1484375, 9.671875, 10.1953125, 10.71875, 11.2421875, 11.765625, 12.2890625, 12.8125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 13.0, 26.0, 32.0, 52.0, 91.0, 120.0, 207.0, 301.0, 468.0, 620.0, 613.0, 548.0, 366.0, 223.0, 137.0, 97.0, 50.0, 35.0, 25.0, 13.0, 12.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.0682373046875, -1.986083984375, -1.9039306640625, -1.82177734375, -1.7396240234375, -1.657470703125, -1.5753173828125, -1.4931640625, -1.4110107421875, -1.328857421875, -1.2467041015625, -1.16455078125, -1.0823974609375, -1.000244140625, -0.9180908203125, -0.8359375, -0.7537841796875, -0.671630859375, -0.5894775390625, -0.50732421875, -0.4251708984375, -0.343017578125, -0.2608642578125, -0.1787109375, -0.0965576171875, -0.014404296875, 0.0677490234375, 0.14990234375, 0.2320556640625, 0.314208984375, 0.3963623046875, 0.478515625, 0.5606689453125, 0.642822265625, 0.7249755859375, 0.80712890625, 0.8892822265625, 0.971435546875, 1.0535888671875, 1.1357421875, 1.2178955078125, 1.300048828125, 1.3822021484375, 1.46435546875, 1.5465087890625, 1.628662109375, 1.7108154296875, 1.79296875, 1.8751220703125, 1.957275390625, 2.0394287109375, 2.12158203125, 2.2037353515625, 2.285888671875, 2.3680419921875, 2.4501953125, 2.5323486328125, 2.614501953125, 2.6966552734375, 2.77880859375, 2.8609619140625, 2.943115234375, 3.0252685546875, 3.107421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 9.0, 11.0, 9.0, 21.0, 19.0, 39.0, 38.0, 44.0, 57.0, 58.0, 68.0, 54.0, 79.0, 71.0, 71.0, 50.0, 71.0, 47.0, 37.0, 36.0, 25.0, 19.0, 17.0, 9.0, 11.0, 8.0, 8.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.863565444946289, -3.708813428878784, -3.5540616512298584, -3.3993096351623535, -3.2445576190948486, -3.0898056030273438, -2.935053825378418, -2.780301809310913, -2.625549793243408, -2.4707977771759033, -2.3160459995269775, -2.1612939834594727, -2.0065419673919678, -1.8517900705337524, -1.697038173675537, -1.5422861576080322, -1.3875343799591064, -1.2327824831008911, -1.0780304670333862, -0.9232785701751709, -0.7685266137123108, -0.6137746572494507, -0.45902276039123535, -0.30427074432373047, -0.14951884746551514, 0.005233094096183777, 0.1599850356578827, 0.3147369623184204, 0.4694889187812805, 0.6242408752441406, 0.778992772102356, 0.9337447881698608, 1.0884966850280762, 1.2432485818862915, 1.3980005979537964, 1.5527524948120117, 1.7075045108795166, 1.862256407737732, 2.0170083045959473, 2.171760320663452, 2.326512336730957, 2.481264352798462, 2.6360161304473877, 2.7907681465148926, 2.9455201625823975, 3.1002721786499023, 3.255023956298828, 3.409775972366333, 3.564527750015259, 3.7192797660827637, 3.8740315437316895, 4.028783798217773, 4.183535575866699, 4.338287353515625, 4.493039131164551, 4.647791385650635, 4.8025431632995605, 4.957294940948486, 5.11204719543457, 5.266798973083496, 5.421550750732422, 5.576303005218506, 5.731054782867432, 5.885807037353516, 6.040558815002441]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 8.0, 14.0, 16.0, 11.0, 11.0, 24.0, 17.0, 19.0, 12.0, 22.0, 28.0, 33.0, 41.0, 38.0, 39.0, 38.0, 42.0, 38.0, 47.0, 44.0, 29.0, 44.0, 37.0, 43.0, 27.0, 33.0, 27.0, 33.0, 27.0, 22.0, 21.0, 16.0, 12.0, 11.0, 9.0, 12.0, 7.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.933236837387085, -3.8160433769226074, -3.698850154876709, -3.5816566944122314, -3.464463472366333, -3.3472700119018555, -3.230076789855957, -3.1128833293914795, -2.995689868927002, -2.8784964084625244, -2.761303186416626, -2.6441097259521484, -2.52691650390625, -2.4097230434417725, -2.292529582977295, -2.1753363609313965, -2.058143138885498, -1.94094979763031, -1.823756456375122, -1.7065629959106445, -1.589369773864746, -1.4721763134002686, -1.3549829721450806, -1.2377896308898926, -1.1205962896347046, -1.0034029483795166, -0.8862096071243286, -0.7690162062644958, -0.6518228650093079, -0.5346295237541199, -0.4174361228942871, -0.3002427816390991, -0.18304944038391113, -0.06585608422756195, 0.05133727192878723, 0.1685306429862976, 0.2857239842414856, 0.4029173254966736, 0.5201107263565063, 0.6373040676116943, 0.7544974088668823, 0.8716907501220703, 0.9888840913772583, 1.1060774326324463, 1.2232708930969238, 1.3404641151428223, 1.4576575756072998, 1.5748509168624878, 1.6920442581176758, 1.8092375993728638, 1.9264309406280518, 2.0436244010925293, 2.1608176231384277, 2.2780110836029053, 2.395204544067383, 2.5123977661132812, 2.6295909881591797, 2.7467844486236572, 2.8639776706695557, 2.981171131134033, 3.0983643531799316, 3.215557813644409, 3.3327512741088867, 3.449944496154785, 3.5671379566192627]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 8.0, 5.0, 5.0, 13.0, 12.0, 20.0, 31.0, 35.0, 36.0, 72.0, 88.0, 145.0, 223.0, 303.0, 484.0, 824.0, 1284.0, 2663.0, 7221.0, 33546.0, 242462.0, 599360.0, 129795.0, 19640.0, 5157.0, 2026.0, 1138.0, 643.0, 437.0, 268.0, 170.0, 121.0, 94.0, 44.0, 41.0, 36.0, 23.0, 19.0, 15.0, 8.0, 13.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82763671875, -0.7973709106445312, -0.7671051025390625, -0.7368392944335938, -0.706573486328125, -0.6763076782226562, -0.6460418701171875, -0.6157760620117188, -0.58551025390625, -0.5552444458007812, -0.5249786376953125, -0.49471282958984375, -0.464447021484375, -0.43418121337890625, -0.4039154052734375, -0.37364959716796875, -0.3433837890625, -0.31311798095703125, -0.2828521728515625, -0.25258636474609375, -0.222320556640625, -0.19205474853515625, -0.1617889404296875, -0.13152313232421875, -0.10125732421875, -0.07099151611328125, -0.0407257080078125, -0.01045989990234375, 0.019805908203125, 0.05007171630859375, 0.0803375244140625, 0.11060333251953125, 0.140869140625, 0.17113494873046875, 0.2014007568359375, 0.23166656494140625, 0.261932373046875, 0.29219818115234375, 0.3224639892578125, 0.35272979736328125, 0.38299560546875, 0.41326141357421875, 0.4435272216796875, 0.47379302978515625, 0.504058837890625, 0.5343246459960938, 0.5645904541015625, 0.5948562622070312, 0.6251220703125, 0.6553878784179688, 0.6856536865234375, 0.7159194946289062, 0.746185302734375, 0.7764511108398438, 0.8067169189453125, 0.8369827270507812, 0.86724853515625, 0.8975143432617188, 0.9277801513671875, 0.9580459594726562, 0.988311767578125, 1.0185775756835938, 1.0488433837890625, 1.0791091918945312, 1.109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 9.0, 3.0, 5.0, 8.0, 8.0, 16.0, 15.0, 15.0, 13.0, 18.0, 25.0, 15.0, 24.0, 24.0, 35.0, 36.0, 43.0, 41.0, 46.0, 30.0, 36.0, 48.0, 42.0, 41.0, 45.0, 40.0, 30.0, 38.0, 38.0, 30.0, 21.0, 32.0, 19.0, 12.0, 16.0, 15.0, 10.0, 10.0, 14.0, 6.0, 7.0, 6.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0390625, -1.9647216796875, -1.890380859375, -1.8160400390625, -1.74169921875, -1.6673583984375, -1.593017578125, -1.5186767578125, -1.4443359375, -1.3699951171875, -1.295654296875, -1.2213134765625, -1.14697265625, -1.0726318359375, -0.998291015625, -0.9239501953125, -0.849609375, -0.7752685546875, -0.700927734375, -0.6265869140625, -0.55224609375, -0.4779052734375, -0.403564453125, -0.3292236328125, -0.2548828125, -0.1805419921875, -0.106201171875, -0.0318603515625, 0.04248046875, 0.1168212890625, 0.191162109375, 0.2655029296875, 0.33984375, 0.4141845703125, 0.488525390625, 0.5628662109375, 0.63720703125, 0.7115478515625, 0.785888671875, 0.8602294921875, 0.9345703125, 1.0089111328125, 1.083251953125, 1.1575927734375, 1.23193359375, 1.3062744140625, 1.380615234375, 1.4549560546875, 1.529296875, 1.6036376953125, 1.677978515625, 1.7523193359375, 1.82666015625, 1.9010009765625, 1.975341796875, 2.0496826171875, 2.1240234375, 2.1983642578125, 2.272705078125, 2.3470458984375, 2.42138671875, 2.4957275390625, 2.570068359375, 2.6444091796875, 2.71875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 16.0, 24.0, 38.0, 67.0, 111.0, 237.0, 442.0, 930.0, 1998.0, 4555.0, 10756.0, 26702.0, 64817.0, 155579.0, 292838.0, 268852.0, 130481.0, 53239.0, 21366.0, 8745.0, 3717.0, 1571.0, 735.0, 336.0, 180.0, 84.0, 47.0, 36.0, 15.0, 8.0, 3.0, 2.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.350341796875, -0.3400077819824219, -0.32967376708984375, -0.3193397521972656, -0.3090057373046875, -0.2986717224121094, -0.28833770751953125, -0.2780036926269531, -0.267669677734375, -0.2573356628417969, -0.24700164794921875, -0.23666763305664062, -0.2263336181640625, -0.21599960327148438, -0.20566558837890625, -0.19533157348632812, -0.18499755859375, -0.17466354370117188, -0.16432952880859375, -0.15399551391601562, -0.1436614990234375, -0.13332748413085938, -0.12299346923828125, -0.11265945434570312, -0.102325439453125, -0.09199142456054688, -0.08165740966796875, -0.07132339477539062, -0.0609893798828125, -0.050655364990234375, -0.04032135009765625, -0.029987335205078125, -0.0196533203125, -0.009319305419921875, 0.00101470947265625, 0.011348724365234375, 0.0216827392578125, 0.032016754150390625, 0.04235076904296875, 0.052684783935546875, 0.063018798828125, 0.07335281372070312, 0.08368682861328125, 0.09402084350585938, 0.1043548583984375, 0.11468887329101562, 0.12502288818359375, 0.13535690307617188, 0.14569091796875, 0.15602493286132812, 0.16635894775390625, 0.17669296264648438, 0.1870269775390625, 0.19736099243164062, 0.20769500732421875, 0.21802902221679688, 0.228363037109375, 0.23869705200195312, 0.24903106689453125, 0.2593650817871094, 0.2696990966796875, 0.2800331115722656, 0.29036712646484375, 0.3007011413574219, 0.31103515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 10.0, 5.0, 8.0, 11.0, 14.0, 19.0, 14.0, 19.0, 27.0, 32.0, 41.0, 37.0, 38.0, 42.0, 57.0, 44.0, 59.0, 49.0, 61.0, 59.0, 52.0, 32.0, 28.0, 34.0, 37.0, 27.0, 24.0, 23.0, 22.0, 16.0, 10.0, 8.0, 10.0, 3.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.62109375, -5.455322265625, -5.28955078125, -5.123779296875, -4.9580078125, -4.792236328125, -4.62646484375, -4.460693359375, -4.294921875, -4.129150390625, -3.96337890625, -3.797607421875, -3.6318359375, -3.466064453125, -3.30029296875, -3.134521484375, -2.96875, -2.802978515625, -2.63720703125, -2.471435546875, -2.3056640625, -2.139892578125, -1.97412109375, -1.808349609375, -1.642578125, -1.476806640625, -1.31103515625, -1.145263671875, -0.9794921875, -0.813720703125, -0.64794921875, -0.482177734375, -0.31640625, -0.150634765625, 0.01513671875, 0.180908203125, 0.3466796875, 0.512451171875, 0.67822265625, 0.843994140625, 1.009765625, 1.175537109375, 1.34130859375, 1.507080078125, 1.6728515625, 1.838623046875, 2.00439453125, 2.170166015625, 2.3359375, 2.501708984375, 2.66748046875, 2.833251953125, 2.9990234375, 3.164794921875, 3.33056640625, 3.496337890625, 3.662109375, 3.827880859375, 3.99365234375, 4.159423828125, 4.3251953125, 4.490966796875, 4.65673828125, 4.822509765625, 4.98828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 6.0, 7.0, 3.0, 11.0, 24.0, 29.0, 56.0, 82.0, 120.0, 151.0, 278.0, 489.0, 874.0, 1646.0, 3544.0, 8362.0, 22484.0, 69244.0, 212298.0, 403790.0, 216322.0, 70364.0, 22712.0, 8280.0, 3548.0, 1763.0, 852.0, 447.0, 281.0, 197.0, 100.0, 63.0, 51.0, 29.0, 16.0, 7.0, 8.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039031982421875, -0.03779315948486328, -0.03655433654785156, -0.035315513610839844, -0.034076690673828125, -0.032837867736816406, -0.03159904479980469, -0.03036022186279297, -0.02912139892578125, -0.02788257598876953, -0.026643753051757812, -0.025404930114746094, -0.024166107177734375, -0.022927284240722656, -0.021688461303710938, -0.02044963836669922, -0.0192108154296875, -0.01797199249267578, -0.016733169555664062, -0.015494346618652344, -0.014255523681640625, -0.013016700744628906, -0.011777877807617188, -0.010539054870605469, -0.00930023193359375, -0.008061408996582031, -0.0068225860595703125, -0.005583763122558594, -0.004344940185546875, -0.0031061172485351562, -0.0018672943115234375, -0.0006284713745117188, 0.0006103515625, 0.0018491744995117188, 0.0030879974365234375, 0.004326820373535156, 0.005565643310546875, 0.006804466247558594, 0.008043289184570312, 0.009282112121582031, 0.01052093505859375, 0.011759757995605469, 0.012998580932617188, 0.014237403869628906, 0.015476226806640625, 0.016715049743652344, 0.017953872680664062, 0.01919269561767578, 0.0204315185546875, 0.02167034149169922, 0.022909164428710938, 0.024147987365722656, 0.025386810302734375, 0.026625633239746094, 0.027864456176757812, 0.02910327911376953, 0.03034210205078125, 0.03158092498779297, 0.03281974792480469, 0.034058570861816406, 0.035297393798828125, 0.036536216735839844, 0.03777503967285156, 0.03901386260986328, 0.040252685546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 2.0, 6.0, 8.0, 16.0, 15.0, 19.0, 20.0, 20.0, 18.0, 29.0, 38.0, 34.0, 59.0, 70.0, 61.0, 58.0, 69.0, 71.0, 56.0, 60.0, 40.0, 28.0, 45.0, 35.0, 21.0, 23.0, 10.0, 10.0, 13.0, 9.0, 9.0, 2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7179718017578125e-05, -2.6227906346321106e-05, -2.5276094675064087e-05, -2.4324283003807068e-05, -2.337247133255005e-05, -2.242065966129303e-05, -2.146884799003601e-05, -2.0517036318778992e-05, -1.9565224647521973e-05, -1.8613412976264954e-05, -1.7661601305007935e-05, -1.6709789633750916e-05, -1.5757977962493896e-05, -1.4806166291236877e-05, -1.3854354619979858e-05, -1.290254294872284e-05, -1.195073127746582e-05, -1.0998919606208801e-05, -1.0047107934951782e-05, -9.095296263694763e-06, -8.143484592437744e-06, -7.191672921180725e-06, -6.239861249923706e-06, -5.288049578666687e-06, -4.336237907409668e-06, -3.384426236152649e-06, -2.43261456489563e-06, -1.4808028936386108e-06, -5.289912223815918e-07, 4.2282044887542725e-07, 1.3746321201324463e-06, 2.3264437913894653e-06, 3.2782554626464844e-06, 4.230067133903503e-06, 5.1818788051605225e-06, 6.1336904764175415e-06, 7.0855021476745605e-06, 8.03731381893158e-06, 8.989125490188599e-06, 9.940937161445618e-06, 1.0892748832702637e-05, 1.1844560503959656e-05, 1.2796372175216675e-05, 1.3748183846473694e-05, 1.4699995517730713e-05, 1.5651807188987732e-05, 1.660361886024475e-05, 1.755543053150177e-05, 1.850724220275879e-05, 1.9459053874015808e-05, 2.0410865545272827e-05, 2.1362677216529846e-05, 2.2314488887786865e-05, 2.3266300559043884e-05, 2.4218112230300903e-05, 2.5169923901557922e-05, 2.612173557281494e-05, 2.707354724407196e-05, 2.802535891532898e-05, 2.8977170586586e-05, 2.9928982257843018e-05, 3.088079392910004e-05, 3.1832605600357056e-05, 3.2784417271614075e-05, 3.3736228942871094e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 10.0, 11.0, 19.0, 33.0, 53.0, 107.0, 326.0, 1194.0, 6039.0, 78114.0, 827616.0, 124567.0, 8362.0, 1446.0, 373.0, 139.0, 58.0, 25.0, 10.0, 19.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.10894775390625, -0.10526371002197266, -0.10157966613769531, -0.09789562225341797, -0.09421157836914062, -0.09052753448486328, -0.08684349060058594, -0.0831594467163086, -0.07947540283203125, -0.0757913589477539, -0.07210731506347656, -0.06842327117919922, -0.06473922729492188, -0.06105518341064453, -0.05737113952636719, -0.053687095642089844, -0.0500030517578125, -0.046319007873535156, -0.04263496398925781, -0.03895092010498047, -0.035266876220703125, -0.03158283233642578, -0.027898788452148438, -0.024214744567871094, -0.02053070068359375, -0.016846656799316406, -0.013162612915039062, -0.009478569030761719, -0.005794525146484375, -0.0021104812622070312, 0.0015735626220703125, 0.005257606506347656, 0.008941650390625, 0.012625694274902344, 0.016309738159179688, 0.01999378204345703, 0.023677825927734375, 0.02736186981201172, 0.031045913696289062, 0.034729957580566406, 0.03841400146484375, 0.042098045349121094, 0.04578208923339844, 0.04946613311767578, 0.053150177001953125, 0.05683422088623047, 0.06051826477050781, 0.06420230865478516, 0.0678863525390625, 0.07157039642333984, 0.07525444030761719, 0.07893848419189453, 0.08262252807617188, 0.08630657196044922, 0.08999061584472656, 0.0936746597290039, 0.09735870361328125, 0.1010427474975586, 0.10472679138183594, 0.10841083526611328, 0.11209487915039062, 0.11577892303466797, 0.11946296691894531, 0.12314701080322266, 0.1268310546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 3.0, 4.0, 9.0, 5.0, 8.0, 7.0, 17.0, 19.0, 26.0, 43.0, 66.0, 51.0, 63.0, 103.0, 108.0, 102.0, 103.0, 67.0, 59.0, 34.0, 30.0, 23.0, 12.0, 9.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01279449462890625, -0.012346386909484863, -0.011898279190063477, -0.01145017147064209, -0.011002063751220703, -0.010553956031799316, -0.01010584831237793, -0.009657740592956543, -0.009209632873535156, -0.00876152515411377, -0.008313417434692383, -0.007865309715270996, -0.007417201995849609, -0.006969094276428223, -0.006520986557006836, -0.006072878837585449, -0.0056247711181640625, -0.005176663398742676, -0.004728555679321289, -0.004280447959899902, -0.0038323402404785156, -0.003384232521057129, -0.002936124801635742, -0.0024880170822143555, -0.0020399093627929688, -0.001591801643371582, -0.0011436939239501953, -0.0006955862045288086, -0.0002474784851074219, 0.00020062923431396484, 0.0006487369537353516, 0.0010968446731567383, 0.001544952392578125, 0.0019930601119995117, 0.0024411678314208984, 0.002889275550842285, 0.003337383270263672, 0.0037854909896850586, 0.004233598709106445, 0.004681706428527832, 0.005129814147949219, 0.0055779218673706055, 0.006026029586791992, 0.006474137306213379, 0.006922245025634766, 0.007370352745056152, 0.007818460464477539, 0.008266568183898926, 0.008714675903320312, 0.0091627836227417, 0.009610891342163086, 0.010058999061584473, 0.01050710678100586, 0.010955214500427246, 0.011403322219848633, 0.01185142993927002, 0.012299537658691406, 0.012747645378112793, 0.01319575309753418, 0.013643860816955566, 0.014091968536376953, 0.01454007625579834, 0.014988183975219727, 0.015436291694641113, 0.0158843994140625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 8.0, 2.0, 8.0, 14.0, 17.0, 33.0, 44.0, 43.0, 65.0, 57.0, 69.0, 76.0, 76.0, 78.0, 70.0, 82.0, 61.0, 54.0, 35.0, 29.0, 18.0, 15.0, 14.0, 11.0, 10.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7015740871429443, -2.600919008255005, -2.5002639293670654, -2.399608850479126, -2.2989537715911865, -2.198298692703247, -2.0976436138153076, -1.9969885349273682, -1.8963334560394287, -1.7956783771514893, -1.6950232982635498, -1.5943682193756104, -1.493713140487671, -1.3930580615997314, -1.292402982711792, -1.1917479038238525, -1.0910929441452026, -0.9904378652572632, -0.8897827863693237, -0.7891277074813843, -0.6884726285934448, -0.5878176093101501, -0.4871625304222107, -0.38650745153427124, -0.2858523726463318, -0.18519729375839233, -0.08454222977161407, 0.016112834215164185, 0.11676791310310364, 0.2174229621887207, 0.31807804107666016, 0.4187331199645996, 0.5193881988525391, 0.6200432777404785, 0.720698356628418, 0.8213534355163574, 0.9220085144042969, 1.0226635932922363, 1.1233186721801758, 1.2239737510681152, 1.3246288299560547, 1.4252839088439941, 1.5259389877319336, 1.626594066619873, 1.7272491455078125, 1.827904224395752, 1.9285593032836914, 2.029214382171631, 2.1298694610595703, 2.2305245399475098, 2.331179618835449, 2.4318346977233887, 2.532489776611328, 2.6331448554992676, 2.733799934387207, 2.8344550132751465, 2.935109853744507, 3.0357649326324463, 3.1364200115203857, 3.237075090408325, 3.3377301692962646, 3.438385248184204, 3.5390403270721436, 3.639695405960083, 3.7403504848480225]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 6.0, 6.0, 8.0, 11.0, 11.0, 8.0, 17.0, 16.0, 20.0, 21.0, 23.0, 23.0, 21.0, 42.0, 45.0, 48.0, 47.0, 40.0, 49.0, 58.0, 45.0, 43.0, 43.0, 55.0, 32.0, 39.0, 38.0, 33.0, 28.0, 23.0, 23.0, 14.0, 12.0, 11.0, 12.0, 10.0, 9.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.437103033065796, -2.3552041053771973, -2.2733054161071777, -2.191406488418579, -2.1095077991485596, -2.027608871459961, -1.9457100629806519, -1.8638112545013428, -1.7819124460220337, -1.7000136375427246, -1.6181148290634155, -1.5362160205841064, -1.4543170928955078, -1.3724184036254883, -1.2905194759368896, -1.2086206674575806, -1.1267218589782715, -1.0448230504989624, -0.9629242420196533, -0.8810253739356995, -0.7991265654563904, -0.7172277569770813, -0.6353288888931274, -0.5534300804138184, -0.4715312719345093, -0.3896324634552002, -0.3077336251735687, -0.22583480179309845, -0.14393597841262817, -0.06203716993331909, 0.019861668348312378, 0.10176050662994385, 0.18365931510925293, 0.265558123588562, 0.3474569618701935, 0.42935580015182495, 0.511254608631134, 0.5931534171104431, 0.675052285194397, 0.756951093673706, 0.8388499021530151, 0.9207487106323242, 1.0026475191116333, 1.0845463275909424, 1.166445255279541, 1.2483439445495605, 1.3302428722381592, 1.4121416807174683, 1.4940404891967773, 1.5759392976760864, 1.6578381061553955, 1.7397369146347046, 1.8216357231140137, 1.9035346508026123, 1.9854334592819214, 2.0673322677612305, 2.14923095703125, 2.2311298847198486, 2.313028573989868, 2.394927501678467, 2.4768261909484863, 2.558725118637085, 2.6406238079071045, 2.722522735595703, 2.8044216632843018]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 6.0, 19.0, 16.0, 19.0, 24.0, 35.0, 43.0, 78.0, 116.0, 161.0, 228.0, 389.0, 747.0, 1377.0, 2784.0, 5944.0, 13273.0, 29546.0, 65430.0, 130818.0, 208518.0, 232557.0, 174100.0, 97600.0, 46392.0, 20447.0, 9150.0, 4164.0, 2017.0, 1005.0, 592.0, 320.0, 197.0, 140.0, 88.0, 66.0, 45.0, 40.0, 23.0, 10.0, 9.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.350616455078125, -2.27545166015625, -2.200286865234375, -2.1251220703125, -2.049957275390625, -1.97479248046875, -1.899627685546875, -1.824462890625, -1.749298095703125, -1.67413330078125, -1.598968505859375, -1.5238037109375, -1.448638916015625, -1.37347412109375, -1.298309326171875, -1.22314453125, -1.147979736328125, -1.07281494140625, -0.997650146484375, -0.9224853515625, -0.847320556640625, -0.77215576171875, -0.696990966796875, -0.621826171875, -0.546661376953125, -0.47149658203125, -0.396331787109375, -0.3211669921875, -0.246002197265625, -0.17083740234375, -0.095672607421875, -0.0205078125, 0.054656982421875, 0.12982177734375, 0.204986572265625, 0.2801513671875, 0.355316162109375, 0.43048095703125, 0.505645751953125, 0.580810546875, 0.655975341796875, 0.73114013671875, 0.806304931640625, 0.8814697265625, 0.956634521484375, 1.03179931640625, 1.106964111328125, 1.18212890625, 1.257293701171875, 1.33245849609375, 1.407623291015625, 1.4827880859375, 1.557952880859375, 1.63311767578125, 1.708282470703125, 1.783447265625, 1.858612060546875, 1.93377685546875, 2.008941650390625, 2.0841064453125, 2.159271240234375, 2.23443603515625, 2.309600830078125, 2.384765625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 5.0, 11.0, 6.0, 6.0, 8.0, 11.0, 12.0, 23.0, 26.0, 23.0, 31.0, 26.0, 30.0, 28.0, 43.0, 45.0, 36.0, 42.0, 64.0, 45.0, 38.0, 34.0, 43.0, 52.0, 39.0, 28.0, 42.0, 28.0, 27.0, 16.0, 19.0, 16.0, 19.0, 8.0, 9.0, 12.0, 15.0, 5.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.45703125, -4.32012939453125, -4.1832275390625, -4.04632568359375, -3.909423828125, -3.77252197265625, -3.6356201171875, -3.49871826171875, -3.36181640625, -3.22491455078125, -3.0880126953125, -2.95111083984375, -2.814208984375, -2.67730712890625, -2.5404052734375, -2.40350341796875, -2.2666015625, -2.12969970703125, -1.9927978515625, -1.85589599609375, -1.718994140625, -1.58209228515625, -1.4451904296875, -1.30828857421875, -1.17138671875, -1.03448486328125, -0.8975830078125, -0.76068115234375, -0.623779296875, -0.48687744140625, -0.3499755859375, -0.21307373046875, -0.076171875, 0.06072998046875, 0.1976318359375, 0.33453369140625, 0.471435546875, 0.60833740234375, 0.7452392578125, 0.88214111328125, 1.01904296875, 1.15594482421875, 1.2928466796875, 1.42974853515625, 1.566650390625, 1.70355224609375, 1.8404541015625, 1.97735595703125, 2.1142578125, 2.25115966796875, 2.3880615234375, 2.52496337890625, 2.661865234375, 2.79876708984375, 2.9356689453125, 3.07257080078125, 3.20947265625, 3.34637451171875, 3.4832763671875, 3.62017822265625, 3.757080078125, 3.89398193359375, 4.0308837890625, 4.16778564453125, 4.3046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 7.0, 10.0, 13.0, 15.0, 19.0, 30.0, 34.0, 32.0, 44.0, 60.0, 90.0, 104.0, 124.0, 181.0, 288.0, 357.0, 1455.0, 69769.0, 905483.0, 67573.0, 1425.0, 381.0, 249.0, 195.0, 141.0, 98.0, 86.0, 51.0, 52.0, 33.0, 28.0, 26.0, 22.0, 21.0, 14.0, 7.0, 5.0, 10.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.4609375, -13.05908203125, -12.6572265625, -12.25537109375, -11.853515625, -11.45166015625, -11.0498046875, -10.64794921875, -10.24609375, -9.84423828125, -9.4423828125, -9.04052734375, -8.638671875, -8.23681640625, -7.8349609375, -7.43310546875, -7.03125, -6.62939453125, -6.2275390625, -5.82568359375, -5.423828125, -5.02197265625, -4.6201171875, -4.21826171875, -3.81640625, -3.41455078125, -3.0126953125, -2.61083984375, -2.208984375, -1.80712890625, -1.4052734375, -1.00341796875, -0.6015625, -0.19970703125, 0.2021484375, 0.60400390625, 1.005859375, 1.40771484375, 1.8095703125, 2.21142578125, 2.61328125, 3.01513671875, 3.4169921875, 3.81884765625, 4.220703125, 4.62255859375, 5.0244140625, 5.42626953125, 5.828125, 6.22998046875, 6.6318359375, 7.03369140625, 7.435546875, 7.83740234375, 8.2392578125, 8.64111328125, 9.04296875, 9.44482421875, 9.8466796875, 10.24853515625, 10.650390625, 11.05224609375, 11.4541015625, 11.85595703125, 12.2578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 10.0, 8.0, 7.0, 5.0, 14.0, 17.0, 19.0, 18.0, 16.0, 25.0, 26.0, 23.0, 28.0, 27.0, 37.0, 44.0, 42.0, 32.0, 46.0, 37.0, 45.0, 39.0, 40.0, 42.0, 37.0, 39.0, 34.0, 33.0, 23.0, 26.0, 23.0, 27.0, 15.0, 20.0, 14.0, 6.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-4.4609375, -4.32562255859375, -4.1903076171875, -4.05499267578125, -3.919677734375, -3.78436279296875, -3.6490478515625, -3.51373291015625, -3.37841796875, -3.24310302734375, -3.1077880859375, -2.97247314453125, -2.837158203125, -2.70184326171875, -2.5665283203125, -2.43121337890625, -2.2958984375, -2.16058349609375, -2.0252685546875, -1.88995361328125, -1.754638671875, -1.61932373046875, -1.4840087890625, -1.34869384765625, -1.21337890625, -1.07806396484375, -0.9427490234375, -0.80743408203125, -0.672119140625, -0.53680419921875, -0.4014892578125, -0.26617431640625, -0.130859375, 0.00445556640625, 0.1397705078125, 0.27508544921875, 0.410400390625, 0.54571533203125, 0.6810302734375, 0.81634521484375, 0.95166015625, 1.08697509765625, 1.2222900390625, 1.35760498046875, 1.492919921875, 1.62823486328125, 1.7635498046875, 1.89886474609375, 2.0341796875, 2.16949462890625, 2.3048095703125, 2.44012451171875, 2.575439453125, 2.71075439453125, 2.8460693359375, 2.98138427734375, 3.11669921875, 3.25201416015625, 3.3873291015625, 3.52264404296875, 3.657958984375, 3.79327392578125, 3.9285888671875, 4.06390380859375, 4.19921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 6.0, 8.0, 5.0, 16.0, 25.0, 27.0, 76.0, 159.0, 417.0, 1596.0, 9944.0, 330723.0, 681902.0, 20279.0, 2350.0, 595.0, 201.0, 78.0, 58.0, 29.0, 17.0, 10.0, 9.0, 7.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.29364013671875, -4.1810302734375, -4.06842041015625, -3.955810546875, -3.84320068359375, -3.7305908203125, -3.61798095703125, -3.50537109375, -3.39276123046875, -3.2801513671875, -3.16754150390625, -3.054931640625, -2.94232177734375, -2.8297119140625, -2.71710205078125, -2.6044921875, -2.49188232421875, -2.3792724609375, -2.26666259765625, -2.154052734375, -2.04144287109375, -1.9288330078125, -1.81622314453125, -1.70361328125, -1.59100341796875, -1.4783935546875, -1.36578369140625, -1.253173828125, -1.14056396484375, -1.0279541015625, -0.91534423828125, -0.802734375, -0.69012451171875, -0.5775146484375, -0.46490478515625, -0.352294921875, -0.23968505859375, -0.1270751953125, -0.01446533203125, 0.09814453125, 0.21075439453125, 0.3233642578125, 0.43597412109375, 0.548583984375, 0.66119384765625, 0.7738037109375, 0.88641357421875, 0.9990234375, 1.11163330078125, 1.2242431640625, 1.33685302734375, 1.449462890625, 1.56207275390625, 1.6746826171875, 1.78729248046875, 1.89990234375, 2.01251220703125, 2.1251220703125, 2.23773193359375, 2.350341796875, 2.46295166015625, 2.5755615234375, 2.68817138671875, 2.80078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 7.0, 5.0, 8.0, 13.0, 10.0, 27.0, 34.0, 26.0, 43.0, 46.0, 58.0, 54.0, 89.0, 98.0, 84.0, 70.0, 61.0, 56.0, 51.0, 34.0, 24.0, 28.0, 20.0, 8.0, 11.0, 9.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001609325408935547, -0.00015439093112945557, -0.00014784932136535645, -0.00014130771160125732, -0.0001347661018371582, -0.00012822449207305908, -0.00012168288230895996, -0.00011514127254486084, -0.00010859966278076172, -0.0001020580530166626, -9.551644325256348e-05, -8.897483348846436e-05, -8.243322372436523e-05, -7.589161396026611e-05, -6.935000419616699e-05, -6.280839443206787e-05, -5.626678466796875e-05, -4.972517490386963e-05, -4.318356513977051e-05, -3.664195537567139e-05, -3.0100345611572266e-05, -2.3558735847473145e-05, -1.7017126083374023e-05, -1.0475516319274902e-05, -3.933906555175781e-06, 2.60770320892334e-06, 9.149312973022461e-06, 1.5690922737121582e-05, 2.2232532501220703e-05, 2.8774142265319824e-05, 3.5315752029418945e-05, 4.1857361793518066e-05, 4.839897155761719e-05, 5.494058132171631e-05, 6.148219108581543e-05, 6.802380084991455e-05, 7.456541061401367e-05, 8.110702037811279e-05, 8.764863014221191e-05, 9.419023990631104e-05, 0.00010073184967041016, 0.00010727345943450928, 0.0001138150691986084, 0.00012035667896270752, 0.00012689828872680664, 0.00013343989849090576, 0.00013998150825500488, 0.000146523118019104, 0.00015306472778320312, 0.00015960633754730225, 0.00016614794731140137, 0.0001726895570755005, 0.0001792311668395996, 0.00018577277660369873, 0.00019231438636779785, 0.00019885599613189697, 0.0002053976058959961, 0.00021193921566009521, 0.00021848082542419434, 0.00022502243518829346, 0.00023156404495239258, 0.0002381056547164917, 0.0002446472644805908, 0.00025118887424468994, 0.00025773048400878906]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 13.0, 13.0, 23.0, 52.0, 68.0, 133.0, 266.0, 784.0, 5965.0, 252716.0, 769338.0, 16916.0, 1482.0, 359.0, 170.0, 91.0, 47.0, 36.0, 26.0, 12.0, 9.0, 12.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.47076416015625, -4.3399658203125, -4.20916748046875, -4.078369140625, -3.94757080078125, -3.8167724609375, -3.68597412109375, -3.55517578125, -3.42437744140625, -3.2935791015625, -3.16278076171875, -3.031982421875, -2.90118408203125, -2.7703857421875, -2.63958740234375, -2.5087890625, -2.37799072265625, -2.2471923828125, -2.11639404296875, -1.985595703125, -1.85479736328125, -1.7239990234375, -1.59320068359375, -1.46240234375, -1.33160400390625, -1.2008056640625, -1.07000732421875, -0.939208984375, -0.80841064453125, -0.6776123046875, -0.54681396484375, -0.416015625, -0.28521728515625, -0.1544189453125, -0.02362060546875, 0.107177734375, 0.23797607421875, 0.3687744140625, 0.49957275390625, 0.63037109375, 0.76116943359375, 0.8919677734375, 1.02276611328125, 1.153564453125, 1.28436279296875, 1.4151611328125, 1.54595947265625, 1.6767578125, 1.80755615234375, 1.9383544921875, 2.06915283203125, 2.199951171875, 2.33074951171875, 2.4615478515625, 2.59234619140625, 2.72314453125, 2.85394287109375, 2.9847412109375, 3.11553955078125, 3.246337890625, 3.37713623046875, 3.5079345703125, 3.63873291015625, 3.76953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 13.0, 8.0, 14.0, 20.0, 29.0, 32.0, 47.0, 71.0, 79.0, 92.0, 127.0, 105.0, 90.0, 64.0, 60.0, 36.0, 32.0, 18.0, 13.0, 14.0, 13.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75146484375, -0.724365234375, -0.697265625, -0.670166015625, -0.64306640625, -0.615966796875, -0.5888671875, -0.561767578125, -0.53466796875, -0.507568359375, -0.48046875, -0.453369140625, -0.42626953125, -0.399169921875, -0.3720703125, -0.344970703125, -0.31787109375, -0.290771484375, -0.263671875, -0.236572265625, -0.20947265625, -0.182373046875, -0.1552734375, -0.128173828125, -0.10107421875, -0.073974609375, -0.046875, -0.019775390625, 0.00732421875, 0.034423828125, 0.0615234375, 0.088623046875, 0.11572265625, 0.142822265625, 0.169921875, 0.197021484375, 0.22412109375, 0.251220703125, 0.2783203125, 0.305419921875, 0.33251953125, 0.359619140625, 0.38671875, 0.413818359375, 0.44091796875, 0.468017578125, 0.4951171875, 0.522216796875, 0.54931640625, 0.576416015625, 0.603515625, 0.630615234375, 0.65771484375, 0.684814453125, 0.7119140625, 0.739013671875, 0.76611328125, 0.793212890625, 0.8203125, 0.847412109375, 0.87451171875, 0.901611328125, 0.9287109375, 0.955810546875, 0.98291015625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 9.0, 23.0, 114.0, 246.0, 285.0, 212.0, 92.0, 25.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25889253616333, -4.43889856338501, -3.6189045906066895, -2.79891037940979, -1.9789164066314697, -1.1589221954345703, -0.33892822265625, 0.4810657501220703, 1.3010597229003906, 2.121053695678711, 2.9410476684570312, 3.7610418796539307, 4.581035614013672, 5.40103006362915, 6.221024036407471, 7.041018009185791, 7.861011981964111, 8.68100643157959, 9.50100040435791, 10.32099437713623, 11.14098834991455, 11.960982322692871, 12.780976295471191, 13.600970268249512, 14.420964241027832, 15.240958213806152, 16.06095314025879, 16.88094711303711, 17.70094108581543, 18.52093505859375, 19.34092903137207, 20.16092300415039, 20.98091697692871, 21.80091094970703, 22.62090492248535, 23.440898895263672, 24.260892868041992, 25.080886840820312, 25.900880813598633, 26.720874786376953, 27.540868759155273, 28.360862731933594, 29.180856704711914, 30.000850677490234, 30.820844650268555, 31.640838623046875, 32.46083450317383, 33.280826568603516, 34.10082244873047, 34.92081832885742, 35.74081039428711, 36.56080627441406, 37.38079833984375, 38.2007942199707, 39.02078628540039, 39.840782165527344, 40.66077423095703, 41.480770111083984, 42.30076217651367, 43.120758056640625, 43.94075012207031, 44.760746002197266, 45.58073806762695, 46.400733947753906, 47.220726013183594]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 8.0, 4.0, 11.0, 12.0, 12.0, 18.0, 19.0, 16.0, 23.0, 26.0, 28.0, 36.0, 33.0, 42.0, 31.0, 45.0, 35.0, 51.0, 41.0, 44.0, 36.0, 37.0, 35.0, 38.0, 30.0, 36.0, 28.0, 31.0, 26.0, 14.0, 23.0, 21.0, 15.0, 17.0, 14.0, 14.0, 8.0, 9.0, 7.0, 7.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.469315052032471, -7.248369216918945, -7.027422904968262, -6.806477069854736, -6.585530757904053, -6.364584922790527, -6.143638610839844, -5.922692775726318, -5.701746940612793, -5.480801105499268, -5.259854793548584, -5.038908958435059, -4.817962646484375, -4.59701681137085, -4.376070976257324, -4.155124664306641, -3.934178352355957, -3.7132322788238525, -3.492286205291748, -3.2713403701782227, -3.050394058227539, -2.8294482231140137, -2.608502149581909, -2.3875560760498047, -2.1666100025177, -1.9456639289855957, -1.7247178554534912, -1.5037719011306763, -1.2828258275985718, -1.0618797540664673, -0.8409337997436523, -0.6199877262115479, -0.39904212951660156, -0.17809608578681946, 0.042849957942962646, 0.26379597187042236, 0.48474204540252686, 0.7056881189346313, 0.9266340732574463, 1.1475801467895508, 1.3685262203216553, 1.5894722938537598, 1.8104183673858643, 2.0313644409179688, 2.252310276031494, 2.4732565879821777, 2.694202423095703, 2.9151484966278076, 3.136094570159912, 3.3570406436920166, 3.577986717224121, 3.7989325523376465, 4.01987886428833, 4.2408246994018555, 4.461771011352539, 4.6827168464660645, 4.90366268157959, 5.124608516693115, 5.345554828643799, 5.566500663757324, 5.787446975708008, 6.008392810821533, 6.229338645935059, 6.450284957885742, 6.671231269836426]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 4.0, 7.0, 9.0, 13.0, 24.0, 31.0, 44.0, 69.0, 89.0, 129.0, 209.0, 350.0, 634.0, 2007.0, 16902.0, 366914.0, 2888807.0, 871576.0, 40217.0, 3601.0, 1046.0, 561.0, 334.0, 223.0, 146.0, 109.0, 85.0, 46.0, 33.0, 22.0, 15.0, 11.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6640625, -9.3768310546875, -9.089599609375, -8.8023681640625, -8.51513671875, -8.2279052734375, -7.940673828125, -7.6534423828125, -7.3662109375, -7.0789794921875, -6.791748046875, -6.5045166015625, -6.21728515625, -5.9300537109375, -5.642822265625, -5.3555908203125, -5.068359375, -4.7811279296875, -4.493896484375, -4.2066650390625, -3.91943359375, -3.6322021484375, -3.344970703125, -3.0577392578125, -2.7705078125, -2.4832763671875, -2.196044921875, -1.9088134765625, -1.62158203125, -1.3343505859375, -1.047119140625, -0.7598876953125, -0.47265625, -0.1854248046875, 0.101806640625, 0.3890380859375, 0.67626953125, 0.9635009765625, 1.250732421875, 1.5379638671875, 1.8251953125, 2.1124267578125, 2.399658203125, 2.6868896484375, 2.97412109375, 3.2613525390625, 3.548583984375, 3.8358154296875, 4.123046875, 4.4102783203125, 4.697509765625, 4.9847412109375, 5.27197265625, 5.5592041015625, 5.846435546875, 6.1336669921875, 6.4208984375, 6.7081298828125, 6.995361328125, 7.2825927734375, 7.56982421875, 7.8570556640625, 8.144287109375, 8.4315185546875, 8.71875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 11.0, 14.0, 17.0, 14.0, 21.0, 27.0, 36.0, 46.0, 62.0, 62.0, 74.0, 61.0, 77.0, 78.0, 63.0, 66.0, 53.0, 34.0, 43.0, 44.0, 32.0, 21.0, 16.0, 13.0, 5.0, 5.0, 5.0, 7.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.046875, -7.867034912109375, -7.68719482421875, -7.507354736328125, -7.3275146484375, -7.147674560546875, -6.96783447265625, -6.787994384765625, -6.608154296875, -6.428314208984375, -6.24847412109375, -6.068634033203125, -5.8887939453125, -5.708953857421875, -5.52911376953125, -5.349273681640625, -5.16943359375, -4.989593505859375, -4.80975341796875, -4.629913330078125, -4.4500732421875, -4.270233154296875, -4.09039306640625, -3.910552978515625, -3.730712890625, -3.550872802734375, -3.37103271484375, -3.191192626953125, -3.0113525390625, -2.831512451171875, -2.65167236328125, -2.471832275390625, -2.2919921875, -2.112152099609375, -1.93231201171875, -1.752471923828125, -1.5726318359375, -1.392791748046875, -1.21295166015625, -1.033111572265625, -0.853271484375, -0.673431396484375, -0.49359130859375, -0.313751220703125, -0.1339111328125, 0.045928955078125, 0.22576904296875, 0.405609130859375, 0.58544921875, 0.765289306640625, 0.94512939453125, 1.124969482421875, 1.3048095703125, 1.484649658203125, 1.66448974609375, 1.844329833984375, 2.024169921875, 2.204010009765625, 2.38385009765625, 2.563690185546875, 2.7435302734375, 2.923370361328125, 3.10321044921875, 3.283050537109375, 3.462890625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 12.0, 18.0, 28.0, 38.0, 73.0, 225.0, 930.0, 2108384.0, 2083182.0, 991.0, 194.0, 89.0, 55.0, 32.0, 11.0, 15.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.765625, -20.556396484375, -19.34716796875, -18.137939453125, -16.9287109375, -15.719482421875, -14.51025390625, -13.301025390625, -12.091796875, -10.882568359375, -9.67333984375, -8.464111328125, -7.2548828125, -6.045654296875, -4.83642578125, -3.627197265625, -2.41796875, -1.208740234375, 0.00048828125, 1.209716796875, 2.4189453125, 3.628173828125, 4.83740234375, 6.046630859375, 7.255859375, 8.465087890625, 9.67431640625, 10.883544921875, 12.0927734375, 13.302001953125, 14.51123046875, 15.720458984375, 16.9296875, 18.138916015625, 19.34814453125, 20.557373046875, 21.7666015625, 22.975830078125, 24.18505859375, 25.394287109375, 26.603515625, 27.812744140625, 29.02197265625, 30.231201171875, 31.4404296875, 32.649658203125, 33.85888671875, 35.068115234375, 36.27734375, 37.486572265625, 38.69580078125, 39.905029296875, 41.1142578125, 42.323486328125, 43.53271484375, 44.741943359375, 45.951171875, 47.160400390625, 48.36962890625, 49.578857421875, 50.7880859375, 51.997314453125, 53.20654296875, 54.415771484375, 55.625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 2.0, 5.0, 9.0, 14.0, 18.0, 16.0, 24.0, 45.0, 55.0, 70.0, 105.0, 133.0, 181.0, 263.0, 350.0, 416.0, 451.0, 416.0, 384.0, 325.0, 214.0, 157.0, 127.0, 89.0, 64.0, 36.0, 29.0, 26.0, 12.0, 7.0, 13.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7080078125, -1.65582275390625, -1.6036376953125, -1.55145263671875, -1.499267578125, -1.44708251953125, -1.3948974609375, -1.34271240234375, -1.29052734375, -1.23834228515625, -1.1861572265625, -1.13397216796875, -1.081787109375, -1.02960205078125, -0.9774169921875, -0.92523193359375, -0.873046875, -0.82086181640625, -0.7686767578125, -0.71649169921875, -0.664306640625, -0.61212158203125, -0.5599365234375, -0.50775146484375, -0.45556640625, -0.40338134765625, -0.3511962890625, -0.29901123046875, -0.246826171875, -0.19464111328125, -0.1424560546875, -0.09027099609375, -0.0380859375, 0.01409912109375, 0.0662841796875, 0.11846923828125, 0.170654296875, 0.22283935546875, 0.2750244140625, 0.32720947265625, 0.37939453125, 0.43157958984375, 0.4837646484375, 0.53594970703125, 0.588134765625, 0.64031982421875, 0.6925048828125, 0.74468994140625, 0.796875, 0.84906005859375, 0.9012451171875, 0.95343017578125, 1.005615234375, 1.05780029296875, 1.1099853515625, 1.16217041015625, 1.21435546875, 1.26654052734375, 1.3187255859375, 1.37091064453125, 1.423095703125, 1.47528076171875, 1.5274658203125, 1.57965087890625, 1.6318359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 14.0, 24.0, 30.0, 46.0, 79.0, 74.0, 88.0, 103.0, 111.0, 104.0, 86.0, 69.0, 63.0, 40.0, 28.0, 18.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1759796142578125, -3.9374821186065674, -3.6989846229553223, -3.460486888885498, -3.221989393234253, -2.983491897583008, -2.7449941635131836, -2.5064966678619385, -2.2679991722106934, -2.0295016765594482, -1.7910040616989136, -1.552506446838379, -1.3140089511871338, -1.0755114555358887, -0.837013840675354, -0.5985162258148193, -0.3600187301635742, -0.12152117490768433, 0.11697638034820557, 0.35547393560409546, 0.5939714908599854, 0.8324689865112305, 1.0709666013717651, 1.3094642162322998, 1.547961711883545, 1.78645920753479, 2.024956703186035, 2.2634544372558594, 2.5019519329071045, 2.7404494285583496, 2.978947162628174, 3.217444658279419, 3.455942153930664, 3.694439649581909, 3.9329371452331543, 4.1714348793029785, 4.4099321365356445, 4.648429870605469, 4.886927604675293, 5.125425338745117, 5.363922595977783, 5.602420330047607, 5.840917587280273, 6.079415321350098, 6.317913055419922, 6.556410312652588, 6.794908046722412, 7.033405303955078, 7.271903038024902, 7.510400772094727, 7.748898029327393, 7.987395763397217, 8.225893020629883, 8.464390754699707, 8.702888488769531, 8.941386222839355, 9.17988395690918, 9.418381690979004, 9.656879425048828, 9.895376205444336, 10.13387393951416, 10.372371673583984, 10.610869407653809, 10.849367141723633, 11.08786392211914]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 6.0, 13.0, 18.0, 12.0, 17.0, 16.0, 18.0, 17.0, 19.0, 32.0, 30.0, 35.0, 47.0, 43.0, 51.0, 46.0, 40.0, 48.0, 36.0, 42.0, 38.0, 31.0, 44.0, 41.0, 27.0, 18.0, 25.0, 25.0, 27.0, 23.0, 13.0, 16.0, 13.0, 10.0, 8.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.050779342651367, -3.934265375137329, -3.817751407623291, -3.701237440109253, -3.584723472595215, -3.4682095050811768, -3.3516955375671387, -3.2351813316345215, -3.1186676025390625, -3.0021536350250244, -2.8856396675109863, -2.7691256999969482, -2.65261173248291, -2.536097764968872, -2.419583797454834, -2.303069591522217, -2.1865556240081787, -2.0700416564941406, -1.9535276889801025, -1.8370137214660645, -1.7204997539520264, -1.6039857864379883, -1.4874716997146606, -1.3709577322006226, -1.2544437646865845, -1.1379297971725464, -1.0214158296585083, -0.9049018025398254, -0.7883878350257874, -0.6718738675117493, -0.5553598403930664, -0.4388458728790283, -0.32233166694641113, -0.20581768453121185, -0.08930370211601257, 0.0272102952003479, 0.143724262714386, 0.2602382302284241, 0.37675225734710693, 0.493266224861145, 0.6097801923751831, 0.7262941598892212, 0.8428081274032593, 0.9593221545219421, 1.075836181640625, 1.192350149154663, 1.3088641166687012, 1.4253780841827393, 1.5418920516967773, 1.6584060192108154, 1.7749199867248535, 1.8914339542388916, 2.0079479217529297, 2.1244618892669678, 2.240975856781006, 2.357490062713623, 2.474003791809082, 2.59051775932312, 2.707031726837158, 2.8235456943511963, 2.9400596618652344, 3.0565736293792725, 3.1730875968933105, 3.2896018028259277, 3.406115770339966]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 12.0, 17.0, 31.0, 65.0, 99.0, 169.0, 318.0, 612.0, 1488.0, 6178.0, 49490.0, 478298.0, 456484.0, 46643.0, 5836.0, 1473.0, 608.0, 310.0, 176.0, 92.0, 64.0, 29.0, 25.0, 12.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.0610504150390625, -1.024444580078125, -0.9878387451171875, -0.95123291015625, -0.9146270751953125, -0.878021240234375, -0.8414154052734375, -0.8048095703125, -0.7682037353515625, -0.731597900390625, -0.6949920654296875, -0.65838623046875, -0.6217803955078125, -0.585174560546875, -0.5485687255859375, -0.511962890625, -0.4753570556640625, -0.438751220703125, -0.4021453857421875, -0.36553955078125, -0.3289337158203125, -0.292327880859375, -0.2557220458984375, -0.2191162109375, -0.1825103759765625, -0.145904541015625, -0.1092987060546875, -0.07269287109375, -0.0360870361328125, 0.000518798828125, 0.0371246337890625, 0.07373046875, 0.1103363037109375, 0.146942138671875, 0.1835479736328125, 0.22015380859375, 0.2567596435546875, 0.293365478515625, 0.3299713134765625, 0.3665771484375, 0.4031829833984375, 0.439788818359375, 0.4763946533203125, 0.51300048828125, 0.5496063232421875, 0.586212158203125, 0.6228179931640625, 0.659423828125, 0.6960296630859375, 0.732635498046875, 0.7692413330078125, 0.80584716796875, 0.8424530029296875, 0.879058837890625, 0.9156646728515625, 0.9522705078125, 0.9888763427734375, 1.025482177734375, 1.0620880126953125, 1.09869384765625, 1.1352996826171875, 1.171905517578125, 1.2085113525390625, 1.2451171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 3.0, 6.0, 12.0, 11.0, 18.0, 30.0, 33.0, 37.0, 38.0, 60.0, 65.0, 76.0, 75.0, 80.0, 81.0, 86.0, 53.0, 63.0, 34.0, 37.0, 31.0, 23.0, 15.0, 13.0, 9.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.773651123046875, -5.63714599609375, -5.500640869140625, -5.3641357421875, -5.227630615234375, -5.09112548828125, -4.954620361328125, -4.818115234375, -4.681610107421875, -4.54510498046875, -4.408599853515625, -4.2720947265625, -4.135589599609375, -3.99908447265625, -3.862579345703125, -3.72607421875, -3.589569091796875, -3.45306396484375, -3.316558837890625, -3.1800537109375, -3.043548583984375, -2.90704345703125, -2.770538330078125, -2.634033203125, -2.497528076171875, -2.36102294921875, -2.224517822265625, -2.0880126953125, -1.951507568359375, -1.81500244140625, -1.678497314453125, -1.5419921875, -1.405487060546875, -1.26898193359375, -1.132476806640625, -0.9959716796875, -0.859466552734375, -0.72296142578125, -0.586456298828125, -0.449951171875, -0.313446044921875, -0.17694091796875, -0.040435791015625, 0.0960693359375, 0.232574462890625, 0.36907958984375, 0.505584716796875, 0.64208984375, 0.778594970703125, 0.91510009765625, 1.051605224609375, 1.1881103515625, 1.324615478515625, 1.46112060546875, 1.597625732421875, 1.734130859375, 1.870635986328125, 2.00714111328125, 2.143646240234375, 2.2801513671875, 2.416656494140625, 2.55316162109375, 2.689666748046875, 2.826171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 12.0, 15.0, 16.0, 19.0, 52.0, 88.0, 105.0, 227.0, 403.0, 796.0, 1544.0, 3172.0, 6496.0, 13622.0, 27769.0, 56594.0, 109379.0, 187046.0, 235290.0, 186051.0, 108793.0, 56561.0, 27845.0, 13463.0, 6491.0, 3234.0, 1644.0, 820.0, 451.0, 184.0, 124.0, 71.0, 46.0, 39.0, 28.0, 14.0, 13.0, 5.0, 6.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.2526092529296875, -0.243743896484375, -0.2348785400390625, -0.22601318359375, -0.2171478271484375, -0.208282470703125, -0.1994171142578125, -0.1905517578125, -0.1816864013671875, -0.172821044921875, -0.1639556884765625, -0.15509033203125, -0.1462249755859375, -0.137359619140625, -0.1284942626953125, -0.11962890625, -0.1107635498046875, -0.101898193359375, -0.0930328369140625, -0.08416748046875, -0.0753021240234375, -0.066436767578125, -0.0575714111328125, -0.0487060546875, -0.0398406982421875, -0.030975341796875, -0.0221099853515625, -0.01324462890625, -0.0043792724609375, 0.004486083984375, 0.0133514404296875, 0.022216796875, 0.0310821533203125, 0.039947509765625, 0.0488128662109375, 0.05767822265625, 0.0665435791015625, 0.075408935546875, 0.0842742919921875, 0.0931396484375, 0.1020050048828125, 0.110870361328125, 0.1197357177734375, 0.12860107421875, 0.1374664306640625, 0.146331787109375, 0.1551971435546875, 0.1640625, 0.1729278564453125, 0.181793212890625, 0.1906585693359375, 0.19952392578125, 0.2083892822265625, 0.217254638671875, 0.2261199951171875, 0.2349853515625, 0.2438507080078125, 0.252716064453125, 0.2615814208984375, 0.27044677734375, 0.2793121337890625, 0.288177490234375, 0.2970428466796875, 0.305908203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 7.0, 9.0, 10.0, 16.0, 10.0, 15.0, 30.0, 14.0, 17.0, 26.0, 26.0, 43.0, 25.0, 39.0, 41.0, 35.0, 41.0, 53.0, 50.0, 42.0, 37.0, 47.0, 40.0, 38.0, 34.0, 27.0, 26.0, 34.0, 18.0, 26.0, 17.0, 16.0, 19.0, 21.0, 7.0, 4.0, 9.0, 1.0, 7.0, 2.0, 3.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3984375, -4.2484130859375, -4.098388671875, -3.9483642578125, -3.79833984375, -3.6483154296875, -3.498291015625, -3.3482666015625, -3.1982421875, -3.0482177734375, -2.898193359375, -2.7481689453125, -2.59814453125, -2.4481201171875, -2.298095703125, -2.1480712890625, -1.998046875, -1.8480224609375, -1.697998046875, -1.5479736328125, -1.39794921875, -1.2479248046875, -1.097900390625, -0.9478759765625, -0.7978515625, -0.6478271484375, -0.497802734375, -0.3477783203125, -0.19775390625, -0.0477294921875, 0.102294921875, 0.2523193359375, 0.40234375, 0.5523681640625, 0.702392578125, 0.8524169921875, 1.00244140625, 1.1524658203125, 1.302490234375, 1.4525146484375, 1.6025390625, 1.7525634765625, 1.902587890625, 2.0526123046875, 2.20263671875, 2.3526611328125, 2.502685546875, 2.6527099609375, 2.802734375, 2.9527587890625, 3.102783203125, 3.2528076171875, 3.40283203125, 3.5528564453125, 3.702880859375, 3.8529052734375, 4.0029296875, 4.1529541015625, 4.302978515625, 4.4530029296875, 4.60302734375, 4.7530517578125, 4.903076171875, 5.0531005859375, 5.203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 20.0, 26.0, 24.0, 54.0, 75.0, 137.0, 238.0, 380.0, 710.0, 1497.0, 3748.0, 9701.0, 28239.0, 92407.0, 279020.0, 382900.0, 170681.0, 51898.0, 16361.0, 5794.0, 2286.0, 1098.0, 530.0, 294.0, 172.0, 96.0, 59.0, 51.0, 18.0, 13.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0489501953125, -0.04738426208496094, -0.045818328857421875, -0.04425239562988281, -0.04268646240234375, -0.04112052917480469, -0.039554595947265625, -0.03798866271972656, -0.0364227294921875, -0.03485679626464844, -0.033290863037109375, -0.03172492980957031, -0.03015899658203125, -0.028593063354492188, -0.027027130126953125, -0.025461196899414062, -0.023895263671875, -0.022329330444335938, -0.020763397216796875, -0.019197463989257812, -0.01763153076171875, -0.016065597534179688, -0.014499664306640625, -0.012933731079101562, -0.0113677978515625, -0.009801864624023438, -0.008235931396484375, -0.0066699981689453125, -0.00510406494140625, -0.0035381317138671875, -0.001972198486328125, -0.0004062652587890625, 0.00115966796875, 0.0027256011962890625, 0.004291534423828125, 0.0058574676513671875, 0.00742340087890625, 0.008989334106445312, 0.010555267333984375, 0.012121200561523438, 0.0136871337890625, 0.015253067016601562, 0.016819000244140625, 0.018384933471679688, 0.01995086669921875, 0.021516799926757812, 0.023082733154296875, 0.024648666381835938, 0.026214599609375, 0.027780532836914062, 0.029346466064453125, 0.030912399291992188, 0.03247833251953125, 0.03404426574707031, 0.035610198974609375, 0.03717613220214844, 0.0387420654296875, 0.04030799865722656, 0.041873931884765625, 0.04343986511230469, 0.04500579833984375, 0.04657173156738281, 0.048137664794921875, 0.04970359802246094, 0.05126953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 11.0, 17.0, 16.0, 39.0, 42.0, 56.0, 65.0, 83.0, 84.0, 87.0, 98.0, 88.0, 70.0, 54.0, 43.0, 36.0, 36.0, 17.0, 20.0, 8.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.054473876953125e-05, -4.8780813813209534e-05, -4.701688885688782e-05, -4.52529639005661e-05, -4.3489038944244385e-05, -4.172511398792267e-05, -3.996118903160095e-05, -3.8197264075279236e-05, -3.643333911895752e-05, -3.46694141626358e-05, -3.290548920631409e-05, -3.114156424999237e-05, -2.9377639293670654e-05, -2.7613714337348938e-05, -2.584978938102722e-05, -2.4085864424705505e-05, -2.232193946838379e-05, -2.0558014512062073e-05, -1.8794089555740356e-05, -1.703016459941864e-05, -1.5266239643096924e-05, -1.3502314686775208e-05, -1.1738389730453491e-05, -9.974464774131775e-06, -8.210539817810059e-06, -6.446614861488342e-06, -4.682689905166626e-06, -2.9187649488449097e-06, -1.1548399925231934e-06, 6.09084963798523e-07, 2.3730099201202393e-06, 4.1369348764419556e-06, 5.900859832763672e-06, 7.664784789085388e-06, 9.428709745407104e-06, 1.119263470172882e-05, 1.2956559658050537e-05, 1.4720484614372253e-05, 1.648440957069397e-05, 1.8248334527015686e-05, 2.0012259483337402e-05, 2.177618443965912e-05, 2.3540109395980835e-05, 2.530403435230255e-05, 2.7067959308624268e-05, 2.8831884264945984e-05, 3.05958092212677e-05, 3.2359734177589417e-05, 3.412365913391113e-05, 3.588758409023285e-05, 3.7651509046554565e-05, 3.941543400287628e-05, 4.1179358959198e-05, 4.2943283915519714e-05, 4.470720887184143e-05, 4.647113382816315e-05, 4.823505878448486e-05, 4.999898374080658e-05, 5.1762908697128296e-05, 5.352683365345001e-05, 5.529075860977173e-05, 5.7054683566093445e-05, 5.881860852241516e-05, 6.058253347873688e-05, 6.23464584350586e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 9.0, 5.0, 7.0, 8.0, 4.0, 13.0, 18.0, 24.0, 38.0, 47.0, 78.0, 167.0, 351.0, 965.0, 3419.0, 14156.0, 76432.0, 420964.0, 433414.0, 78923.0, 14418.0, 3317.0, 960.0, 374.0, 174.0, 83.0, 42.0, 48.0, 20.0, 27.0, 17.0, 13.0, 9.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060791015625, -0.05854034423828125, -0.0562896728515625, -0.05403900146484375, -0.051788330078125, -0.04953765869140625, -0.0472869873046875, -0.04503631591796875, -0.04278564453125, -0.04053497314453125, -0.0382843017578125, -0.03603363037109375, -0.033782958984375, -0.03153228759765625, -0.0292816162109375, -0.02703094482421875, -0.0247802734375, -0.02252960205078125, -0.0202789306640625, -0.01802825927734375, -0.015777587890625, -0.01352691650390625, -0.0112762451171875, -0.00902557373046875, -0.00677490234375, -0.00452423095703125, -0.0022735595703125, -2.288818359375e-05, 0.002227783203125, 0.00447845458984375, 0.0067291259765625, 0.00897979736328125, 0.01123046875, 0.01348114013671875, 0.0157318115234375, 0.01798248291015625, 0.020233154296875, 0.02248382568359375, 0.0247344970703125, 0.02698516845703125, 0.02923583984375, 0.03148651123046875, 0.0337371826171875, 0.03598785400390625, 0.038238525390625, 0.04048919677734375, 0.0427398681640625, 0.04499053955078125, 0.0472412109375, 0.04949188232421875, 0.0517425537109375, 0.05399322509765625, 0.056243896484375, 0.05849456787109375, 0.0607452392578125, 0.06299591064453125, 0.06524658203125, 0.06749725341796875, 0.0697479248046875, 0.07199859619140625, 0.074249267578125, 0.07649993896484375, 0.0787506103515625, 0.08100128173828125, 0.083251953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 11.0, 7.0, 6.0, 16.0, 10.0, 30.0, 23.0, 28.0, 55.0, 61.0, 60.0, 69.0, 80.0, 70.0, 67.0, 80.0, 72.0, 59.0, 45.0, 35.0, 24.0, 20.0, 16.0, 18.0, 5.0, 8.0, 1.0, 9.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01520538330078125, -0.014799952507019043, -0.014394521713256836, -0.013989090919494629, -0.013583660125732422, -0.013178229331970215, -0.012772798538208008, -0.0123673677444458, -0.011961936950683594, -0.011556506156921387, -0.01115107536315918, -0.010745644569396973, -0.010340213775634766, -0.009934782981872559, -0.009529352188110352, -0.009123921394348145, -0.008718490600585938, -0.00831305980682373, -0.007907629013061523, -0.007502198219299316, -0.007096767425537109, -0.006691336631774902, -0.006285905838012695, -0.005880475044250488, -0.005475044250488281, -0.005069613456726074, -0.004664182662963867, -0.00425875186920166, -0.003853321075439453, -0.003447890281677246, -0.003042459487915039, -0.002637028694152832, -0.002231597900390625, -0.001826167106628418, -0.001420736312866211, -0.001015305519104004, -0.0006098747253417969, -0.00020444393157958984, 0.0002009868621826172, 0.0006064176559448242, 0.0010118484497070312, 0.0014172792434692383, 0.0018227100372314453, 0.0022281408309936523, 0.0026335716247558594, 0.0030390024185180664, 0.0034444332122802734, 0.0038498640060424805, 0.0042552947998046875, 0.0046607255935668945, 0.0050661563873291016, 0.005471587181091309, 0.005877017974853516, 0.006282448768615723, 0.00668787956237793, 0.007093310356140137, 0.007498741149902344, 0.00790417194366455, 0.008309602737426758, 0.008715033531188965, 0.009120464324951172, 0.009525895118713379, 0.009931325912475586, 0.010336756706237793, 0.0107421875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 14.0, 85.0, 201.0, 316.0, 253.0, 101.0, 29.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.79278564453125, -2.374638080596924, -1.956490397453308, -1.5383427143096924, -1.1201951503753662, -0.70204758644104, -0.28389978408813477, 0.1342477798461914, 0.5523953437805176, 0.9705429673194885, 1.3886905908584595, 1.8068382740020752, 2.2249858379364014, 2.6431334018707275, 3.061281204223633, 3.479428768157959, 3.897576332092285, 4.315723896026611, 4.7338714599609375, 5.152019500732422, 5.57016658782959, 5.988314628601074, 6.4064621925354, 6.824609756469727, 7.242757320404053, 7.660904884338379, 8.079052925109863, 8.497200012207031, 8.915348052978516, 9.333495140075684, 9.751643180847168, 10.169790267944336, 10.58793830871582, 11.006086349487305, 11.424233436584473, 11.842381477355957, 12.260528564453125, 12.67867660522461, 13.096824645996094, 13.514971733093262, 13.93311882019043, 14.351266860961914, 14.769413948059082, 15.187561988830566, 15.605709075927734, 16.02385711669922, 16.442005157470703, 16.860153198242188, 17.278301239013672, 17.696449279785156, 18.11459732055664, 18.532743453979492, 18.950891494750977, 19.36903953552246, 19.787187576293945, 20.205333709716797, 20.62348175048828, 21.041629791259766, 21.45977783203125, 21.8779239654541, 22.296072006225586, 22.71422004699707, 23.132368087768555, 23.550514221191406, 23.96866226196289]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 18.0, 16.0, 9.0, 17.0, 21.0, 16.0, 24.0, 21.0, 33.0, 24.0, 49.0, 46.0, 57.0, 42.0, 50.0, 45.0, 46.0, 47.0, 33.0, 37.0, 51.0, 33.0, 35.0, 24.0, 26.0, 29.0, 23.0, 17.0, 17.0, 12.0, 15.0, 5.0, 10.0, 3.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-2.7195491790771484, -2.641597270965576, -2.563645362854004, -2.4856932163238525, -2.4077413082122803, -2.329789400100708, -2.2518374919891357, -2.1738855838775635, -2.095933437347412, -2.01798152923584, -1.940029501914978, -1.8620775938034058, -1.784125566482544, -1.7061736583709717, -1.6282217502593994, -1.5502698421478271, -1.4723179340362549, -1.3943660259246826, -1.3164139986038208, -1.2384620904922485, -1.1605100631713867, -1.0825581550598145, -1.0046062469482422, -0.9266542792320251, -0.8487023115158081, -0.7707503437995911, -0.692798376083374, -0.6148464679718018, -0.5368945002555847, -0.4589425325393677, -0.380990594625473, -0.30303865671157837, -0.22508645057678223, -0.14713449776172638, -0.06918254494667053, 0.008769407868385315, 0.08672136068344116, 0.1646733283996582, 0.24262526631355286, 0.3205772042274475, 0.39852917194366455, 0.4764811396598816, 0.5544331073760986, 0.6323850154876709, 0.7103369832038879, 0.788288950920105, 0.8662408590316772, 0.9441928267478943, 1.0221447944641113, 1.1000967025756836, 1.1780487298965454, 1.2560006380081177, 1.3339526653289795, 1.4119045734405518, 1.489856481552124, 1.5678083896636963, 1.645760416984558, 1.7237123250961304, 1.8016643524169922, 1.8796162605285645, 1.9575681686401367, 2.035520076751709, 2.1134722232818604, 2.1914241313934326, 2.269376039505005]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 8.0, 7.0, 4.0, 15.0, 13.0, 12.0, 16.0, 11.0, 11.0, 36.0, 43.0, 61.0, 114.0, 190.0, 368.0, 998.0, 3058.0, 10724.0, 41871.0, 142467.0, 318792.0, 323152.0, 146873.0, 43375.0, 11205.0, 3166.0, 1004.0, 382.0, 199.0, 108.0, 59.0, 40.0, 35.0, 24.0, 30.0, 12.0, 8.0, 12.0, 5.0, 8.0, 10.0, 5.0, 4.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.501953125, -3.3890380859375, -3.276123046875, -3.1632080078125, -3.05029296875, -2.9373779296875, -2.824462890625, -2.7115478515625, -2.5986328125, -2.4857177734375, -2.372802734375, -2.2598876953125, -2.14697265625, -2.0340576171875, -1.921142578125, -1.8082275390625, -1.6953125, -1.5823974609375, -1.469482421875, -1.3565673828125, -1.24365234375, -1.1307373046875, -1.017822265625, -0.9049072265625, -0.7919921875, -0.6790771484375, -0.566162109375, -0.4532470703125, -0.34033203125, -0.2274169921875, -0.114501953125, -0.0015869140625, 0.111328125, 0.2242431640625, 0.337158203125, 0.4500732421875, 0.56298828125, 0.6759033203125, 0.788818359375, 0.9017333984375, 1.0146484375, 1.1275634765625, 1.240478515625, 1.3533935546875, 1.46630859375, 1.5792236328125, 1.692138671875, 1.8050537109375, 1.91796875, 2.0308837890625, 2.143798828125, 2.2567138671875, 2.36962890625, 2.4825439453125, 2.595458984375, 2.7083740234375, 2.8212890625, 2.9342041015625, 3.047119140625, 3.1600341796875, 3.27294921875, 3.3858642578125, 3.498779296875, 3.6116943359375, 3.724609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 9.0, 10.0, 9.0, 15.0, 12.0, 15.0, 14.0, 16.0, 17.0, 26.0, 34.0, 32.0, 39.0, 42.0, 42.0, 50.0, 45.0, 45.0, 46.0, 45.0, 51.0, 37.0, 38.0, 42.0, 26.0, 40.0, 40.0, 24.0, 30.0, 14.0, 17.0, 13.0, 20.0, 6.0, 9.0, 8.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-5.07421875, -4.93170166015625, -4.7891845703125, -4.64666748046875, -4.504150390625, -4.36163330078125, -4.2191162109375, -4.07659912109375, -3.93408203125, -3.79156494140625, -3.6490478515625, -3.50653076171875, -3.364013671875, -3.22149658203125, -3.0789794921875, -2.93646240234375, -2.7939453125, -2.65142822265625, -2.5089111328125, -2.36639404296875, -2.223876953125, -2.08135986328125, -1.9388427734375, -1.79632568359375, -1.65380859375, -1.51129150390625, -1.3687744140625, -1.22625732421875, -1.083740234375, -0.94122314453125, -0.7987060546875, -0.65618896484375, -0.513671875, -0.37115478515625, -0.2286376953125, -0.08612060546875, 0.056396484375, 0.19891357421875, 0.3414306640625, 0.48394775390625, 0.62646484375, 0.76898193359375, 0.9114990234375, 1.05401611328125, 1.196533203125, 1.33905029296875, 1.4815673828125, 1.62408447265625, 1.7666015625, 1.90911865234375, 2.0516357421875, 2.19415283203125, 2.336669921875, 2.47918701171875, 2.6217041015625, 2.76422119140625, 2.90673828125, 3.04925537109375, 3.1917724609375, 3.33428955078125, 3.476806640625, 3.61932373046875, 3.7618408203125, 3.90435791015625, 4.046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 20.0, 20.0, 28.0, 37.0, 58.0, 67.0, 92.0, 151.0, 173.0, 265.0, 371.0, 633.0, 8902.0, 555674.0, 473334.0, 6785.0, 613.0, 346.0, 266.0, 212.0, 138.0, 102.0, 72.0, 56.0, 36.0, 16.0, 16.0, 9.0, 14.0, 13.0, 4.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.0545654296875, -9.695068359375, -9.3355712890625, -8.97607421875, -8.6165771484375, -8.257080078125, -7.8975830078125, -7.5380859375, -7.1785888671875, -6.819091796875, -6.4595947265625, -6.10009765625, -5.7406005859375, -5.381103515625, -5.0216064453125, -4.662109375, -4.3026123046875, -3.943115234375, -3.5836181640625, -3.22412109375, -2.8646240234375, -2.505126953125, -2.1456298828125, -1.7861328125, -1.4266357421875, -1.067138671875, -0.7076416015625, -0.34814453125, 0.0113525390625, 0.370849609375, 0.7303466796875, 1.08984375, 1.4493408203125, 1.808837890625, 2.1683349609375, 2.52783203125, 2.8873291015625, 3.246826171875, 3.6063232421875, 3.9658203125, 4.3253173828125, 4.684814453125, 5.0443115234375, 5.40380859375, 5.7633056640625, 6.122802734375, 6.4822998046875, 6.841796875, 7.2012939453125, 7.560791015625, 7.9202880859375, 8.27978515625, 8.6392822265625, 8.998779296875, 9.3582763671875, 9.7177734375, 10.0772705078125, 10.436767578125, 10.7962646484375, 11.15576171875, 11.5152587890625, 11.874755859375, 12.2342529296875, 12.59375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 8.0, 5.0, 6.0, 10.0, 15.0, 13.0, 19.0, 18.0, 20.0, 24.0, 36.0, 27.0, 48.0, 32.0, 54.0, 34.0, 52.0, 33.0, 45.0, 58.0, 48.0, 44.0, 49.0, 41.0, 36.0, 36.0, 34.0, 31.0, 14.0, 20.0, 17.0, 20.0, 9.0, 7.0, 5.0, 10.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.78033447265625, -4.6270751953125, -4.47381591796875, -4.320556640625, -4.16729736328125, -4.0140380859375, -3.86077880859375, -3.70751953125, -3.55426025390625, -3.4010009765625, -3.24774169921875, -3.094482421875, -2.94122314453125, -2.7879638671875, -2.63470458984375, -2.4814453125, -2.32818603515625, -2.1749267578125, -2.02166748046875, -1.868408203125, -1.71514892578125, -1.5618896484375, -1.40863037109375, -1.25537109375, -1.10211181640625, -0.9488525390625, -0.79559326171875, -0.642333984375, -0.48907470703125, -0.3358154296875, -0.18255615234375, -0.029296875, 0.12396240234375, 0.2772216796875, 0.43048095703125, 0.583740234375, 0.73699951171875, 0.8902587890625, 1.04351806640625, 1.19677734375, 1.35003662109375, 1.5032958984375, 1.65655517578125, 1.809814453125, 1.96307373046875, 2.1163330078125, 2.26959228515625, 2.4228515625, 2.57611083984375, 2.7293701171875, 2.88262939453125, 3.035888671875, 3.18914794921875, 3.3424072265625, 3.49566650390625, 3.64892578125, 3.80218505859375, 3.9554443359375, 4.10870361328125, 4.261962890625, 4.41522216796875, 4.5684814453125, 4.72174072265625, 4.875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 7.0, 18.0, 18.0, 47.0, 64.0, 122.0, 359.0, 1595.0, 19694.0, 948362.0, 74586.0, 2848.0, 473.0, 149.0, 80.0, 44.0, 16.0, 13.0, 11.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.84765625, -4.6944580078125, -4.541259765625, -4.3880615234375, -4.23486328125, -4.0816650390625, -3.928466796875, -3.7752685546875, -3.6220703125, -3.4688720703125, -3.315673828125, -3.1624755859375, -3.00927734375, -2.8560791015625, -2.702880859375, -2.5496826171875, -2.396484375, -2.2432861328125, -2.090087890625, -1.9368896484375, -1.78369140625, -1.6304931640625, -1.477294921875, -1.3240966796875, -1.1708984375, -1.0177001953125, -0.864501953125, -0.7113037109375, -0.55810546875, -0.4049072265625, -0.251708984375, -0.0985107421875, 0.0546875, 0.2078857421875, 0.361083984375, 0.5142822265625, 0.66748046875, 0.8206787109375, 0.973876953125, 1.1270751953125, 1.2802734375, 1.4334716796875, 1.586669921875, 1.7398681640625, 1.89306640625, 2.0462646484375, 2.199462890625, 2.3526611328125, 2.505859375, 2.6590576171875, 2.812255859375, 2.9654541015625, 3.11865234375, 3.2718505859375, 3.425048828125, 3.5782470703125, 3.7314453125, 3.8846435546875, 4.037841796875, 4.1910400390625, 4.34423828125, 4.4974365234375, 4.650634765625, 4.8038330078125, 4.95703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 6.0, 8.0, 11.0, 21.0, 40.0, 41.0, 75.0, 109.0, 114.0, 146.0, 126.0, 94.0, 68.0, 53.0, 38.0, 19.0, 14.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002390146255493164, -0.0002278406172990799, -0.00021666660904884338, -0.00020549260079860687, -0.00019431859254837036, -0.00018314458429813385, -0.00017197057604789734, -0.00016079656779766083, -0.00014962255954742432, -0.0001384485512971878, -0.0001272745430469513, -0.00011610053479671478, -0.00010492652654647827, -9.375251829624176e-05, -8.257851004600525e-05, -7.140450179576874e-05, -6.0230493545532227e-05, -4.9056485295295715e-05, -3.7882477045059204e-05, -2.6708468794822693e-05, -1.553446054458618e-05, -4.36045229434967e-06, 6.813555955886841e-06, 1.7987564206123352e-05, 2.9161572456359863e-05, 4.0335580706596375e-05, 5.1509588956832886e-05, 6.26835972070694e-05, 7.385760545730591e-05, 8.503161370754242e-05, 9.620562195777893e-05, 0.00010737963020801544, 0.00011855363845825195, 0.00012972764670848846, 0.00014090165495872498, 0.0001520756632089615, 0.000163249671459198, 0.0001744236797094345, 0.00018559768795967102, 0.00019677169620990753, 0.00020794570446014404, 0.00021911971271038055, 0.00023029372096061707, 0.00024146772921085358, 0.0002526417374610901, 0.0002638157457113266, 0.0002749897539615631, 0.0002861637622117996, 0.00029733777046203613, 0.00030851177871227264, 0.00031968578696250916, 0.00033085979521274567, 0.0003420338034629822, 0.0003532078117132187, 0.0003643818199634552, 0.0003755558282136917, 0.0003867298364639282, 0.00039790384471416473, 0.00040907785296440125, 0.00042025186121463776, 0.00043142586946487427, 0.0004425998777151108, 0.0004537738859653473, 0.0004649478942155838, 0.0004761219024658203]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 7.0, 8.0, 5.0, 12.0, 21.0, 30.0, 60.0, 117.0, 347.0, 2137.0, 93644.0, 942515.0, 8408.0, 804.0, 227.0, 85.0, 48.0, 24.0, 9.0, 7.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.79296875, -7.5892333984375, -7.385498046875, -7.1817626953125, -6.97802734375, -6.7742919921875, -6.570556640625, -6.3668212890625, -6.1630859375, -5.9593505859375, -5.755615234375, -5.5518798828125, -5.34814453125, -5.1444091796875, -4.940673828125, -4.7369384765625, -4.533203125, -4.3294677734375, -4.125732421875, -3.9219970703125, -3.71826171875, -3.5145263671875, -3.310791015625, -3.1070556640625, -2.9033203125, -2.6995849609375, -2.495849609375, -2.2921142578125, -2.08837890625, -1.8846435546875, -1.680908203125, -1.4771728515625, -1.2734375, -1.0697021484375, -0.865966796875, -0.6622314453125, -0.45849609375, -0.2547607421875, -0.051025390625, 0.1527099609375, 0.3564453125, 0.5601806640625, 0.763916015625, 0.9676513671875, 1.17138671875, 1.3751220703125, 1.578857421875, 1.7825927734375, 1.986328125, 2.1900634765625, 2.393798828125, 2.5975341796875, 2.80126953125, 3.0050048828125, 3.208740234375, 3.4124755859375, 3.6162109375, 3.8199462890625, 4.023681640625, 4.2274169921875, 4.43115234375, 4.6348876953125, 4.838623046875, 5.0423583984375, 5.24609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 8.0, 17.0, 17.0, 50.0, 71.0, 107.0, 126.0, 136.0, 138.0, 102.0, 89.0, 44.0, 32.0, 14.0, 11.0, 9.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95263671875, -0.9155654907226562, -0.8784942626953125, -0.8414230346679688, -0.804351806640625, -0.7672805786132812, -0.7302093505859375, -0.6931381225585938, -0.65606689453125, -0.6189956665039062, -0.5819244384765625, -0.5448532104492188, -0.507781982421875, -0.47071075439453125, -0.4336395263671875, -0.39656829833984375, -0.3594970703125, -0.32242584228515625, -0.2853546142578125, -0.24828338623046875, -0.211212158203125, -0.17414093017578125, -0.1370697021484375, -0.09999847412109375, -0.06292724609375, -0.02585601806640625, 0.0112152099609375, 0.04828643798828125, 0.085357666015625, 0.12242889404296875, 0.1595001220703125, 0.19657135009765625, 0.233642578125, 0.27071380615234375, 0.3077850341796875, 0.34485626220703125, 0.381927490234375, 0.41899871826171875, 0.4560699462890625, 0.49314117431640625, 0.53021240234375, 0.5672836303710938, 0.6043548583984375, 0.6414260864257812, 0.678497314453125, 0.7155685424804688, 0.7526397705078125, 0.7897109985351562, 0.8267822265625, 0.8638534545898438, 0.9009246826171875, 0.9379959106445312, 0.975067138671875, 1.0121383666992188, 1.0492095947265625, 1.0862808227539062, 1.12335205078125, 1.1604232788085938, 1.1974945068359375, 1.2345657348632812, 1.271636962890625, 1.3087081909179688, 1.3457794189453125, 1.3828506469726562, 1.419921875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 3.0, 10.0, 14.0, 35.0, 39.0, 51.0, 59.0, 84.0, 76.0, 97.0, 122.0, 110.0, 87.0, 60.0, 45.0, 39.0, 25.0, 13.0, 10.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.805922031402588, -5.532161712646484, -5.258401870727539, -4.9846415519714355, -4.710881233215332, -4.437121391296387, -4.163361072540283, -3.8896007537841797, -3.6158406734466553, -3.342080593109131, -3.0683202743530273, -2.794560194015503, -2.5208001136779785, -2.247039794921875, -1.9732797145843506, -1.6995195150375366, -1.4257593154907227, -1.1519991159439087, -0.8782389760017395, -0.6044788360595703, -0.33071863651275635, -0.05695843696594238, 0.21680164337158203, 0.490561842918396, 0.76432204246521, 1.038082242012024, 1.311842441558838, 1.5856025218963623, 1.8593627214431763, 2.1331229209899902, 2.4068830013275146, 2.680643081665039, 2.9544029235839844, 3.228163003921509, 3.5019233226776123, 3.7756834030151367, 4.04944372177124, 4.323204040527344, 4.596963882446289, 4.870724201202393, 5.144484519958496, 5.4182448387146, 5.692004680633545, 5.965764999389648, 6.239525318145752, 6.5132856369018555, 6.787045478820801, 7.060805797576904, 7.33456563949585, 7.608325958251953, 7.882085800170898, 8.155845642089844, 8.429606437683105, 8.70336627960205, 8.977127075195312, 9.250886917114258, 9.524646759033203, 9.798406600952148, 10.07216739654541, 10.345927238464355, 10.6196870803833, 10.893447875976562, 11.167207717895508, 11.440967559814453, 11.714728355407715]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 11.0, 9.0, 11.0, 23.0, 6.0, 21.0, 29.0, 21.0, 18.0, 13.0, 25.0, 32.0, 42.0, 39.0, 34.0, 45.0, 40.0, 38.0, 35.0, 39.0, 41.0, 45.0, 30.0, 40.0, 30.0, 45.0, 26.0, 26.0, 23.0, 13.0, 23.0, 16.0, 10.0, 11.0, 13.0, 11.0, 6.0, 8.0, 9.0, 1.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 5.0], "bins": [-8.248883247375488, -8.016459465026855, -7.7840352058410645, -7.551611423492432, -7.319187641143799, -7.086763381958008, -6.854339599609375, -6.621915817260742, -6.389492034912109, -6.157068252563477, -5.9246439933776855, -5.692220211029053, -5.45979642868042, -5.227372169494629, -4.994948387145996, -4.762524604797363, -4.530100345611572, -4.2976765632629395, -4.065252304077148, -3.8328285217285156, -3.600404739379883, -3.367980718612671, -3.135556697845459, -2.903132915496826, -2.6707088947296143, -2.4382848739624023, -2.2058610916137695, -1.9734370708465576, -1.7410131692886353, -1.508589267730713, -1.276165246963501, -1.0437413454055786, -0.811316967010498, -0.5788930654525757, -0.34646910429000854, -0.1140451431274414, 0.11837875843048096, 0.3508026599884033, 0.5832266807556152, 0.8156505823135376, 1.04807448387146, 1.2804983854293823, 1.5129222869873047, 1.7453463077545166, 1.977770209312439, 2.2101941108703613, 2.4426181316375732, 2.675042152404785, 2.907465934753418, 3.13988995552063, 3.3723137378692627, 3.6047377586364746, 3.8371615409851074, 4.069585800170898, 4.302009582519531, 4.534433364868164, 4.766857147216797, 4.99928092956543, 5.231705188751221, 5.4641289710998535, 5.696552753448486, 5.928977012634277, 6.16140079498291, 6.393824577331543, 6.626248836517334]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 14.0, 10.0, 18.0, 28.0, 25.0, 57.0, 77.0, 127.0, 232.0, 513.0, 3912.0, 359990.0, 3683113.0, 141741.0, 2897.0, 711.0, 342.0, 193.0, 109.0, 57.0, 42.0, 20.0, 25.0, 8.0, 5.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0], "bins": [-19.765625, -19.330322265625, -18.89501953125, -18.459716796875, -18.0244140625, -17.589111328125, -17.15380859375, -16.718505859375, -16.283203125, -15.847900390625, -15.41259765625, -14.977294921875, -14.5419921875, -14.106689453125, -13.67138671875, -13.236083984375, -12.80078125, -12.365478515625, -11.93017578125, -11.494873046875, -11.0595703125, -10.624267578125, -10.18896484375, -9.753662109375, -9.318359375, -8.883056640625, -8.44775390625, -8.012451171875, -7.5771484375, -7.141845703125, -6.70654296875, -6.271240234375, -5.8359375, -5.400634765625, -4.96533203125, -4.530029296875, -4.0947265625, -3.659423828125, -3.22412109375, -2.788818359375, -2.353515625, -1.918212890625, -1.48291015625, -1.047607421875, -0.6123046875, -0.177001953125, 0.25830078125, 0.693603515625, 1.12890625, 1.564208984375, 1.99951171875, 2.434814453125, 2.8701171875, 3.305419921875, 3.74072265625, 4.176025390625, 4.611328125, 5.046630859375, 5.48193359375, 5.917236328125, 6.3525390625, 6.787841796875, 7.22314453125, 7.658447265625, 8.09375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 9.0, 7.0, 5.0, 7.0, 9.0, 21.0, 23.0, 26.0, 24.0, 34.0, 45.0, 33.0, 48.0, 57.0, 59.0, 70.0, 72.0, 62.0, 64.0, 43.0, 49.0, 50.0, 42.0, 26.0, 26.0, 22.0, 17.0, 14.0, 12.0, 14.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0625, -5.908203125, -5.75390625, -5.599609375, -5.4453125, -5.291015625, -5.13671875, -4.982421875, -4.828125, -4.673828125, -4.51953125, -4.365234375, -4.2109375, -4.056640625, -3.90234375, -3.748046875, -3.59375, -3.439453125, -3.28515625, -3.130859375, -2.9765625, -2.822265625, -2.66796875, -2.513671875, -2.359375, -2.205078125, -2.05078125, -1.896484375, -1.7421875, -1.587890625, -1.43359375, -1.279296875, -1.125, -0.970703125, -0.81640625, -0.662109375, -0.5078125, -0.353515625, -0.19921875, -0.044921875, 0.109375, 0.263671875, 0.41796875, 0.572265625, 0.7265625, 0.880859375, 1.03515625, 1.189453125, 1.34375, 1.498046875, 1.65234375, 1.806640625, 1.9609375, 2.115234375, 2.26953125, 2.423828125, 2.578125, 2.732421875, 2.88671875, 3.041015625, 3.1953125, 3.349609375, 3.50390625, 3.658203125, 3.8125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 3.0, 3.0, 9.0, 9.0, 18.0, 17.0, 32.0, 44.0, 68.0, 80.0, 107.0, 185.0, 260.0, 506.0, 931.0, 2050.0, 9821.0, 196047.0, 3545134.0, 419405.0, 14613.0, 2520.0, 1030.0, 501.0, 327.0, 170.0, 105.0, 75.0, 58.0, 44.0, 32.0, 22.0, 15.0, 13.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.2421875, -7.9813232421875, -7.720458984375, -7.4595947265625, -7.19873046875, -6.9378662109375, -6.677001953125, -6.4161376953125, -6.1552734375, -5.8944091796875, -5.633544921875, -5.3726806640625, -5.11181640625, -4.8509521484375, -4.590087890625, -4.3292236328125, -4.068359375, -3.8074951171875, -3.546630859375, -3.2857666015625, -3.02490234375, -2.7640380859375, -2.503173828125, -2.2423095703125, -1.9814453125, -1.7205810546875, -1.459716796875, -1.1988525390625, -0.93798828125, -0.6771240234375, -0.416259765625, -0.1553955078125, 0.10546875, 0.3663330078125, 0.627197265625, 0.8880615234375, 1.14892578125, 1.4097900390625, 1.670654296875, 1.9315185546875, 2.1923828125, 2.4532470703125, 2.714111328125, 2.9749755859375, 3.23583984375, 3.4967041015625, 3.757568359375, 4.0184326171875, 4.279296875, 4.5401611328125, 4.801025390625, 5.0618896484375, 5.32275390625, 5.5836181640625, 5.844482421875, 6.1053466796875, 6.3662109375, 6.6270751953125, 6.887939453125, 7.1488037109375, 7.40966796875, 7.6705322265625, 7.931396484375, 8.1922607421875, 8.453125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 6.0, 10.0, 16.0, 14.0, 30.0, 47.0, 70.0, 97.0, 150.0, 206.0, 317.0, 379.0, 530.0, 570.0, 466.0, 379.0, 253.0, 156.0, 126.0, 71.0, 58.0, 43.0, 28.0, 13.0, 13.0, 13.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2783203125, -1.2208404541015625, -1.163360595703125, -1.1058807373046875, -1.04840087890625, -0.9909210205078125, -0.933441162109375, -0.8759613037109375, -0.8184814453125, -0.7610015869140625, -0.703521728515625, -0.6460418701171875, -0.58856201171875, -0.5310821533203125, -0.473602294921875, -0.4161224365234375, -0.358642578125, -0.3011627197265625, -0.243682861328125, -0.1862030029296875, -0.12872314453125, -0.0712432861328125, -0.013763427734375, 0.0437164306640625, 0.1011962890625, 0.1586761474609375, 0.216156005859375, 0.2736358642578125, 0.33111572265625, 0.3885955810546875, 0.446075439453125, 0.5035552978515625, 0.56103515625, 0.6185150146484375, 0.675994873046875, 0.7334747314453125, 0.79095458984375, 0.8484344482421875, 0.905914306640625, 0.9633941650390625, 1.0208740234375, 1.0783538818359375, 1.135833740234375, 1.1933135986328125, 1.25079345703125, 1.3082733154296875, 1.365753173828125, 1.4232330322265625, 1.480712890625, 1.5381927490234375, 1.595672607421875, 1.6531524658203125, 1.71063232421875, 1.7681121826171875, 1.825592041015625, 1.8830718994140625, 1.9405517578125, 1.9980316162109375, 2.055511474609375, 2.1129913330078125, 2.17047119140625, 2.2279510498046875, 2.285430908203125, 2.3429107666015625, 2.400390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 20.0, 31.0, 60.0, 86.0, 89.0, 125.0, 139.0, 111.0, 94.0, 86.0, 61.0, 40.0, 31.0, 8.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033071041107178, -6.758542537689209, -6.484014511108398, -6.20948600769043, -5.934957981109619, -5.66042947769165, -5.38590145111084, -5.111372947692871, -4.836844444274902, -4.562315940856934, -4.287787914276123, -4.013259410858154, -3.7387313842773438, -3.464202880859375, -3.1896746158599854, -2.9151463508605957, -2.640618324279785, -2.3660900592803955, -2.091561794281006, -1.8170334100723267, -1.542505145072937, -1.2679768800735474, -0.9934484958648682, -0.7189202308654785, -0.44439196586608887, -0.16986367106437683, 0.1046646237373352, 0.37919294834136963, 0.6537212133407593, 0.9282494783401489, 1.2027778625488281, 1.4773061275482178, 1.7518348693847656, 2.0263631343841553, 2.300891399383545, 2.5754199028015137, 2.849947929382324, 3.124476432800293, 3.3990046977996826, 3.6735329627990723, 3.948061227798462, 4.222589492797852, 4.49711799621582, 4.771646022796631, 5.0461745262146, 5.32070255279541, 5.595231056213379, 5.869759559631348, 6.144287586212158, 6.418816089630127, 6.6933441162109375, 6.967872619628906, 7.242400646209717, 7.5169291496276855, 7.791457176208496, 8.065985679626465, 8.340514183044434, 8.615042686462402, 8.889571189880371, 9.164098739624023, 9.438627243041992, 9.713155746459961, 9.98768424987793, 10.262212753295898, 10.53674030303955]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 3.0, 9.0, 7.0, 2.0, 7.0, 15.0, 14.0, 16.0, 13.0, 19.0, 16.0, 16.0, 21.0, 25.0, 31.0, 25.0, 28.0, 27.0, 35.0, 38.0, 36.0, 39.0, 34.0, 34.0, 34.0, 18.0, 35.0, 43.0, 31.0, 38.0, 33.0, 29.0, 25.0, 31.0, 18.0, 23.0, 18.0, 19.0, 16.0, 11.0, 9.0, 9.0, 5.0, 5.0, 10.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0], "bins": [-3.432600975036621, -3.331881523132324, -3.2311620712280273, -3.1304426193237305, -3.0297231674194336, -2.9290037155151367, -2.828284502029419, -2.727565050125122, -2.626845598220825, -2.5261261463165283, -2.4254066944122314, -2.3246872425079346, -2.223968029022217, -2.12324857711792, -2.022529125213623, -1.9218096733093262, -1.8210902214050293, -1.7203707695007324, -1.6196513175964355, -1.5189319849014282, -1.4182125329971313, -1.3174930810928345, -1.2167737483978271, -1.1160542964935303, -1.0153348445892334, -0.9146153926849365, -0.8138960003852844, -0.7131766080856323, -0.6124571561813354, -0.5117377042770386, -0.4110183119773865, -0.3102989196777344, -0.2095797061920166, -0.10886028409004211, -0.008140861988067627, 0.09257856011390686, 0.19329798221588135, 0.2940174341201782, 0.3947368264198303, 0.4954562187194824, 0.5961756706237793, 0.6968951225280762, 0.7976145148277283, 0.8983339071273804, 0.9990533590316772, 1.0997728109359741, 1.2004921436309814, 1.3012115955352783, 1.4019310474395752, 1.502650499343872, 1.603369951248169, 1.7040892839431763, 1.8048087358474731, 1.90552818775177, 2.0062475204467773, 2.106966972351074, 2.207686424255371, 2.308405876159668, 2.409125328063965, 2.5098447799682617, 2.6105642318725586, 2.7112836837768555, 2.8120028972625732, 2.91272234916687, 3.013441801071167]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 2.0, 7.0, 14.0, 28.0, 43.0, 80.0, 100.0, 185.0, 324.0, 576.0, 1086.0, 2150.0, 4710.0, 11937.0, 36129.0, 114216.0, 300709.0, 348361.0, 152107.0, 48701.0, 15747.0, 5897.0, 2580.0, 1207.0, 660.0, 391.0, 229.0, 123.0, 88.0, 54.0, 31.0, 32.0, 13.0, 16.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6083984375, -0.5894622802734375, -0.570526123046875, -0.5515899658203125, -0.53265380859375, -0.5137176513671875, -0.494781494140625, -0.4758453369140625, -0.4569091796875, -0.4379730224609375, -0.419036865234375, -0.4001007080078125, -0.38116455078125, -0.3622283935546875, -0.343292236328125, -0.3243560791015625, -0.305419921875, -0.2864837646484375, -0.267547607421875, -0.2486114501953125, -0.22967529296875, -0.2107391357421875, -0.191802978515625, -0.1728668212890625, -0.1539306640625, -0.1349945068359375, -0.116058349609375, -0.0971221923828125, -0.07818603515625, -0.0592498779296875, -0.040313720703125, -0.0213775634765625, -0.00244140625, 0.0164947509765625, 0.035430908203125, 0.0543670654296875, 0.07330322265625, 0.0922393798828125, 0.111175537109375, 0.1301116943359375, 0.1490478515625, 0.1679840087890625, 0.186920166015625, 0.2058563232421875, 0.22479248046875, 0.2437286376953125, 0.262664794921875, 0.2816009521484375, 0.300537109375, 0.3194732666015625, 0.338409423828125, 0.3573455810546875, 0.37628173828125, 0.3952178955078125, 0.414154052734375, 0.4330902099609375, 0.4520263671875, 0.4709625244140625, 0.489898681640625, 0.5088348388671875, 0.52777099609375, 0.5467071533203125, 0.565643310546875, 0.5845794677734375, 0.603515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 10.0, 12.0, 16.0, 17.0, 16.0, 15.0, 21.0, 31.0, 36.0, 43.0, 43.0, 42.0, 55.0, 41.0, 54.0, 57.0, 38.0, 43.0, 49.0, 50.0, 46.0, 42.0, 29.0, 35.0, 35.0, 27.0, 21.0, 10.0, 11.0, 9.0, 12.0, 4.0, 6.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0], "bins": [-4.0625, -3.959930419921875, -3.85736083984375, -3.754791259765625, -3.6522216796875, -3.549652099609375, -3.44708251953125, -3.344512939453125, -3.241943359375, -3.139373779296875, -3.03680419921875, -2.934234619140625, -2.8316650390625, -2.729095458984375, -2.62652587890625, -2.523956298828125, -2.42138671875, -2.318817138671875, -2.21624755859375, -2.113677978515625, -2.0111083984375, -1.908538818359375, -1.80596923828125, -1.703399658203125, -1.600830078125, -1.498260498046875, -1.39569091796875, -1.293121337890625, -1.1905517578125, -1.087982177734375, -0.98541259765625, -0.882843017578125, -0.7802734375, -0.677703857421875, -0.57513427734375, -0.472564697265625, -0.3699951171875, -0.267425537109375, -0.16485595703125, -0.062286376953125, 0.040283203125, 0.142852783203125, 0.24542236328125, 0.347991943359375, 0.4505615234375, 0.553131103515625, 0.65570068359375, 0.758270263671875, 0.86083984375, 0.963409423828125, 1.06597900390625, 1.168548583984375, 1.2711181640625, 1.373687744140625, 1.47625732421875, 1.578826904296875, 1.681396484375, 1.783966064453125, 1.88653564453125, 1.989105224609375, 2.0916748046875, 2.194244384765625, 2.29681396484375, 2.399383544921875, 2.501953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 10.0, 16.0, 29.0, 36.0, 52.0, 109.0, 212.0, 384.0, 812.0, 1645.0, 3665.0, 8026.0, 17846.0, 39581.0, 85878.0, 171459.0, 261746.0, 223728.0, 124826.0, 59443.0, 26754.0, 12045.0, 5397.0, 2510.0, 1100.0, 560.0, 296.0, 149.0, 94.0, 49.0, 25.0, 16.0, 12.0, 12.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3818359375, -0.3705253601074219, -0.35921478271484375, -0.3479042053222656, -0.3365936279296875, -0.3252830505371094, -0.31397247314453125, -0.3026618957519531, -0.291351318359375, -0.2800407409667969, -0.26873016357421875, -0.2574195861816406, -0.2461090087890625, -0.23479843139648438, -0.22348785400390625, -0.21217727661132812, -0.20086669921875, -0.18955612182617188, -0.17824554443359375, -0.16693496704101562, -0.1556243896484375, -0.14431381225585938, -0.13300323486328125, -0.12169265747070312, -0.110382080078125, -0.09907150268554688, -0.08776092529296875, -0.07645034790039062, -0.0651397705078125, -0.053829193115234375, -0.04251861572265625, -0.031208038330078125, -0.0198974609375, -0.008586883544921875, 0.00272369384765625, 0.014034271240234375, 0.0253448486328125, 0.036655426025390625, 0.04796600341796875, 0.059276580810546875, 0.070587158203125, 0.08189773559570312, 0.09320831298828125, 0.10451889038085938, 0.1158294677734375, 0.12714004516601562, 0.13845062255859375, 0.14976119995117188, 0.16107177734375, 0.17238235473632812, 0.18369293212890625, 0.19500350952148438, 0.2063140869140625, 0.21762466430664062, 0.22893524169921875, 0.24024581909179688, 0.251556396484375, 0.2628669738769531, 0.27417755126953125, 0.2854881286621094, 0.2967987060546875, 0.3081092834472656, 0.31941986083984375, 0.3307304382324219, 0.342041015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 9.0, 4.0, 5.0, 6.0, 11.0, 17.0, 20.0, 16.0, 28.0, 33.0, 26.0, 34.0, 39.0, 46.0, 42.0, 46.0, 58.0, 39.0, 55.0, 46.0, 47.0, 50.0, 53.0, 37.0, 35.0, 29.0, 31.0, 25.0, 24.0, 16.0, 18.0, 10.0, 10.0, 10.0, 5.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.6015625, -6.39208984375, -6.1826171875, -5.97314453125, -5.763671875, -5.55419921875, -5.3447265625, -5.13525390625, -4.92578125, -4.71630859375, -4.5068359375, -4.29736328125, -4.087890625, -3.87841796875, -3.6689453125, -3.45947265625, -3.25, -3.04052734375, -2.8310546875, -2.62158203125, -2.412109375, -2.20263671875, -1.9931640625, -1.78369140625, -1.57421875, -1.36474609375, -1.1552734375, -0.94580078125, -0.736328125, -0.52685546875, -0.3173828125, -0.10791015625, 0.1015625, 0.31103515625, 0.5205078125, 0.72998046875, 0.939453125, 1.14892578125, 1.3583984375, 1.56787109375, 1.77734375, 1.98681640625, 2.1962890625, 2.40576171875, 2.615234375, 2.82470703125, 3.0341796875, 3.24365234375, 3.453125, 3.66259765625, 3.8720703125, 4.08154296875, 4.291015625, 4.50048828125, 4.7099609375, 4.91943359375, 5.12890625, 5.33837890625, 5.5478515625, 5.75732421875, 5.966796875, 6.17626953125, 6.3857421875, 6.59521484375, 6.8046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 6.0, 7.0, 5.0, 16.0, 10.0, 27.0, 40.0, 37.0, 77.0, 106.0, 166.0, 283.0, 397.0, 606.0, 1042.0, 1851.0, 3540.0, 7580.0, 19496.0, 57751.0, 193323.0, 451158.0, 210787.0, 62579.0, 20976.0, 8134.0, 3613.0, 1911.0, 1102.0, 699.0, 412.0, 262.0, 187.0, 128.0, 91.0, 37.0, 40.0, 33.0, 11.0, 13.0, 12.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06939697265625, -0.06732749938964844, -0.06525802612304688, -0.06318855285644531, -0.06111907958984375, -0.05904960632324219, -0.056980133056640625, -0.05491065979003906, -0.0528411865234375, -0.05077171325683594, -0.048702239990234375, -0.04663276672363281, -0.04456329345703125, -0.04249382019042969, -0.040424346923828125, -0.03835487365722656, -0.036285400390625, -0.03421592712402344, -0.032146453857421875, -0.030076980590820312, -0.02800750732421875, -0.025938034057617188, -0.023868560791015625, -0.021799087524414062, -0.0197296142578125, -0.017660140991210938, -0.015590667724609375, -0.013521194458007812, -0.01145172119140625, -0.009382247924804688, -0.007312774658203125, -0.0052433013916015625, -0.003173828125, -0.0011043548583984375, 0.000965118408203125, 0.0030345916748046875, 0.00510406494140625, 0.0071735382080078125, 0.009243011474609375, 0.011312484741210938, 0.0133819580078125, 0.015451431274414062, 0.017520904541015625, 0.019590377807617188, 0.02165985107421875, 0.023729324340820312, 0.025798797607421875, 0.027868270874023438, 0.029937744140625, 0.03200721740722656, 0.034076690673828125, 0.03614616394042969, 0.03821563720703125, 0.04028511047363281, 0.042354583740234375, 0.04442405700683594, 0.0464935302734375, 0.04856300354003906, 0.050632476806640625, 0.05270195007324219, 0.05477142333984375, 0.05684089660644531, 0.058910369873046875, 0.06097984313964844, 0.06304931640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 11.0, 14.0, 29.0, 35.0, 52.0, 89.0, 113.0, 167.0, 161.0, 113.0, 67.0, 59.0, 36.0, 23.0, 20.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011998414993286133, -0.00011681392788887024, -0.00011364370584487915, -0.00011047348380088806, -0.00010730326175689697, -0.00010413303971290588, -0.0001009628176689148, -9.77925956249237e-05, -9.462237358093262e-05, -9.145215153694153e-05, -8.828192949295044e-05, -8.511170744895935e-05, -8.194148540496826e-05, -7.877126336097717e-05, -7.560104131698608e-05, -7.2430819272995e-05, -6.92605972290039e-05, -6.609037518501282e-05, -6.292015314102173e-05, -5.974993109703064e-05, -5.657970905303955e-05, -5.340948700904846e-05, -5.023926496505737e-05, -4.7069042921066284e-05, -4.3898820877075195e-05, -4.0728598833084106e-05, -3.755837678909302e-05, -3.438815474510193e-05, -3.121793270111084e-05, -2.804771065711975e-05, -2.4877488613128662e-05, -2.1707266569137573e-05, -1.8537044525146484e-05, -1.5366822481155396e-05, -1.2196600437164307e-05, -9.026378393173218e-06, -5.856156349182129e-06, -2.68593430519104e-06, 4.842877388000488e-07, 3.6545097827911377e-06, 6.8247318267822266e-06, 9.994953870773315e-06, 1.3165175914764404e-05, 1.6335397958755493e-05, 1.9505620002746582e-05, 2.267584204673767e-05, 2.584606409072876e-05, 2.901628613471985e-05, 3.218650817871094e-05, 3.5356730222702026e-05, 3.8526952266693115e-05, 4.1697174310684204e-05, 4.486739635467529e-05, 4.803761839866638e-05, 5.120784044265747e-05, 5.437806248664856e-05, 5.754828453063965e-05, 6.071850657463074e-05, 6.388872861862183e-05, 6.705895066261292e-05, 7.0229172706604e-05, 7.339939475059509e-05, 7.656961679458618e-05, 7.973983883857727e-05, 8.291006088256836e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 14.0, 14.0, 19.0, 31.0, 32.0, 45.0, 54.0, 84.0, 157.0, 342.0, 618.0, 1312.0, 3020.0, 7580.0, 23825.0, 94662.0, 446867.0, 364682.0, 74327.0, 19380.0, 6556.0, 2494.0, 1137.0, 539.0, 294.0, 141.0, 86.0, 61.0, 50.0, 28.0, 25.0, 16.0, 7.0, 8.0, 7.0, 7.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.086181640625, -0.08356380462646484, -0.08094596862792969, -0.07832813262939453, -0.07571029663085938, -0.07309246063232422, -0.07047462463378906, -0.0678567886352539, -0.06523895263671875, -0.0626211166381836, -0.06000328063964844, -0.05738544464111328, -0.054767608642578125, -0.05214977264404297, -0.04953193664550781, -0.046914100646972656, -0.0442962646484375, -0.041678428649902344, -0.03906059265136719, -0.03644275665283203, -0.033824920654296875, -0.03120708465576172, -0.028589248657226562, -0.025971412658691406, -0.02335357666015625, -0.020735740661621094, -0.018117904663085938, -0.015500068664550781, -0.012882232666015625, -0.010264396667480469, -0.0076465606689453125, -0.005028724670410156, -0.002410888671875, 0.00020694732666015625, 0.0028247833251953125, 0.005442619323730469, 0.008060455322265625, 0.010678291320800781, 0.013296127319335938, 0.015913963317871094, 0.01853179931640625, 0.021149635314941406, 0.023767471313476562, 0.02638530731201172, 0.029003143310546875, 0.03162097930908203, 0.03423881530761719, 0.036856651306152344, 0.0394744873046875, 0.042092323303222656, 0.04471015930175781, 0.04732799530029297, 0.049945831298828125, 0.05256366729736328, 0.05518150329589844, 0.057799339294433594, 0.06041717529296875, 0.0630350112915039, 0.06565284729003906, 0.06827068328857422, 0.07088851928710938, 0.07350635528564453, 0.07612419128417969, 0.07874202728271484, 0.08135986328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 1.0, 6.0, 9.0, 10.0, 14.0, 29.0, 13.0, 21.0, 18.0, 42.0, 36.0, 69.0, 58.0, 71.0, 98.0, 92.0, 87.0, 64.0, 56.0, 43.0, 27.0, 17.0, 21.0, 22.0, 16.0, 12.0, 9.0, 5.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0227508544921875, -0.022097110748291016, -0.02144336700439453, -0.020789623260498047, -0.020135879516601562, -0.019482135772705078, -0.018828392028808594, -0.01817464828491211, -0.017520904541015625, -0.01686716079711914, -0.016213417053222656, -0.015559673309326172, -0.014905929565429688, -0.014252185821533203, -0.013598442077636719, -0.012944698333740234, -0.01229095458984375, -0.011637210845947266, -0.010983467102050781, -0.010329723358154297, -0.009675979614257812, -0.009022235870361328, -0.008368492126464844, -0.007714748382568359, -0.007061004638671875, -0.006407260894775391, -0.005753517150878906, -0.005099773406982422, -0.0044460296630859375, -0.003792285919189453, -0.0031385421752929688, -0.0024847984313964844, -0.0018310546875, -0.0011773109436035156, -0.0005235671997070312, 0.00013017654418945312, 0.0007839202880859375, 0.0014376640319824219, 0.0020914077758789062, 0.0027451515197753906, 0.003398895263671875, 0.004052639007568359, 0.004706382751464844, 0.005360126495361328, 0.0060138702392578125, 0.006667613983154297, 0.007321357727050781, 0.007975101470947266, 0.00862884521484375, 0.009282588958740234, 0.009936332702636719, 0.010590076446533203, 0.011243820190429688, 0.011897563934326172, 0.012551307678222656, 0.01320505142211914, 0.013858795166015625, 0.01451253890991211, 0.015166282653808594, 0.015820026397705078, 0.016473770141601562, 0.017127513885498047, 0.01778125762939453, 0.018435001373291016, 0.0190887451171875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 12.0, 25.0, 148.0, 322.0, 309.0, 158.0, 35.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.214421272277832, -4.742288112640381, -4.270155429840088, -3.7980222702026367, -3.3258893489837646, -2.8537564277648926, -2.3816232681274414, -1.9094903469085693, -1.4373574256896973, -0.9652244448661804, -0.4930914640426636, -0.020958423614501953, 0.4511744976043701, 0.9233074188232422, 1.3954405784606934, 1.8675734996795654, 2.3397064208984375, 2.8118393421173096, 3.2839722633361816, 3.756105422973633, 4.228238105773926, 4.700371265411377, 5.172504425048828, 5.644637107849121, 6.116770267486572, 6.588903427124023, 7.061036109924316, 7.533169269561768, 8.005302429199219, 8.477435111999512, 8.949567794799805, 9.421701431274414, 9.893835067749023, 10.365967750549316, 10.838101387023926, 11.310234069824219, 11.782366752624512, 12.254499435424805, 12.726633071899414, 13.198765754699707, 13.6708984375, 14.143031120300293, 14.615164756774902, 15.087297439575195, 15.559430122375488, 16.03156280517578, 16.50369644165039, 16.975830078125, 17.44796371459961, 17.92009735107422, 18.392229080200195, 18.864362716674805, 19.336496353149414, 19.80862808227539, 20.28076171875, 20.75289535522461, 21.225027084350586, 21.697160720825195, 22.169292449951172, 22.64142608642578, 23.11355972290039, 23.585691452026367, 24.057825088500977, 24.529958724975586, 25.002090454101562]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 2.0, 6.0, 2.0, 3.0, 4.0, 12.0, 11.0, 20.0, 12.0, 12.0, 19.0, 20.0, 23.0, 19.0, 31.0, 28.0, 32.0, 27.0, 31.0, 45.0, 40.0, 45.0, 39.0, 41.0, 29.0, 27.0, 48.0, 29.0, 45.0, 35.0, 33.0, 30.0, 30.0, 28.0, 20.0, 17.0, 20.0, 11.0, 12.0, 11.0, 10.0, 8.0, 6.0, 5.0, 4.0, 8.0, 4.0, 1.0, 2.0, 5.0, 0.0, 2.0], "bins": [-2.6807005405426025, -2.6046156883239746, -2.5285305976867676, -2.4524457454681396, -2.3763608932495117, -2.3002758026123047, -2.2241909503936768, -2.148106098175049, -2.072021007537842, -1.9959360361099243, -1.9198510646820068, -1.843766212463379, -1.7676812410354614, -1.691596269607544, -1.615511417388916, -1.5394264459609985, -1.463341474533081, -1.3872565031051636, -1.311171531677246, -1.2350866794586182, -1.1590017080307007, -1.0829167366027832, -1.0068318843841553, -0.9307469129562378, -0.8546619415283203, -0.7785769701004028, -0.7024920582771301, -0.6264071464538574, -0.5503221750259399, -0.47423723340034485, -0.39815229177474976, -0.32206737995147705, -0.24598240852355957, -0.16989746689796448, -0.09381252527236938, -0.017727583646774292, 0.0583573579788208, 0.1344422996044159, 0.210527241230011, 0.2866121530532837, 0.36269712448120117, 0.43878206610679626, 0.5148670077323914, 0.5909519195556641, 0.6670368909835815, 0.743121862411499, 0.8192067742347717, 0.8952916860580444, 0.9713766574859619, 1.0474616289138794, 1.1235466003417969, 1.1996314525604248, 1.2757164239883423, 1.3518013954162598, 1.4278862476348877, 1.5039712190628052, 1.5800561904907227, 1.6561411619186401, 1.7322261333465576, 1.8083109855651855, 1.884395956993103, 1.9604809284210205, 2.0365657806396484, 2.1126508712768555, 2.1887357234954834]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 4.0, 11.0, 16.0, 11.0, 19.0, 19.0, 28.0, 41.0, 56.0, 69.0, 150.0, 305.0, 793.0, 2641.0, 13624.0, 80553.0, 344045.0, 440028.0, 136142.0, 23578.0, 4371.0, 1158.0, 388.0, 186.0, 83.0, 54.0, 40.0, 25.0, 21.0, 21.0, 16.0, 13.0, 8.0, 2.0, 4.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.3984375, -4.25726318359375, -4.1160888671875, -3.97491455078125, -3.833740234375, -3.69256591796875, -3.5513916015625, -3.41021728515625, -3.26904296875, -3.12786865234375, -2.9866943359375, -2.84552001953125, -2.704345703125, -2.56317138671875, -2.4219970703125, -2.28082275390625, -2.1396484375, -1.99847412109375, -1.8572998046875, -1.71612548828125, -1.574951171875, -1.43377685546875, -1.2926025390625, -1.15142822265625, -1.01025390625, -0.86907958984375, -0.7279052734375, -0.58673095703125, -0.445556640625, -0.30438232421875, -0.1632080078125, -0.02203369140625, 0.119140625, 0.26031494140625, 0.4014892578125, 0.54266357421875, 0.683837890625, 0.82501220703125, 0.9661865234375, 1.10736083984375, 1.24853515625, 1.38970947265625, 1.5308837890625, 1.67205810546875, 1.813232421875, 1.95440673828125, 2.0955810546875, 2.23675537109375, 2.3779296875, 2.51910400390625, 2.6602783203125, 2.80145263671875, 2.942626953125, 3.08380126953125, 3.2249755859375, 3.36614990234375, 3.50732421875, 3.64849853515625, 3.7896728515625, 3.93084716796875, 4.072021484375, 4.21319580078125, 4.3543701171875, 4.49554443359375, 4.63671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 6.0, 5.0, 9.0, 7.0, 20.0, 15.0, 15.0, 12.0, 20.0, 19.0, 22.0, 29.0, 26.0, 30.0, 40.0, 42.0, 38.0, 47.0, 39.0, 35.0, 43.0, 43.0, 44.0, 48.0, 51.0, 32.0, 36.0, 37.0, 37.0, 16.0, 24.0, 23.0, 10.0, 15.0, 13.0, 10.0, 7.0, 7.0, 4.0, 4.0, 3.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6484375, -4.503173828125, -4.35791015625, -4.212646484375, -4.0673828125, -3.922119140625, -3.77685546875, -3.631591796875, -3.486328125, -3.341064453125, -3.19580078125, -3.050537109375, -2.9052734375, -2.760009765625, -2.61474609375, -2.469482421875, -2.32421875, -2.178955078125, -2.03369140625, -1.888427734375, -1.7431640625, -1.597900390625, -1.45263671875, -1.307373046875, -1.162109375, -1.016845703125, -0.87158203125, -0.726318359375, -0.5810546875, -0.435791015625, -0.29052734375, -0.145263671875, 0.0, 0.145263671875, 0.29052734375, 0.435791015625, 0.5810546875, 0.726318359375, 0.87158203125, 1.016845703125, 1.162109375, 1.307373046875, 1.45263671875, 1.597900390625, 1.7431640625, 1.888427734375, 2.03369140625, 2.178955078125, 2.32421875, 2.469482421875, 2.61474609375, 2.760009765625, 2.9052734375, 3.050537109375, 3.19580078125, 3.341064453125, 3.486328125, 3.631591796875, 3.77685546875, 3.922119140625, 4.0673828125, 4.212646484375, 4.35791015625, 4.503173828125, 4.6484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 2.0, 6.0, 6.0, 11.0, 12.0, 19.0, 17.0, 21.0, 31.0, 34.0, 48.0, 60.0, 93.0, 136.0, 171.0, 287.0, 410.0, 1299.0, 29785.0, 834158.0, 177133.0, 3078.0, 589.0, 349.0, 224.0, 139.0, 129.0, 63.0, 54.0, 38.0, 23.0, 29.0, 16.0, 19.0, 14.0, 10.0, 8.0, 7.0, 3.0, 8.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.25, -9.9266357421875, -9.603271484375, -9.2799072265625, -8.95654296875, -8.6331787109375, -8.309814453125, -7.9864501953125, -7.6630859375, -7.3397216796875, -7.016357421875, -6.6929931640625, -6.36962890625, -6.0462646484375, -5.722900390625, -5.3995361328125, -5.076171875, -4.7528076171875, -4.429443359375, -4.1060791015625, -3.78271484375, -3.4593505859375, -3.135986328125, -2.8126220703125, -2.4892578125, -2.1658935546875, -1.842529296875, -1.5191650390625, -1.19580078125, -0.8724365234375, -0.549072265625, -0.2257080078125, 0.09765625, 0.4210205078125, 0.744384765625, 1.0677490234375, 1.39111328125, 1.7144775390625, 2.037841796875, 2.3612060546875, 2.6845703125, 3.0079345703125, 3.331298828125, 3.6546630859375, 3.97802734375, 4.3013916015625, 4.624755859375, 4.9481201171875, 5.271484375, 5.5948486328125, 5.918212890625, 6.2415771484375, 6.56494140625, 6.8883056640625, 7.211669921875, 7.5350341796875, 7.8583984375, 8.1817626953125, 8.505126953125, 8.8284912109375, 9.15185546875, 9.4752197265625, 9.798583984375, 10.1219482421875, 10.4453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 6.0, 8.0, 11.0, 10.0, 9.0, 13.0, 17.0, 17.0, 24.0, 21.0, 21.0, 21.0, 27.0, 45.0, 34.0, 34.0, 42.0, 46.0, 51.0, 50.0, 44.0, 44.0, 40.0, 34.0, 40.0, 36.0, 34.0, 28.0, 35.0, 18.0, 21.0, 12.0, 20.0, 12.0, 14.0, 7.0, 10.0, 4.0, 9.0, 7.0, 2.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.137939453125, -4.97119140625, -4.804443359375, -4.6376953125, -4.470947265625, -4.30419921875, -4.137451171875, -3.970703125, -3.803955078125, -3.63720703125, -3.470458984375, -3.3037109375, -3.136962890625, -2.97021484375, -2.803466796875, -2.63671875, -2.469970703125, -2.30322265625, -2.136474609375, -1.9697265625, -1.802978515625, -1.63623046875, -1.469482421875, -1.302734375, -1.135986328125, -0.96923828125, -0.802490234375, -0.6357421875, -0.468994140625, -0.30224609375, -0.135498046875, 0.03125, 0.197998046875, 0.36474609375, 0.531494140625, 0.6982421875, 0.864990234375, 1.03173828125, 1.198486328125, 1.365234375, 1.531982421875, 1.69873046875, 1.865478515625, 2.0322265625, 2.198974609375, 2.36572265625, 2.532470703125, 2.69921875, 2.865966796875, 3.03271484375, 3.199462890625, 3.3662109375, 3.532958984375, 3.69970703125, 3.866455078125, 4.033203125, 4.199951171875, 4.36669921875, 4.533447265625, 4.7001953125, 4.866943359375, 5.03369140625, 5.200439453125, 5.3671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 5.0, 8.0, 20.0, 35.0, 37.0, 63.0, 152.0, 458.0, 1923.0, 10831.0, 549490.0, 473209.0, 9813.0, 1740.0, 429.0, 126.0, 61.0, 48.0, 39.0, 13.0, 7.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.560546875, -3.423492431640625, -3.28643798828125, -3.149383544921875, -3.0123291015625, -2.875274658203125, -2.73822021484375, -2.601165771484375, -2.464111328125, -2.327056884765625, -2.19000244140625, -2.052947998046875, -1.9158935546875, -1.778839111328125, -1.64178466796875, -1.504730224609375, -1.36767578125, -1.230621337890625, -1.09356689453125, -0.956512451171875, -0.8194580078125, -0.682403564453125, -0.54534912109375, -0.408294677734375, -0.271240234375, -0.134185791015625, 0.00286865234375, 0.139923095703125, 0.2769775390625, 0.414031982421875, 0.55108642578125, 0.688140869140625, 0.8251953125, 0.962249755859375, 1.09930419921875, 1.236358642578125, 1.3734130859375, 1.510467529296875, 1.64752197265625, 1.784576416015625, 1.921630859375, 2.058685302734375, 2.19573974609375, 2.332794189453125, 2.4698486328125, 2.606903076171875, 2.74395751953125, 2.881011962890625, 3.01806640625, 3.155120849609375, 3.29217529296875, 3.429229736328125, 3.5662841796875, 3.703338623046875, 3.84039306640625, 3.977447509765625, 4.114501953125, 4.251556396484375, 4.38861083984375, 4.525665283203125, 4.6627197265625, 4.799774169921875, 4.93682861328125, 5.073883056640625, 5.2109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 11.0, 25.0, 27.0, 49.0, 72.0, 99.0, 129.0, 167.0, 120.0, 137.0, 60.0, 44.0, 28.0, 10.0, 7.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004737377166748047, -0.0004591308534145355, -0.00044452399015426636, -0.0004299171268939972, -0.00041531026363372803, -0.00040070340037345886, -0.0003860965371131897, -0.00037148967385292053, -0.00035688281059265137, -0.0003422759473323822, -0.00032766908407211304, -0.00031306222081184387, -0.0002984553575515747, -0.00028384849429130554, -0.0002692416310310364, -0.0002546347677707672, -0.00024002790451049805, -0.00022542104125022888, -0.00021081417798995972, -0.00019620731472969055, -0.0001816004514694214, -0.00016699358820915222, -0.00015238672494888306, -0.0001377798616886139, -0.00012317299842834473, -0.00010856613516807556, -9.39592719078064e-05, -7.935240864753723e-05, -6.474554538726807e-05, -5.01386821269989e-05, -3.5531818866729736e-05, -2.092495560646057e-05, -6.318092346191406e-06, 8.288770914077759e-06, 2.2895634174346924e-05, 3.750249743461609e-05, 5.2109360694885254e-05, 6.671622395515442e-05, 8.132308721542358e-05, 9.592995047569275e-05, 0.00011053681373596191, 0.00012514367699623108, 0.00013975054025650024, 0.0001543574035167694, 0.00016896426677703857, 0.00018357113003730774, 0.0001981779932975769, 0.00021278485655784607, 0.00022739171981811523, 0.0002419985830783844, 0.00025660544633865356, 0.00027121230959892273, 0.0002858191728591919, 0.00030042603611946106, 0.0003150328993797302, 0.0003296397626399994, 0.00034424662590026855, 0.0003588534891605377, 0.0003734603524208069, 0.00038806721568107605, 0.0004026740789413452, 0.0004172809422016144, 0.00043188780546188354, 0.0004464946687221527, 0.0004611015319824219]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 10.0, 9.0, 17.0, 19.0, 39.0, 78.0, 227.0, 978.0, 10738.0, 970333.0, 63205.0, 2252.0, 366.0, 131.0, 60.0, 32.0, 21.0, 10.0, 8.0, 4.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.57598876953125, -5.3590087890625, -5.14202880859375, -4.925048828125, -4.70806884765625, -4.4910888671875, -4.27410888671875, -4.05712890625, -3.84014892578125, -3.6231689453125, -3.40618896484375, -3.189208984375, -2.97222900390625, -2.7552490234375, -2.53826904296875, -2.3212890625, -2.10430908203125, -1.8873291015625, -1.67034912109375, -1.453369140625, -1.23638916015625, -1.0194091796875, -0.80242919921875, -0.58544921875, -0.36846923828125, -0.1514892578125, 0.06549072265625, 0.282470703125, 0.49945068359375, 0.7164306640625, 0.93341064453125, 1.150390625, 1.36737060546875, 1.5843505859375, 1.80133056640625, 2.018310546875, 2.23529052734375, 2.4522705078125, 2.66925048828125, 2.88623046875, 3.10321044921875, 3.3201904296875, 3.53717041015625, 3.754150390625, 3.97113037109375, 4.1881103515625, 4.40509033203125, 4.6220703125, 4.83905029296875, 5.0560302734375, 5.27301025390625, 5.489990234375, 5.70697021484375, 5.9239501953125, 6.14093017578125, 6.35791015625, 6.57489013671875, 6.7918701171875, 7.00885009765625, 7.225830078125, 7.44281005859375, 7.6597900390625, 7.87677001953125, 8.09375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 13.0, 27.0, 38.0, 62.0, 77.0, 117.0, 128.0, 145.0, 129.0, 90.0, 61.0, 33.0, 26.0, 16.0, 10.0, 3.0, 9.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.255859375, -1.220123291015625, -1.18438720703125, -1.148651123046875, -1.1129150390625, -1.077178955078125, -1.04144287109375, -1.005706787109375, -0.969970703125, -0.934234619140625, -0.89849853515625, -0.862762451171875, -0.8270263671875, -0.791290283203125, -0.75555419921875, -0.719818115234375, -0.68408203125, -0.648345947265625, -0.61260986328125, -0.576873779296875, -0.5411376953125, -0.505401611328125, -0.46966552734375, -0.433929443359375, -0.398193359375, -0.362457275390625, -0.32672119140625, -0.290985107421875, -0.2552490234375, -0.219512939453125, -0.18377685546875, -0.148040771484375, -0.1123046875, -0.076568603515625, -0.04083251953125, -0.005096435546875, 0.0306396484375, 0.066375732421875, 0.10211181640625, 0.137847900390625, 0.173583984375, 0.209320068359375, 0.24505615234375, 0.280792236328125, 0.3165283203125, 0.352264404296875, 0.38800048828125, 0.423736572265625, 0.45947265625, 0.495208740234375, 0.53094482421875, 0.566680908203125, 0.6024169921875, 0.638153076171875, 0.67388916015625, 0.709625244140625, 0.745361328125, 0.781097412109375, 0.81683349609375, 0.852569580078125, 0.8883056640625, 0.924041748046875, 0.95977783203125, 0.995513916015625, 1.03125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 17.0, 51.0, 110.0, 183.0, 213.0, 191.0, 133.0, 51.0, 29.0, 15.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.09824562072754, -23.533740997314453, -22.969236373901367, -22.40473175048828, -21.840227127075195, -21.27572250366211, -20.711219787597656, -20.14671516418457, -19.582210540771484, -19.0177059173584, -18.453201293945312, -17.888696670532227, -17.32419204711914, -16.759689331054688, -16.19518280029297, -15.6306791305542, -15.066174507141113, -14.501669883728027, -13.937165260314941, -13.372661590576172, -12.808156967163086, -12.24365234375, -11.679147720336914, -11.114643096923828, -10.550138473510742, -9.985633850097656, -9.42112922668457, -8.856624603271484, -8.292120933532715, -7.727616310119629, -7.163111686706543, -6.598607063293457, -6.034104347229004, -5.469599723815918, -4.90509557723999, -4.340590953826904, -3.7760865688323975, -3.2115821838378906, -2.6470775604248047, -2.082573175430298, -1.518068790435791, -0.9535643458366394, -0.3890599012374878, 0.1754446029663086, 0.7399489879608154, 1.3044533729553223, 1.8689579963684082, 2.433462381362915, 2.997966766357422, 3.5624711513519287, 4.1269755363464355, 4.6914801597595215, 5.255984306335449, 5.820488929748535, 6.384993553161621, 6.949498176574707, 7.514002323150635, 8.078506469726562, 8.643011093139648, 9.207515716552734, 9.77202033996582, 10.336524963378906, 10.901029586791992, 11.465533256530762, 12.030037879943848]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 0.0, 6.0, 5.0, 8.0, 1.0, 9.0, 9.0, 13.0, 16.0, 18.0, 11.0, 20.0, 29.0, 27.0, 20.0, 39.0, 33.0, 37.0, 35.0, 34.0, 44.0, 39.0, 45.0, 32.0, 41.0, 35.0, 34.0, 41.0, 39.0, 30.0, 40.0, 21.0, 33.0, 23.0, 23.0, 18.0, 16.0, 20.0, 16.0, 10.0, 10.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.757124423980713, -7.4851393699646, -7.213153839111328, -6.941168785095215, -6.669183731079102, -6.39719820022583, -6.125213146209717, -5.853227615356445, -5.581242561340332, -5.309257507324219, -5.037271976470947, -4.765286922454834, -4.4933013916015625, -4.221316337585449, -3.949331283569336, -3.6773459911346436, -3.405360698699951, -3.133375406265259, -2.8613901138305664, -2.589405059814453, -2.3174197673797607, -2.0454344749450684, -1.7734493017196655, -1.5014641284942627, -1.2294788360595703, -0.9574936032295227, -0.6855083703994751, -0.4135231375694275, -0.14153790473937988, 0.1304473876953125, 0.40243256092071533, 0.6744177341461182, 0.9464035034179688, 1.2183887958526611, 1.490373969078064, 1.7623591423034668, 2.034344434738159, 2.3063297271728516, 2.578314781188965, 2.8503000736236572, 3.1222853660583496, 3.394270658493042, 3.6662559509277344, 3.9382410049438477, 4.210226058959961, 4.482211589813232, 4.754196643829346, 5.026182174682617, 5.2981672286987305, 5.570152282714844, 5.842137813568115, 6.1141228675842285, 6.3861083984375, 6.658093452453613, 6.930078506469727, 7.20206356048584, 7.474049091339111, 7.746034145355225, 8.018019676208496, 8.29000473022461, 8.561989784240723, 8.833974838256836, 9.105960845947266, 9.377945899963379, 9.649930953979492]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 11.0, 13.0, 19.0, 33.0, 58.0, 60.0, 111.0, 171.0, 315.0, 604.0, 1437.0, 16325.0, 1386879.0, 2740200.0, 44992.0, 1846.0, 503.0, 265.0, 144.0, 91.0, 54.0, 49.0, 30.0, 16.0, 13.0, 9.0, 9.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.53125, -12.14111328125, -11.7509765625, -11.36083984375, -10.970703125, -10.58056640625, -10.1904296875, -9.80029296875, -9.41015625, -9.02001953125, -8.6298828125, -8.23974609375, -7.849609375, -7.45947265625, -7.0693359375, -6.67919921875, -6.2890625, -5.89892578125, -5.5087890625, -5.11865234375, -4.728515625, -4.33837890625, -3.9482421875, -3.55810546875, -3.16796875, -2.77783203125, -2.3876953125, -1.99755859375, -1.607421875, -1.21728515625, -0.8271484375, -0.43701171875, -0.046875, 0.34326171875, 0.7333984375, 1.12353515625, 1.513671875, 1.90380859375, 2.2939453125, 2.68408203125, 3.07421875, 3.46435546875, 3.8544921875, 4.24462890625, 4.634765625, 5.02490234375, 5.4150390625, 5.80517578125, 6.1953125, 6.58544921875, 6.9755859375, 7.36572265625, 7.755859375, 8.14599609375, 8.5361328125, 8.92626953125, 9.31640625, 9.70654296875, 10.0966796875, 10.48681640625, 10.876953125, 11.26708984375, 11.6572265625, 12.04736328125, 12.4375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 12.0, 9.0, 14.0, 20.0, 26.0, 27.0, 35.0, 33.0, 34.0, 36.0, 33.0, 49.0, 52.0, 35.0, 51.0, 48.0, 47.0, 49.0, 36.0, 44.0, 49.0, 39.0, 30.0, 27.0, 28.0, 17.0, 19.0, 16.0, 17.0, 14.0, 11.0, 7.0, 10.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0546875, -2.93310546875, -2.8115234375, -2.68994140625, -2.568359375, -2.44677734375, -2.3251953125, -2.20361328125, -2.08203125, -1.96044921875, -1.8388671875, -1.71728515625, -1.595703125, -1.47412109375, -1.3525390625, -1.23095703125, -1.109375, -0.98779296875, -0.8662109375, -0.74462890625, -0.623046875, -0.50146484375, -0.3798828125, -0.25830078125, -0.13671875, -0.01513671875, 0.1064453125, 0.22802734375, 0.349609375, 0.47119140625, 0.5927734375, 0.71435546875, 0.8359375, 0.95751953125, 1.0791015625, 1.20068359375, 1.322265625, 1.44384765625, 1.5654296875, 1.68701171875, 1.80859375, 1.93017578125, 2.0517578125, 2.17333984375, 2.294921875, 2.41650390625, 2.5380859375, 2.65966796875, 2.78125, 2.90283203125, 3.0244140625, 3.14599609375, 3.267578125, 3.38916015625, 3.5107421875, 3.63232421875, 3.75390625, 3.87548828125, 3.9970703125, 4.11865234375, 4.240234375, 4.36181640625, 4.4833984375, 4.60498046875, 4.7265625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 7.0, 21.0, 17.0, 24.0, 43.0, 67.0, 92.0, 153.0, 248.0, 397.0, 746.0, 1822.0, 5880.0, 48891.0, 1600992.0, 2448179.0, 74857.0, 7610.0, 2100.0, 862.0, 463.0, 269.0, 187.0, 100.0, 83.0, 43.0, 29.0, 30.0, 14.0, 14.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.42578125, -6.18841552734375, -5.9510498046875, -5.71368408203125, -5.476318359375, -5.23895263671875, -5.0015869140625, -4.76422119140625, -4.52685546875, -4.28948974609375, -4.0521240234375, -3.81475830078125, -3.577392578125, -3.34002685546875, -3.1026611328125, -2.86529541015625, -2.6279296875, -2.39056396484375, -2.1531982421875, -1.91583251953125, -1.678466796875, -1.44110107421875, -1.2037353515625, -0.96636962890625, -0.72900390625, -0.49163818359375, -0.2542724609375, -0.01690673828125, 0.220458984375, 0.45782470703125, 0.6951904296875, 0.93255615234375, 1.169921875, 1.40728759765625, 1.6446533203125, 1.88201904296875, 2.119384765625, 2.35675048828125, 2.5941162109375, 2.83148193359375, 3.06884765625, 3.30621337890625, 3.5435791015625, 3.78094482421875, 4.018310546875, 4.25567626953125, 4.4930419921875, 4.73040771484375, 4.9677734375, 5.20513916015625, 5.4425048828125, 5.67987060546875, 5.917236328125, 6.15460205078125, 6.3919677734375, 6.62933349609375, 6.86669921875, 7.10406494140625, 7.3414306640625, 7.57879638671875, 7.816162109375, 8.05352783203125, 8.2908935546875, 8.52825927734375, 8.765625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 1.0, 7.0, 14.0, 6.0, 20.0, 18.0, 34.0, 31.0, 56.0, 97.0, 105.0, 151.0, 225.0, 282.0, 405.0, 447.0, 453.0, 426.0, 352.0, 280.0, 190.0, 141.0, 107.0, 75.0, 30.0, 42.0, 28.0, 13.0, 8.0, 6.0, 7.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6708984375, -1.6222381591796875, -1.573577880859375, -1.5249176025390625, -1.47625732421875, -1.4275970458984375, -1.378936767578125, -1.3302764892578125, -1.2816162109375, -1.2329559326171875, -1.184295654296875, -1.1356353759765625, -1.08697509765625, -1.0383148193359375, -0.989654541015625, -0.9409942626953125, -0.892333984375, -0.8436737060546875, -0.795013427734375, -0.7463531494140625, -0.69769287109375, -0.6490325927734375, -0.600372314453125, -0.5517120361328125, -0.5030517578125, -0.4543914794921875, -0.405731201171875, -0.3570709228515625, -0.30841064453125, -0.2597503662109375, -0.211090087890625, -0.1624298095703125, -0.11376953125, -0.0651092529296875, -0.016448974609375, 0.0322113037109375, 0.08087158203125, 0.1295318603515625, 0.178192138671875, 0.2268524169921875, 0.2755126953125, 0.3241729736328125, 0.372833251953125, 0.4214935302734375, 0.47015380859375, 0.5188140869140625, 0.567474365234375, 0.6161346435546875, 0.664794921875, 0.7134552001953125, 0.762115478515625, 0.8107757568359375, 0.85943603515625, 0.9080963134765625, 0.956756591796875, 1.0054168701171875, 1.0540771484375, 1.1027374267578125, 1.151397705078125, 1.2000579833984375, 1.24871826171875, 1.2973785400390625, 1.346038818359375, 1.3946990966796875, 1.443359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 10.0, 25.0, 38.0, 85.0, 123.0, 159.0, 189.0, 155.0, 89.0, 65.0, 40.0, 15.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.987656593322754, -5.623998641967773, -5.260340690612793, -4.896682262420654, -4.533024311065674, -4.169366359710693, -3.805708169937134, -3.442049980163574, -3.0783920288085938, -2.7147340774536133, -2.3510758876800537, -1.9874178171157837, -1.6237597465515137, -1.2601016759872437, -0.8964436054229736, -0.5327854156494141, -0.1691274642944336, 0.19453060626983643, 0.5581886768341064, 0.9218467473983765, 1.2855048179626465, 1.6491628885269165, 2.0128209590911865, 2.376479148864746, 2.7401371002197266, 3.103795051574707, 3.4674532413482666, 3.831111431121826, 4.194769382476807, 4.558427333831787, 4.922085762023926, 5.285743713378906, 5.64940071105957, 6.013058662414551, 6.376716613769531, 6.74037504196167, 7.10403299331665, 7.467690944671631, 7.8313493728637695, 8.19500732421875, 8.55866527557373, 8.922323226928711, 9.285981178283691, 9.649639129638672, 10.013298034667969, 10.37695598602295, 10.74061393737793, 11.10427188873291, 11.46792984008789, 11.831587791442871, 12.195245742797852, 12.558903694152832, 12.922561645507812, 13.28622055053711, 13.64987850189209, 14.01353645324707, 14.37719440460205, 14.740852355957031, 15.104510307312012, 15.468168258666992, 15.831827163696289, 16.195484161376953, 16.55914306640625, 16.922801971435547, 17.28645896911621]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 7.0, 3.0, 5.0, 7.0, 10.0, 14.0, 12.0, 11.0, 20.0, 19.0, 20.0, 31.0, 31.0, 34.0, 24.0, 34.0, 44.0, 43.0, 45.0, 33.0, 38.0, 40.0, 32.0, 46.0, 37.0, 43.0, 35.0, 24.0, 41.0, 34.0, 29.0, 25.0, 18.0, 18.0, 14.0, 9.0, 12.0, 14.0, 14.0, 5.0, 8.0, 8.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3395462036132812, -3.2292258739471436, -3.118905544281006, -3.0085854530334473, -2.8982651233673096, -2.787944793701172, -2.677624464035034, -2.5673041343688965, -2.456983804702759, -2.346663475036621, -2.2363431453704834, -2.1260228157043457, -2.015702724456787, -1.9053823947906494, -1.7950620651245117, -1.684741735458374, -1.5744215250015259, -1.4641011953353882, -1.35378098487854, -1.2434606552124023, -1.1331403255462646, -1.022819995880127, -0.9124997854232788, -0.8021794557571411, -0.6918591856956482, -0.5815389156341553, -0.4712185859680176, -0.36089831590652466, -0.25057801604270935, -0.14025771617889404, -0.029937446117401123, 0.08038288354873657, 0.1907031536102295, 0.3010234534740448, 0.4113437533378601, 0.521664023399353, 0.6319843530654907, 0.7423046231269836, 0.8526248931884766, 0.9629452228546143, 1.073265552520752, 1.1835858821868896, 1.2939060926437378, 1.4042264223098755, 1.5145467519760132, 1.6248669624328613, 1.735187292098999, 1.8455076217651367, 1.9558278322219849, 2.066148042678833, 2.1764683723449707, 2.2867887020111084, 2.397109031677246, 2.507429361343384, 2.6177496910095215, 2.72806978225708, 2.8383901119232178, 2.9487104415893555, 3.059030771255493, 3.169351100921631, 3.2796711921691895, 3.389991521835327, 3.500311851501465, 3.6106321811676025, 3.7209525108337402]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 16.0, 22.0, 20.0, 60.0, 100.0, 170.0, 359.0, 791.0, 1945.0, 6086.0, 23243.0, 95656.0, 341663.0, 405488.0, 129740.0, 30907.0, 7995.0, 2433.0, 959.0, 422.0, 209.0, 113.0, 54.0, 43.0, 21.0, 11.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6252288818359375, -0.604461669921875, -0.5836944580078125, -0.56292724609375, -0.5421600341796875, -0.521392822265625, -0.5006256103515625, -0.4798583984375, -0.4590911865234375, -0.438323974609375, -0.4175567626953125, -0.39678955078125, -0.3760223388671875, -0.355255126953125, -0.3344879150390625, -0.313720703125, -0.2929534912109375, -0.272186279296875, -0.2514190673828125, -0.23065185546875, -0.2098846435546875, -0.189117431640625, -0.1683502197265625, -0.1475830078125, -0.1268157958984375, -0.106048583984375, -0.0852813720703125, -0.06451416015625, -0.0437469482421875, -0.022979736328125, -0.0022125244140625, 0.0185546875, 0.0393218994140625, 0.060089111328125, 0.0808563232421875, 0.10162353515625, 0.1223907470703125, 0.143157958984375, 0.1639251708984375, 0.1846923828125, 0.2054595947265625, 0.226226806640625, 0.2469940185546875, 0.26776123046875, 0.2885284423828125, 0.309295654296875, 0.3300628662109375, 0.350830078125, 0.3715972900390625, 0.392364501953125, 0.4131317138671875, 0.43389892578125, 0.4546661376953125, 0.475433349609375, 0.4962005615234375, 0.5169677734375, 0.5377349853515625, 0.558502197265625, 0.5792694091796875, 0.60003662109375, 0.6208038330078125, 0.641571044921875, 0.6623382568359375, 0.68310546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 14.0, 22.0, 24.0, 19.0, 36.0, 35.0, 44.0, 45.0, 68.0, 64.0, 60.0, 59.0, 55.0, 62.0, 66.0, 52.0, 57.0, 45.0, 31.0, 27.0, 27.0, 16.0, 17.0, 19.0, 12.0, 8.0, 3.0, 7.0, 2.0, 4.0], "bins": [-5.36328125, -5.2467041015625, -5.130126953125, -5.0135498046875, -4.89697265625, -4.7803955078125, -4.663818359375, -4.5472412109375, -4.4306640625, -4.3140869140625, -4.197509765625, -4.0809326171875, -3.96435546875, -3.8477783203125, -3.731201171875, -3.6146240234375, -3.498046875, -3.3814697265625, -3.264892578125, -3.1483154296875, -3.03173828125, -2.9151611328125, -2.798583984375, -2.6820068359375, -2.5654296875, -2.4488525390625, -2.332275390625, -2.2156982421875, -2.09912109375, -1.9825439453125, -1.865966796875, -1.7493896484375, -1.6328125, -1.5162353515625, -1.399658203125, -1.2830810546875, -1.16650390625, -1.0499267578125, -0.933349609375, -0.8167724609375, -0.7001953125, -0.5836181640625, -0.467041015625, -0.3504638671875, -0.23388671875, -0.1173095703125, -0.000732421875, 0.1158447265625, 0.232421875, 0.3489990234375, 0.465576171875, 0.5821533203125, 0.69873046875, 0.8153076171875, 0.931884765625, 1.0484619140625, 1.1650390625, 1.2816162109375, 1.398193359375, 1.5147705078125, 1.63134765625, 1.7479248046875, 1.864501953125, 1.9810791015625, 2.09765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 5.0, 11.0, 16.0, 24.0, 43.0, 78.0, 142.0, 231.0, 483.0, 1041.0, 2031.0, 4342.0, 8874.0, 19471.0, 41791.0, 87925.0, 170103.0, 249300.0, 218170.0, 126301.0, 62857.0, 29323.0, 13510.0, 6492.0, 3125.0, 1388.0, 701.0, 342.0, 164.0, 96.0, 61.0, 34.0, 27.0, 13.0, 17.0, 4.0, 5.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31201171875, -0.3018684387207031, -0.29172515869140625, -0.2815818786621094, -0.2714385986328125, -0.2612953186035156, -0.25115203857421875, -0.24100875854492188, -0.230865478515625, -0.22072219848632812, -0.21057891845703125, -0.20043563842773438, -0.1902923583984375, -0.18014907836914062, -0.17000579833984375, -0.15986251831054688, -0.14971923828125, -0.13957595825195312, -0.12943267822265625, -0.11928939819335938, -0.1091461181640625, -0.09900283813476562, -0.08885955810546875, -0.07871627807617188, -0.068572998046875, -0.058429718017578125, -0.04828643798828125, -0.038143157958984375, -0.0279998779296875, -0.017856597900390625, -0.00771331787109375, 0.002429962158203125, 0.0125732421875, 0.022716522216796875, 0.03285980224609375, 0.043003082275390625, 0.0531463623046875, 0.06328964233398438, 0.07343292236328125, 0.08357620239257812, 0.093719482421875, 0.10386276245117188, 0.11400604248046875, 0.12414932250976562, 0.1342926025390625, 0.14443588256835938, 0.15457916259765625, 0.16472244262695312, 0.17486572265625, 0.18500900268554688, 0.19515228271484375, 0.20529556274414062, 0.2154388427734375, 0.22558212280273438, 0.23572540283203125, 0.24586868286132812, 0.256011962890625, 0.2661552429199219, 0.27629852294921875, 0.2864418029785156, 0.2965850830078125, 0.3067283630371094, 0.31687164306640625, 0.3270149230957031, 0.337158203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 6.0, 9.0, 9.0, 9.0, 13.0, 11.0, 10.0, 14.0, 19.0, 27.0, 32.0, 20.0, 30.0, 27.0, 34.0, 36.0, 42.0, 44.0, 51.0, 33.0, 45.0, 48.0, 53.0, 31.0, 42.0, 28.0, 28.0, 37.0, 26.0, 31.0, 24.0, 17.0, 18.0, 12.0, 12.0, 9.0, 12.0, 11.0, 9.0, 3.0, 10.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.5234375, -5.3604736328125, -5.197509765625, -5.0345458984375, -4.87158203125, -4.7086181640625, -4.545654296875, -4.3826904296875, -4.2197265625, -4.0567626953125, -3.893798828125, -3.7308349609375, -3.56787109375, -3.4049072265625, -3.241943359375, -3.0789794921875, -2.916015625, -2.7530517578125, -2.590087890625, -2.4271240234375, -2.26416015625, -2.1011962890625, -1.938232421875, -1.7752685546875, -1.6123046875, -1.4493408203125, -1.286376953125, -1.1234130859375, -0.96044921875, -0.7974853515625, -0.634521484375, -0.4715576171875, -0.30859375, -0.1456298828125, 0.017333984375, 0.1802978515625, 0.34326171875, 0.5062255859375, 0.669189453125, 0.8321533203125, 0.9951171875, 1.1580810546875, 1.321044921875, 1.4840087890625, 1.64697265625, 1.8099365234375, 1.972900390625, 2.1358642578125, 2.298828125, 2.4617919921875, 2.624755859375, 2.7877197265625, 2.95068359375, 3.1136474609375, 3.276611328125, 3.4395751953125, 3.6025390625, 3.7655029296875, 3.928466796875, 4.0914306640625, 4.25439453125, 4.4173583984375, 4.580322265625, 4.7432861328125, 4.90625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 5.0, 15.0, 21.0, 29.0, 32.0, 59.0, 54.0, 101.0, 169.0, 246.0, 417.0, 679.0, 1149.0, 2235.0, 4938.0, 13622.0, 54258.0, 288009.0, 523549.0, 119285.0, 25176.0, 7556.0, 2989.0, 1501.0, 926.0, 525.0, 304.0, 233.0, 142.0, 105.0, 75.0, 42.0, 30.0, 17.0, 12.0, 12.0, 14.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.06711673736572266, -0.06489753723144531, -0.06267833709716797, -0.060459136962890625, -0.05823993682861328, -0.05602073669433594, -0.053801536560058594, -0.05158233642578125, -0.049363136291503906, -0.04714393615722656, -0.04492473602294922, -0.042705535888671875, -0.04048633575439453, -0.03826713562011719, -0.036047935485839844, -0.0338287353515625, -0.031609535217285156, -0.029390335083007812, -0.02717113494873047, -0.024951934814453125, -0.02273273468017578, -0.020513534545898438, -0.018294334411621094, -0.01607513427734375, -0.013855934143066406, -0.011636734008789062, -0.009417533874511719, -0.007198333740234375, -0.004979133605957031, -0.0027599334716796875, -0.0005407333374023438, 0.001678466796875, 0.0038976669311523438, 0.0061168670654296875, 0.008336067199707031, 0.010555267333984375, 0.012774467468261719, 0.014993667602539062, 0.017212867736816406, 0.01943206787109375, 0.021651268005371094, 0.023870468139648438, 0.02608966827392578, 0.028308868408203125, 0.03052806854248047, 0.03274726867675781, 0.034966468811035156, 0.0371856689453125, 0.039404869079589844, 0.04162406921386719, 0.04384326934814453, 0.046062469482421875, 0.04828166961669922, 0.05050086975097656, 0.052720069885253906, 0.05493927001953125, 0.057158470153808594, 0.05937767028808594, 0.06159687042236328, 0.06381607055664062, 0.06603527069091797, 0.06825447082519531, 0.07047367095947266, 0.07269287109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 11.0, 11.0, 22.0, 17.0, 42.0, 60.0, 96.0, 136.0, 140.0, 138.0, 120.0, 80.0, 46.0, 30.0, 27.0, 11.0, 8.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.476308822631836e-05, -4.235748201608658e-05, -3.99518758058548e-05, -3.7546269595623016e-05, -3.5140663385391235e-05, -3.2735057175159454e-05, -3.0329450964927673e-05, -2.7923844754695892e-05, -2.551823854446411e-05, -2.311263233423233e-05, -2.070702612400055e-05, -1.830141991376877e-05, -1.5895813703536987e-05, -1.3490207493305206e-05, -1.1084601283073425e-05, -8.678995072841644e-06, -6.273388862609863e-06, -3.867782652378082e-06, -1.4621764421463013e-06, 9.434297680854797e-07, 3.3490359783172607e-06, 5.754642188549042e-06, 8.160248398780823e-06, 1.0565854609012604e-05, 1.2971460819244385e-05, 1.5377067029476166e-05, 1.7782673239707947e-05, 2.0188279449939728e-05, 2.259388566017151e-05, 2.499949187040329e-05, 2.740509808063507e-05, 2.9810704290866852e-05, 3.221631050109863e-05, 3.4621916711330414e-05, 3.7027522921562195e-05, 3.9433129131793976e-05, 4.183873534202576e-05, 4.424434155225754e-05, 4.664994776248932e-05, 4.90555539727211e-05, 5.146116018295288e-05, 5.386676639318466e-05, 5.627237260341644e-05, 5.8677978813648224e-05, 6.108358502388e-05, 6.348919123411179e-05, 6.589479744434357e-05, 6.830040365457535e-05, 7.070600986480713e-05, 7.311161607503891e-05, 7.551722228527069e-05, 7.792282849550247e-05, 8.032843470573425e-05, 8.273404091596603e-05, 8.513964712619781e-05, 8.75452533364296e-05, 8.995085954666138e-05, 9.235646575689316e-05, 9.476207196712494e-05, 9.716767817735672e-05, 9.95732843875885e-05, 0.00010197889059782028, 0.00010438449680805206, 0.00010679010301828384, 0.00010919570922851562]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 8.0, 3.0, 4.0, 6.0, 6.0, 5.0, 8.0, 10.0, 13.0, 15.0, 17.0, 30.0, 46.0, 60.0, 84.0, 144.0, 242.0, 468.0, 994.0, 2383.0, 6414.0, 25242.0, 177384.0, 661682.0, 141928.0, 21471.0, 5798.0, 2065.0, 945.0, 422.0, 223.0, 123.0, 97.0, 51.0, 39.0, 29.0, 23.0, 12.0, 14.0, 17.0, 9.0, 6.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07769775390625, -0.07486724853515625, -0.0720367431640625, -0.06920623779296875, -0.066375732421875, -0.06354522705078125, -0.0607147216796875, -0.05788421630859375, -0.0550537109375, -0.05222320556640625, -0.0493927001953125, -0.04656219482421875, -0.043731689453125, -0.04090118408203125, -0.0380706787109375, -0.03524017333984375, -0.03240966796875, -0.02957916259765625, -0.0267486572265625, -0.02391815185546875, -0.021087646484375, -0.01825714111328125, -0.0154266357421875, -0.01259613037109375, -0.009765625, -0.00693511962890625, -0.0041046142578125, -0.00127410888671875, 0.001556396484375, 0.00438690185546875, 0.0072174072265625, 0.01004791259765625, 0.01287841796875, 0.01570892333984375, 0.0185394287109375, 0.02136993408203125, 0.024200439453125, 0.02703094482421875, 0.0298614501953125, 0.03269195556640625, 0.0355224609375, 0.03835296630859375, 0.0411834716796875, 0.04401397705078125, 0.046844482421875, 0.04967498779296875, 0.0525054931640625, 0.05533599853515625, 0.05816650390625, 0.06099700927734375, 0.0638275146484375, 0.06665802001953125, 0.069488525390625, 0.07231903076171875, 0.0751495361328125, 0.07798004150390625, 0.080810546875, 0.08364105224609375, 0.0864715576171875, 0.08930206298828125, 0.092132568359375, 0.09496307373046875, 0.0977935791015625, 0.10062408447265625, 0.10345458984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 8.0, 2.0, 5.0, 11.0, 7.0, 8.0, 6.0, 10.0, 15.0, 21.0, 21.0, 31.0, 36.0, 59.0, 77.0, 97.0, 90.0, 110.0, 96.0, 68.0, 47.0, 39.0, 24.0, 22.0, 16.0, 10.0, 12.0, 7.0, 12.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0248870849609375, -0.02419281005859375, -0.02349853515625, -0.02280426025390625, -0.0221099853515625, -0.02141571044921875, -0.020721435546875, -0.02002716064453125, -0.0193328857421875, -0.01863861083984375, -0.0179443359375, -0.01725006103515625, -0.0165557861328125, -0.01586151123046875, -0.015167236328125, -0.01447296142578125, -0.0137786865234375, -0.01308441162109375, -0.01239013671875, -0.01169586181640625, -0.0110015869140625, -0.01030731201171875, -0.009613037109375, -0.00891876220703125, -0.0082244873046875, -0.00753021240234375, -0.0068359375, -0.00614166259765625, -0.0054473876953125, -0.00475311279296875, -0.004058837890625, -0.00336456298828125, -0.0026702880859375, -0.00197601318359375, -0.00128173828125, -0.00058746337890625, 0.0001068115234375, 0.00080108642578125, 0.001495361328125, 0.00218963623046875, 0.0028839111328125, 0.00357818603515625, 0.0042724609375, 0.00496673583984375, 0.0056610107421875, 0.00635528564453125, 0.007049560546875, 0.00774383544921875, 0.0084381103515625, 0.00913238525390625, 0.00982666015625, 0.01052093505859375, 0.0112152099609375, 0.01190948486328125, 0.012603759765625, 0.01329803466796875, 0.0139923095703125, 0.01468658447265625, 0.015380859375, 0.01607513427734375, 0.0167694091796875, 0.01746368408203125, 0.018157958984375, 0.01885223388671875, 0.0195465087890625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 33.0, 377.0, 504.0, 94.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.115140438079834, -3.3225979804992676, -2.530055522918701, -1.7375133037567139, -0.9449708461761475, -0.15242838859558105, 0.6401138305664062, 1.4326562881469727, 2.225198745727539, 3.0177412033081055, 3.810283660888672, 4.602826118469238, 5.395368576049805, 6.187911033630371, 6.980453014373779, 7.772995471954346, 8.56553840637207, 9.358080863952637, 10.150623321533203, 10.94316577911377, 11.735708236694336, 12.528250694274902, 13.320793151855469, 14.113334655761719, 14.905877113342285, 15.698419570922852, 16.4909610748291, 17.283504486083984, 18.076045989990234, 18.868589401245117, 19.661130905151367, 20.45367431640625, 21.246217727661133, 22.038759231567383, 22.831302642822266, 23.623844146728516, 24.4163875579834, 25.20892906188965, 26.00147247314453, 26.79401397705078, 27.586557388305664, 28.379098892211914, 29.171642303466797, 29.964183807373047, 30.75672721862793, 31.54926872253418, 32.34181213378906, 33.13435363769531, 33.92689514160156, 34.71943664550781, 35.51197814941406, 36.30452346801758, 37.09706497192383, 37.88960647583008, 38.68214797973633, 39.474693298339844, 40.267234802246094, 41.059776306152344, 41.852317810058594, 42.64486312866211, 43.43740463256836, 44.22994613647461, 45.02248764038086, 45.815032958984375, 46.607574462890625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 12.0, 9.0, 13.0, 14.0, 15.0, 21.0, 24.0, 37.0, 25.0, 39.0, 26.0, 46.0, 53.0, 50.0, 42.0, 35.0, 48.0, 45.0, 41.0, 48.0, 44.0, 33.0, 41.0, 41.0, 29.0, 23.0, 23.0, 15.0, 12.0, 14.0, 14.0, 13.0, 10.0, 12.0, 7.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.805190086364746, -2.7237672805786133, -2.6423444747924805, -2.5609216690063477, -2.479498863220215, -2.398076057434082, -2.316653251647949, -2.2352304458618164, -2.1538076400756836, -2.072384834289551, -1.990962028503418, -1.9095392227172852, -1.8281164169311523, -1.7466936111450195, -1.6652709245681763, -1.5838481187820435, -1.5024254322052002, -1.4210026264190674, -1.3395798206329346, -1.2581570148468018, -1.176734209060669, -1.0953114032745361, -1.0138887166976929, -0.9324659109115601, -0.8510431051254272, -0.7696202993392944, -0.6881974935531616, -0.6067747473716736, -0.5253519415855408, -0.44392913579940796, -0.36250635981559753, -0.2810835838317871, -0.1996607780456543, -0.11823798716068268, -0.03681519627571106, 0.04460759460926056, 0.12603038549423218, 0.207453191280365, 0.2888759672641754, 0.37029874324798584, 0.45172154903411865, 0.5331443548202515, 0.6145671606063843, 0.6959899067878723, 0.7774127125740051, 0.8588355183601379, 0.940258264541626, 1.0216810703277588, 1.1031038761138916, 1.1845266819000244, 1.2659494876861572, 1.34737229347229, 1.4287950992584229, 1.5102179050445557, 1.591640591621399, 1.6730633974075317, 1.7544862031936646, 1.8359090089797974, 1.9173318147659302, 1.998754620552063, 2.0801773071289062, 2.161600112915039, 2.243022918701172, 2.3244457244873047, 2.4058685302734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 5.0, 2.0, 6.0, 6.0, 7.0, 13.0, 17.0, 17.0, 49.0, 54.0, 112.0, 187.0, 305.0, 648.0, 1262.0, 3448.0, 9484.0, 28044.0, 82716.0, 230338.0, 378247.0, 203611.0, 72257.0, 24108.0, 8061.0, 3049.0, 1224.0, 555.0, 263.0, 170.0, 102.0, 55.0, 42.0, 25.0, 19.0, 16.0, 7.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.875, -2.783538818359375, -2.69207763671875, -2.600616455078125, -2.5091552734375, -2.417694091796875, -2.32623291015625, -2.234771728515625, -2.143310546875, -2.051849365234375, -1.96038818359375, -1.868927001953125, -1.7774658203125, -1.686004638671875, -1.59454345703125, -1.503082275390625, -1.41162109375, -1.320159912109375, -1.22869873046875, -1.137237548828125, -1.0457763671875, -0.954315185546875, -0.86285400390625, -0.771392822265625, -0.679931640625, -0.588470458984375, -0.49700927734375, -0.405548095703125, -0.3140869140625, -0.222625732421875, -0.13116455078125, -0.039703369140625, 0.0517578125, 0.143218994140625, 0.23468017578125, 0.326141357421875, 0.4176025390625, 0.509063720703125, 0.60052490234375, 0.691986083984375, 0.783447265625, 0.874908447265625, 0.96636962890625, 1.057830810546875, 1.1492919921875, 1.240753173828125, 1.33221435546875, 1.423675537109375, 1.51513671875, 1.606597900390625, 1.69805908203125, 1.789520263671875, 1.8809814453125, 1.972442626953125, 2.06390380859375, 2.155364990234375, 2.246826171875, 2.338287353515625, 2.42974853515625, 2.521209716796875, 2.6126708984375, 2.704132080078125, 2.79559326171875, 2.887054443359375, 2.978515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 5.0, 4.0, 10.0, 6.0, 7.0, 16.0, 13.0, 16.0, 19.0, 17.0, 30.0, 31.0, 32.0, 31.0, 37.0, 32.0, 38.0, 43.0, 48.0, 42.0, 49.0, 36.0, 26.0, 40.0, 37.0, 27.0, 47.0, 26.0, 30.0, 28.0, 24.0, 26.0, 17.0, 11.0, 13.0, 11.0, 15.0, 9.0, 9.0, 8.0, 6.0, 6.0, 10.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.4765625, -4.3443603515625, -4.212158203125, -4.0799560546875, -3.94775390625, -3.8155517578125, -3.683349609375, -3.5511474609375, -3.4189453125, -3.2867431640625, -3.154541015625, -3.0223388671875, -2.89013671875, -2.7579345703125, -2.625732421875, -2.4935302734375, -2.361328125, -2.2291259765625, -2.096923828125, -1.9647216796875, -1.83251953125, -1.7003173828125, -1.568115234375, -1.4359130859375, -1.3037109375, -1.1715087890625, -1.039306640625, -0.9071044921875, -0.77490234375, -0.6427001953125, -0.510498046875, -0.3782958984375, -0.24609375, -0.1138916015625, 0.018310546875, 0.1505126953125, 0.28271484375, 0.4149169921875, 0.547119140625, 0.6793212890625, 0.8115234375, 0.9437255859375, 1.075927734375, 1.2081298828125, 1.34033203125, 1.4725341796875, 1.604736328125, 1.7369384765625, 1.869140625, 2.0013427734375, 2.133544921875, 2.2657470703125, 2.39794921875, 2.5301513671875, 2.662353515625, 2.7945556640625, 2.9267578125, 3.0589599609375, 3.191162109375, 3.3233642578125, 3.45556640625, 3.5877685546875, 3.719970703125, 3.8521728515625, 3.984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 6.0, 7.0, 5.0, 12.0, 16.0, 16.0, 21.0, 28.0, 34.0, 34.0, 84.0, 134.0, 204.0, 407.0, 1464.0, 127450.0, 907923.0, 9227.0, 680.0, 300.0, 144.0, 90.0, 67.0, 45.0, 44.0, 22.0, 18.0, 9.0, 11.0, 12.0, 12.0, 5.0, 4.0, 3.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.765625, -13.3253173828125, -12.885009765625, -12.4447021484375, -12.00439453125, -11.5640869140625, -11.123779296875, -10.6834716796875, -10.2431640625, -9.8028564453125, -9.362548828125, -8.9222412109375, -8.48193359375, -8.0416259765625, -7.601318359375, -7.1610107421875, -6.720703125, -6.2803955078125, -5.840087890625, -5.3997802734375, -4.95947265625, -4.5191650390625, -4.078857421875, -3.6385498046875, -3.1982421875, -2.7579345703125, -2.317626953125, -1.8773193359375, -1.43701171875, -0.9967041015625, -0.556396484375, -0.1160888671875, 0.32421875, 0.7645263671875, 1.204833984375, 1.6451416015625, 2.08544921875, 2.5257568359375, 2.966064453125, 3.4063720703125, 3.8466796875, 4.2869873046875, 4.727294921875, 5.1676025390625, 5.60791015625, 6.0482177734375, 6.488525390625, 6.9288330078125, 7.369140625, 7.8094482421875, 8.249755859375, 8.6900634765625, 9.13037109375, 9.5706787109375, 10.010986328125, 10.4512939453125, 10.8916015625, 11.3319091796875, 11.772216796875, 12.2125244140625, 12.65283203125, 13.0931396484375, 13.533447265625, 13.9737548828125, 14.4140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 3.0, 7.0, 3.0, 5.0, 4.0, 8.0, 6.0, 9.0, 15.0, 15.0, 16.0, 14.0, 14.0, 15.0, 31.0, 23.0, 32.0, 35.0, 30.0, 37.0, 45.0, 33.0, 49.0, 37.0, 38.0, 56.0, 36.0, 34.0, 43.0, 41.0, 38.0, 34.0, 31.0, 26.0, 26.0, 20.0, 14.0, 15.0, 14.0, 8.0, 7.0, 8.0, 8.0, 9.0, 1.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.5517578125, -4.384765625, -4.2177734375, -4.05078125, -3.8837890625, -3.716796875, -3.5498046875, -3.3828125, -3.2158203125, -3.048828125, -2.8818359375, -2.71484375, -2.5478515625, -2.380859375, -2.2138671875, -2.046875, -1.8798828125, -1.712890625, -1.5458984375, -1.37890625, -1.2119140625, -1.044921875, -0.8779296875, -0.7109375, -0.5439453125, -0.376953125, -0.2099609375, -0.04296875, 0.1240234375, 0.291015625, 0.4580078125, 0.625, 0.7919921875, 0.958984375, 1.1259765625, 1.29296875, 1.4599609375, 1.626953125, 1.7939453125, 1.9609375, 2.1279296875, 2.294921875, 2.4619140625, 2.62890625, 2.7958984375, 2.962890625, 3.1298828125, 3.296875, 3.4638671875, 3.630859375, 3.7978515625, 3.96484375, 4.1318359375, 4.298828125, 4.4658203125, 4.6328125, 4.7998046875, 4.966796875, 5.1337890625, 5.30078125, 5.4677734375, 5.634765625, 5.8017578125, 5.96875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 2.0, 3.0, 9.0, 8.0, 24.0, 26.0, 81.0, 283.0, 3141.0, 898044.0, 145098.0, 1507.0, 196.0, 59.0, 26.0, 12.0, 12.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.788330078125, -7.49853515625, -7.208740234375, -6.9189453125, -6.629150390625, -6.33935546875, -6.049560546875, -5.759765625, -5.469970703125, -5.18017578125, -4.890380859375, -4.6005859375, -4.310791015625, -4.02099609375, -3.731201171875, -3.44140625, -3.151611328125, -2.86181640625, -2.572021484375, -2.2822265625, -1.992431640625, -1.70263671875, -1.412841796875, -1.123046875, -0.833251953125, -0.54345703125, -0.253662109375, 0.0361328125, 0.325927734375, 0.61572265625, 0.905517578125, 1.1953125, 1.485107421875, 1.77490234375, 2.064697265625, 2.3544921875, 2.644287109375, 2.93408203125, 3.223876953125, 3.513671875, 3.803466796875, 4.09326171875, 4.383056640625, 4.6728515625, 4.962646484375, 5.25244140625, 5.542236328125, 5.83203125, 6.121826171875, 6.41162109375, 6.701416015625, 6.9912109375, 7.281005859375, 7.57080078125, 7.860595703125, 8.150390625, 8.440185546875, 8.72998046875, 9.019775390625, 9.3095703125, 9.599365234375, 9.88916015625, 10.178955078125, 10.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 4.0, 7.0, 9.0, 12.0, 16.0, 32.0, 51.0, 67.0, 115.0, 158.0, 121.0, 105.0, 117.0, 72.0, 34.0, 34.0, 15.0, 9.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0005197525024414062, -0.0005080327391624451, -0.0004963129758834839, -0.0004845932126045227, -0.0004728734493255615, -0.00046115368604660034, -0.00044943392276763916, -0.000437714159488678, -0.0004259943962097168, -0.0004142746329307556, -0.00040255486965179443, -0.00039083510637283325, -0.00037911534309387207, -0.0003673955798149109, -0.0003556758165359497, -0.0003439560532569885, -0.00033223628997802734, -0.00032051652669906616, -0.000308796763420105, -0.0002970770001411438, -0.0002853572368621826, -0.00027363747358322144, -0.00026191771030426025, -0.00025019794702529907, -0.0002384781837463379, -0.0002267584204673767, -0.00021503865718841553, -0.00020331889390945435, -0.00019159913063049316, -0.00017987936735153198, -0.0001681596040725708, -0.00015643984079360962, -0.00014472007751464844, -0.00013300031423568726, -0.00012128055095672607, -0.00010956078767776489, -9.784102439880371e-05, -8.612126111984253e-05, -7.440149784088135e-05, -6.268173456192017e-05, -5.0961971282958984e-05, -3.92422080039978e-05, -2.752244472503662e-05, -1.580268144607544e-05, -4.082918167114258e-06, 7.636845111846924e-06, 1.9356608390808105e-05, 3.107637166976929e-05, 4.279613494873047e-05, 5.451589822769165e-05, 6.623566150665283e-05, 7.795542478561401e-05, 8.96751880645752e-05, 0.00010139495134353638, 0.00011311471462249756, 0.00012483447790145874, 0.00013655424118041992, 0.0001482740044593811, 0.00015999376773834229, 0.00017171353101730347, 0.00018343329429626465, 0.00019515305757522583, 0.000206872820854187, 0.0002185925841331482, 0.00023031234741210938]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 9.0, 7.0, 25.0, 100.0, 429.0, 4252.0, 1031823.0, 10995.0, 700.0, 141.0, 25.0, 11.0, 9.0, 14.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.46484375, -7.06402587890625, -6.6632080078125, -6.26239013671875, -5.861572265625, -5.46075439453125, -5.0599365234375, -4.65911865234375, -4.25830078125, -3.85748291015625, -3.4566650390625, -3.05584716796875, -2.655029296875, -2.25421142578125, -1.8533935546875, -1.45257568359375, -1.0517578125, -0.65093994140625, -0.2501220703125, 0.15069580078125, 0.551513671875, 0.95233154296875, 1.3531494140625, 1.75396728515625, 2.15478515625, 2.55560302734375, 2.9564208984375, 3.35723876953125, 3.758056640625, 4.15887451171875, 4.5596923828125, 4.96051025390625, 5.361328125, 5.76214599609375, 6.1629638671875, 6.56378173828125, 6.964599609375, 7.36541748046875, 7.7662353515625, 8.16705322265625, 8.56787109375, 8.96868896484375, 9.3695068359375, 9.77032470703125, 10.171142578125, 10.57196044921875, 10.9727783203125, 11.37359619140625, 11.7744140625, 12.17523193359375, 12.5760498046875, 12.97686767578125, 13.377685546875, 13.77850341796875, 14.1793212890625, 14.58013916015625, 14.98095703125, 15.38177490234375, 15.7825927734375, 16.18341064453125, 16.584228515625, 16.98504638671875, 17.3858642578125, 17.78668212890625, 18.1875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 5.0, 6.0, 12.0, 31.0, 74.0, 119.0, 166.0, 183.0, 169.0, 108.0, 55.0, 33.0, 16.0, 9.0, 9.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.359375, -2.3096771240234375, -2.259979248046875, -2.2102813720703125, -2.16058349609375, -2.1108856201171875, -2.061187744140625, -2.0114898681640625, -1.9617919921875, -1.9120941162109375, -1.862396240234375, -1.8126983642578125, -1.76300048828125, -1.7133026123046875, -1.663604736328125, -1.6139068603515625, -1.564208984375, -1.5145111083984375, -1.464813232421875, -1.4151153564453125, -1.36541748046875, -1.3157196044921875, -1.266021728515625, -1.2163238525390625, -1.1666259765625, -1.1169281005859375, -1.067230224609375, -1.0175323486328125, -0.96783447265625, -0.9181365966796875, -0.868438720703125, -0.8187408447265625, -0.76904296875, -0.7193450927734375, -0.669647216796875, -0.6199493408203125, -0.57025146484375, -0.5205535888671875, -0.470855712890625, -0.4211578369140625, -0.3714599609375, -0.3217620849609375, -0.272064208984375, -0.2223663330078125, -0.17266845703125, -0.1229705810546875, -0.073272705078125, -0.0235748291015625, 0.026123046875, 0.0758209228515625, 0.125518798828125, 0.1752166748046875, 0.22491455078125, 0.2746124267578125, 0.324310302734375, 0.3740081787109375, 0.4237060546875, 0.4734039306640625, 0.523101806640625, 0.5727996826171875, 0.62249755859375, 0.6721954345703125, 0.721893310546875, 0.7715911865234375, 0.8212890625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 28.0, 115.0, 260.0, 305.0, 206.0, 66.0, 14.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.10279846191406, -34.32930374145508, -33.555809020996094, -32.782310485839844, -32.00881576538086, -31.235321044921875, -30.46182632446289, -29.688329696655273, -28.91483497619629, -28.141340255737305, -27.367843627929688, -26.594348907470703, -25.820852279663086, -25.0473575592041, -24.273860931396484, -23.5003662109375, -22.726871490478516, -21.95337677001953, -21.179880142211914, -20.40638542175293, -19.632888793945312, -18.859394073486328, -18.085899353027344, -17.312402725219727, -16.53890609741211, -15.765410423278809, -14.991914749145508, -14.218420028686523, -13.444924354553223, -12.671428680419922, -11.897933006286621, -11.12443733215332, -10.350943565368652, -9.577447891235352, -8.80395221710205, -8.03045654296875, -7.256961822509766, -6.483466148376465, -5.709970474243164, -4.9364752769470215, -4.162979602813721, -3.389484167098999, -2.6159887313842773, -1.8424930572509766, -1.0689976215362549, -0.2955021858215332, 0.4779934883117676, 1.2514886856079102, 2.024984359741211, 2.7984797954559326, 3.5719752311706543, 4.345470905303955, 5.118966102600098, 5.892461776733398, 6.665957450866699, 7.439452648162842, 8.212947845458984, 8.986443519592285, 9.759939193725586, 10.53343391418457, 11.306929588317871, 12.080425262451172, 12.853920936584473, 13.627416610717773, 14.400912284851074]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 3.0, 6.0, 10.0, 14.0, 11.0, 13.0, 22.0, 16.0, 21.0, 29.0, 27.0, 23.0, 42.0, 37.0, 38.0, 46.0, 48.0, 36.0, 40.0, 53.0, 44.0, 43.0, 32.0, 40.0, 35.0, 32.0, 39.0, 38.0, 24.0, 21.0, 18.0, 18.0, 14.0, 15.0, 14.0, 3.0, 8.0, 7.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.418083190917969, -9.104279518127441, -8.79047679901123, -8.476673126220703, -8.162870407104492, -7.849066734313965, -7.5352630615234375, -7.221459865570068, -6.907656669616699, -6.59385347366333, -6.280050277709961, -5.966246604919434, -5.6524434089660645, -5.338640213012695, -5.024836540222168, -4.711033344268799, -4.39723014831543, -4.0834269523620605, -3.7696235179901123, -3.455820083618164, -3.142016887664795, -2.828213691711426, -2.5144102573394775, -2.2006068229675293, -1.8868036270141602, -1.5730003118515015, -1.2591969966888428, -0.9453936815261841, -0.6315903663635254, -0.3177870512008667, -0.003983736038208008, 0.30981969833374023, 0.6236228942871094, 0.9374262094497681, 1.2512295246124268, 1.5650328397750854, 1.8788361549377441, 2.1926393508911133, 2.5064427852630615, 2.8202462196350098, 3.134049415588379, 3.447852611541748, 3.7616560459136963, 4.0754594802856445, 4.389262676239014, 4.703065872192383, 5.01686954498291, 5.330672740936279, 5.644475936889648, 5.958279132843018, 6.272082328796387, 6.585886001586914, 6.899689197540283, 7.213492393493652, 7.52729606628418, 7.841099262237549, 8.154902458190918, 8.468706130981445, 8.782508850097656, 9.096312522888184, 9.410116195678711, 9.723918914794922, 10.03772258758545, 10.351526260375977, 10.665328979492188]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 10.0, 28.0, 34.0, 47.0, 93.0, 162.0, 272.0, 680.0, 2679.0, 26353.0, 675018.0, 3139461.0, 330936.0, 15327.0, 1904.0, 590.0, 258.0, 144.0, 104.0, 68.0, 27.0, 24.0, 17.0, 14.0, 11.0, 4.0, 6.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80078125, -4.53973388671875, -4.2786865234375, -4.01763916015625, -3.756591796875, -3.49554443359375, -3.2344970703125, -2.97344970703125, -2.71240234375, -2.45135498046875, -2.1903076171875, -1.92926025390625, -1.668212890625, -1.40716552734375, -1.1461181640625, -0.88507080078125, -0.6240234375, -0.36297607421875, -0.1019287109375, 0.15911865234375, 0.420166015625, 0.68121337890625, 0.9422607421875, 1.20330810546875, 1.46435546875, 1.72540283203125, 1.9864501953125, 2.24749755859375, 2.508544921875, 2.76959228515625, 3.0306396484375, 3.29168701171875, 3.552734375, 3.81378173828125, 4.0748291015625, 4.33587646484375, 4.596923828125, 4.85797119140625, 5.1190185546875, 5.38006591796875, 5.64111328125, 5.90216064453125, 6.1632080078125, 6.42425537109375, 6.685302734375, 6.94635009765625, 7.2073974609375, 7.46844482421875, 7.7294921875, 7.99053955078125, 8.2515869140625, 8.51263427734375, 8.773681640625, 9.03472900390625, 9.2957763671875, 9.55682373046875, 9.81787109375, 10.07891845703125, 10.3399658203125, 10.60101318359375, 10.862060546875, 11.12310791015625, 11.3841552734375, 11.64520263671875, 11.90625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 9.0, 14.0, 8.0, 12.0, 15.0, 14.0, 24.0, 22.0, 31.0, 30.0, 30.0, 28.0, 31.0, 34.0, 38.0, 42.0, 45.0, 38.0, 40.0, 41.0, 54.0, 52.0, 36.0, 32.0, 33.0, 36.0, 21.0, 40.0, 17.0, 13.0, 17.0, 18.0, 15.0, 9.0, 8.0, 0.0, 8.0, 13.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.998046875, -2.90179443359375, -2.8055419921875, -2.70928955078125, -2.613037109375, -2.51678466796875, -2.4205322265625, -2.32427978515625, -2.22802734375, -2.13177490234375, -2.0355224609375, -1.93927001953125, -1.843017578125, -1.74676513671875, -1.6505126953125, -1.55426025390625, -1.4580078125, -1.36175537109375, -1.2655029296875, -1.16925048828125, -1.072998046875, -0.97674560546875, -0.8804931640625, -0.78424072265625, -0.68798828125, -0.59173583984375, -0.4954833984375, -0.39923095703125, -0.302978515625, -0.20672607421875, -0.1104736328125, -0.01422119140625, 0.08203125, 0.17828369140625, 0.2745361328125, 0.37078857421875, 0.467041015625, 0.56329345703125, 0.6595458984375, 0.75579833984375, 0.85205078125, 0.94830322265625, 1.0445556640625, 1.14080810546875, 1.237060546875, 1.33331298828125, 1.4295654296875, 1.52581787109375, 1.6220703125, 1.71832275390625, 1.8145751953125, 1.91082763671875, 2.007080078125, 2.10333251953125, 2.1995849609375, 2.29583740234375, 2.39208984375, 2.48834228515625, 2.5845947265625, 2.68084716796875, 2.777099609375, 2.87335205078125, 2.9696044921875, 3.06585693359375, 3.162109375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 13.0, 20.0, 15.0, 22.0, 36.0, 39.0, 62.0, 87.0, 146.0, 224.0, 474.0, 923.0, 2361.0, 10597.0, 149450.0, 3495267.0, 508173.0, 20429.0, 3346.0, 1195.0, 544.0, 325.0, 178.0, 101.0, 93.0, 42.0, 38.0, 24.0, 12.0, 6.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.59222412109375, -7.3446044921875, -7.09698486328125, -6.849365234375, -6.60174560546875, -6.3541259765625, -6.10650634765625, -5.85888671875, -5.61126708984375, -5.3636474609375, -5.11602783203125, -4.868408203125, -4.62078857421875, -4.3731689453125, -4.12554931640625, -3.8779296875, -3.63031005859375, -3.3826904296875, -3.13507080078125, -2.887451171875, -2.63983154296875, -2.3922119140625, -2.14459228515625, -1.89697265625, -1.64935302734375, -1.4017333984375, -1.15411376953125, -0.906494140625, -0.65887451171875, -0.4112548828125, -0.16363525390625, 0.083984375, 0.33160400390625, 0.5792236328125, 0.82684326171875, 1.074462890625, 1.32208251953125, 1.5697021484375, 1.81732177734375, 2.06494140625, 2.31256103515625, 2.5601806640625, 2.80780029296875, 3.055419921875, 3.30303955078125, 3.5506591796875, 3.79827880859375, 4.0458984375, 4.29351806640625, 4.5411376953125, 4.78875732421875, 5.036376953125, 5.28399658203125, 5.5316162109375, 5.77923583984375, 6.02685546875, 6.27447509765625, 6.5220947265625, 6.76971435546875, 7.017333984375, 7.26495361328125, 7.5125732421875, 7.76019287109375, 8.0078125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 8.0, 13.0, 20.0, 35.0, 37.0, 60.0, 73.0, 97.0, 151.0, 232.0, 366.0, 463.0, 552.0, 511.0, 422.0, 339.0, 220.0, 144.0, 88.0, 71.0, 45.0, 22.0, 30.0, 21.0, 11.0, 14.0, 8.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.603515625, -1.5516510009765625, -1.499786376953125, -1.4479217529296875, -1.39605712890625, -1.3441925048828125, -1.292327880859375, -1.2404632568359375, -1.1885986328125, -1.1367340087890625, -1.084869384765625, -1.0330047607421875, -0.98114013671875, -0.9292755126953125, -0.877410888671875, -0.8255462646484375, -0.773681640625, -0.7218170166015625, -0.669952392578125, -0.6180877685546875, -0.56622314453125, -0.5143585205078125, -0.462493896484375, -0.4106292724609375, -0.3587646484375, -0.3069000244140625, -0.255035400390625, -0.2031707763671875, -0.15130615234375, -0.0994415283203125, -0.047576904296875, 0.0042877197265625, 0.05615234375, 0.1080169677734375, 0.159881591796875, 0.2117462158203125, 0.26361083984375, 0.3154754638671875, 0.367340087890625, 0.4192047119140625, 0.4710693359375, 0.5229339599609375, 0.574798583984375, 0.6266632080078125, 0.67852783203125, 0.7303924560546875, 0.782257080078125, 0.8341217041015625, 0.885986328125, 0.9378509521484375, 0.989715576171875, 1.0415802001953125, 1.09344482421875, 1.1453094482421875, 1.197174072265625, 1.2490386962890625, 1.3009033203125, 1.3527679443359375, 1.404632568359375, 1.4564971923828125, 1.50836181640625, 1.5602264404296875, 1.612091064453125, 1.6639556884765625, 1.7158203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 17.0, 41.0, 60.0, 110.0, 150.0, 167.0, 175.0, 131.0, 72.0, 49.0, 15.0, 8.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.792973041534424, -4.444838047027588, -4.096703052520752, -3.748568058013916, -3.40043306350708, -3.052298069000244, -2.7041633129119873, -2.3560283184051514, -2.0078933238983154, -1.6597583293914795, -1.3116233348846436, -0.9634884595870972, -0.6153534650802612, -0.2672184705734253, 0.0809164047241211, 0.42905139923095703, 0.777186393737793, 1.125321388244629, 1.4734563827514648, 1.8215912580490112, 2.1697263717651367, 2.5178613662719727, 2.8659961223602295, 3.2141311168670654, 3.5622661113739014, 3.9104011058807373, 4.258535861968994, 4.60667085647583, 4.954805850982666, 5.302940845489502, 5.651075839996338, 5.999210834503174, 6.347346305847168, 6.695481300354004, 7.04361629486084, 7.391751289367676, 7.739886283874512, 8.088021278381348, 8.436156272888184, 8.78429126739502, 9.132426261901855, 9.480561256408691, 9.828696250915527, 10.176831245422363, 10.5249662399292, 10.873101234436035, 11.221236228942871, 11.569371223449707, 11.917505264282227, 12.265640258789062, 12.613775253295898, 12.961910247802734, 13.31004524230957, 13.658180236816406, 14.006315231323242, 14.354450225830078, 14.702585220336914, 15.05072021484375, 15.398855209350586, 15.746990203857422, 16.095125198364258, 16.443260192871094, 16.79139518737793, 17.139530181884766, 17.4876651763916]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 5.0, 11.0, 6.0, 8.0, 8.0, 9.0, 14.0, 12.0, 20.0, 23.0, 20.0, 20.0, 21.0, 36.0, 34.0, 45.0, 38.0, 45.0, 50.0, 49.0, 41.0, 36.0, 34.0, 44.0, 47.0, 30.0, 32.0, 31.0, 30.0, 31.0, 17.0, 24.0, 20.0, 20.0, 14.0, 12.0, 9.0, 15.0, 9.0, 9.0, 3.0, 4.0, 9.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.63140606880188, -3.526221752166748, -3.4210376739501953, -3.3158533573150635, -3.2106690406799316, -3.105484962463379, -3.000300645828247, -2.8951163291931152, -2.7899322509765625, -2.6847479343414307, -2.579563856124878, -2.474379539489746, -2.3691954612731934, -2.2640111446380615, -2.1588268280029297, -2.053642749786377, -1.9484584331512451, -1.8432742357254028, -1.7380900382995605, -1.6329057216644287, -1.5277215242385864, -1.4225373268127441, -1.3173530101776123, -1.21216881275177, -1.1069846153259277, -1.0018004179000854, -0.8966161608695984, -0.7914319038391113, -0.686247706413269, -0.5810635089874268, -0.4758792519569397, -0.37069499492645264, -0.26551079750061035, -0.16032657027244568, -0.055142343044281006, 0.05004188418388367, 0.15522611141204834, 0.2604103088378906, 0.3655945658683777, 0.47077882289886475, 0.575963020324707, 0.6811472177505493, 0.7863314747810364, 0.8915157318115234, 0.9966999292373657, 1.101884126663208, 1.2070684432983398, 1.3122526407241821, 1.4174368381500244, 1.5226210355758667, 1.627805233001709, 1.7329895496368408, 1.838173747062683, 1.9433579444885254, 2.0485422611236572, 2.153726577758789, 2.258910655975342, 2.3640949726104736, 2.4692790508270264, 2.574463367462158, 2.679647445678711, 2.7848317623138428, 2.8900160789489746, 2.9952001571655273, 3.100384473800659]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 10.0, 6.0, 19.0, 14.0, 23.0, 15.0, 24.0, 32.0, 35.0, 59.0, 86.0, 95.0, 123.0, 193.0, 301.0, 463.0, 763.0, 1460.0, 2974.0, 6716.0, 16617.0, 42799.0, 109870.0, 238108.0, 304603.0, 189266.0, 80773.0, 30783.0, 11850.0, 4976.0, 2330.0, 1134.0, 711.0, 380.0, 243.0, 158.0, 135.0, 103.0, 55.0, 51.0, 47.0, 42.0, 19.0, 18.0, 14.0, 14.0, 8.0, 12.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.44970703125, -0.4353523254394531, -0.42099761962890625, -0.4066429138183594, -0.3922882080078125, -0.3779335021972656, -0.36357879638671875, -0.3492240905761719, -0.334869384765625, -0.3205146789550781, -0.30615997314453125, -0.2918052673339844, -0.2774505615234375, -0.2630958557128906, -0.24874114990234375, -0.23438644409179688, -0.22003173828125, -0.20567703247070312, -0.19132232666015625, -0.17696762084960938, -0.1626129150390625, -0.14825820922851562, -0.13390350341796875, -0.11954879760742188, -0.105194091796875, -0.09083938598632812, -0.07648468017578125, -0.062129974365234375, -0.0477752685546875, -0.033420562744140625, -0.01906585693359375, -0.004711151123046875, 0.0096435546875, 0.023998260498046875, 0.03835296630859375, 0.052707672119140625, 0.0670623779296875, 0.08141708374023438, 0.09577178955078125, 0.11012649536132812, 0.124481201171875, 0.13883590698242188, 0.15319061279296875, 0.16754531860351562, 0.1819000244140625, 0.19625473022460938, 0.21060943603515625, 0.22496414184570312, 0.23931884765625, 0.2536735534667969, 0.26802825927734375, 0.2823829650878906, 0.2967376708984375, 0.3110923767089844, 0.32544708251953125, 0.3398017883300781, 0.354156494140625, 0.3685111999511719, 0.38286590576171875, 0.3972206115722656, 0.4115753173828125, 0.4259300231933594, 0.44028472900390625, 0.4546394348144531, 0.468994140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 5.0, 10.0, 6.0, 8.0, 16.0, 3.0, 9.0, 15.0, 17.0, 20.0, 19.0, 29.0, 17.0, 41.0, 31.0, 35.0, 40.0, 47.0, 37.0, 32.0, 50.0, 32.0, 49.0, 41.0, 36.0, 44.0, 36.0, 29.0, 30.0, 24.0, 21.0, 14.0, 30.0, 20.0, 18.0, 10.0, 13.0, 17.0, 6.0, 9.0, 8.0, 3.0, 2.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.361328125, -2.2877197265625, -2.214111328125, -2.1405029296875, -2.06689453125, -1.9932861328125, -1.919677734375, -1.8460693359375, -1.7724609375, -1.6988525390625, -1.625244140625, -1.5516357421875, -1.47802734375, -1.4044189453125, -1.330810546875, -1.2572021484375, -1.18359375, -1.1099853515625, -1.036376953125, -0.9627685546875, -0.88916015625, -0.8155517578125, -0.741943359375, -0.6683349609375, -0.5947265625, -0.5211181640625, -0.447509765625, -0.3739013671875, -0.30029296875, -0.2266845703125, -0.153076171875, -0.0794677734375, -0.005859375, 0.0677490234375, 0.141357421875, 0.2149658203125, 0.28857421875, 0.3621826171875, 0.435791015625, 0.5093994140625, 0.5830078125, 0.6566162109375, 0.730224609375, 0.8038330078125, 0.87744140625, 0.9510498046875, 1.024658203125, 1.0982666015625, 1.171875, 1.2454833984375, 1.319091796875, 1.3927001953125, 1.46630859375, 1.5399169921875, 1.613525390625, 1.6871337890625, 1.7607421875, 1.8343505859375, 1.907958984375, 1.9815673828125, 2.05517578125, 2.1287841796875, 2.202392578125, 2.2760009765625, 2.349609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 12.0, 14.0, 19.0, 30.0, 45.0, 68.0, 136.0, 256.0, 559.0, 1138.0, 2446.0, 5295.0, 11647.0, 26148.0, 57326.0, 116569.0, 199526.0, 240414.0, 187603.0, 105442.0, 51068.0, 23271.0, 10484.0, 4809.0, 2128.0, 1081.0, 495.0, 213.0, 117.0, 73.0, 34.0, 27.0, 15.0, 10.0, 7.0, 10.0, 3.0, 4.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0], "bins": [-0.3623046875, -0.35262298583984375, -0.3429412841796875, -0.33325958251953125, -0.323577880859375, -0.31389617919921875, -0.3042144775390625, -0.29453277587890625, -0.28485107421875, -0.27516937255859375, -0.2654876708984375, -0.25580596923828125, -0.246124267578125, -0.23644256591796875, -0.2267608642578125, -0.21707916259765625, -0.2073974609375, -0.19771575927734375, -0.1880340576171875, -0.17835235595703125, -0.168670654296875, -0.15898895263671875, -0.1493072509765625, -0.13962554931640625, -0.12994384765625, -0.12026214599609375, -0.1105804443359375, -0.10089874267578125, -0.091217041015625, -0.08153533935546875, -0.0718536376953125, -0.06217193603515625, -0.052490234375, -0.04280853271484375, -0.0331268310546875, -0.02344512939453125, -0.013763427734375, -0.00408172607421875, 0.0055999755859375, 0.01528167724609375, 0.02496337890625, 0.03464508056640625, 0.0443267822265625, 0.05400848388671875, 0.063690185546875, 0.07337188720703125, 0.0830535888671875, 0.09273529052734375, 0.1024169921875, 0.11209869384765625, 0.1217803955078125, 0.13146209716796875, 0.141143798828125, 0.15082550048828125, 0.1605072021484375, 0.17018890380859375, 0.17987060546875, 0.18955230712890625, 0.1992340087890625, 0.20891571044921875, 0.218597412109375, 0.22827911376953125, 0.2379608154296875, 0.24764251708984375, 0.25732421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 11.0, 9.0, 8.0, 11.0, 10.0, 12.0, 10.0, 16.0, 16.0, 23.0, 31.0, 43.0, 37.0, 38.0, 39.0, 44.0, 46.0, 44.0, 42.0, 46.0, 57.0, 40.0, 41.0, 52.0, 37.0, 42.0, 35.0, 29.0, 24.0, 13.0, 20.0, 15.0, 9.0, 13.0, 10.0, 9.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.36328125, -6.1849365234375, -6.006591796875, -5.8282470703125, -5.64990234375, -5.4715576171875, -5.293212890625, -5.1148681640625, -4.9365234375, -4.7581787109375, -4.579833984375, -4.4014892578125, -4.22314453125, -4.0447998046875, -3.866455078125, -3.6881103515625, -3.509765625, -3.3314208984375, -3.153076171875, -2.9747314453125, -2.79638671875, -2.6180419921875, -2.439697265625, -2.2613525390625, -2.0830078125, -1.9046630859375, -1.726318359375, -1.5479736328125, -1.36962890625, -1.1912841796875, -1.012939453125, -0.8345947265625, -0.65625, -0.4779052734375, -0.299560546875, -0.1212158203125, 0.05712890625, 0.2354736328125, 0.413818359375, 0.5921630859375, 0.7705078125, 0.9488525390625, 1.127197265625, 1.3055419921875, 1.48388671875, 1.6622314453125, 1.840576171875, 2.0189208984375, 2.197265625, 2.3756103515625, 2.553955078125, 2.7322998046875, 2.91064453125, 3.0889892578125, 3.267333984375, 3.4456787109375, 3.6240234375, 3.8023681640625, 3.980712890625, 4.1590576171875, 4.33740234375, 4.5157470703125, 4.694091796875, 4.8724365234375, 5.05078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 11.0, 17.0, 18.0, 25.0, 28.0, 36.0, 50.0, 76.0, 131.0, 171.0, 258.0, 389.0, 577.0, 842.0, 1567.0, 2502.0, 4822.0, 10382.0, 25037.0, 66256.0, 175781.0, 327697.0, 254478.0, 106108.0, 40018.0, 15669.0, 7002.0, 3438.0, 1938.0, 1079.0, 713.0, 461.0, 299.0, 180.0, 145.0, 98.0, 73.0, 46.0, 34.0, 20.0, 19.0, 21.0, 8.0, 6.0, 10.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0439453125, -0.042560577392578125, -0.04117584228515625, -0.039791107177734375, -0.0384063720703125, -0.037021636962890625, -0.03563690185546875, -0.034252166748046875, -0.032867431640625, -0.031482696533203125, -0.03009796142578125, -0.028713226318359375, -0.0273284912109375, -0.025943756103515625, -0.02455902099609375, -0.023174285888671875, -0.02178955078125, -0.020404815673828125, -0.01902008056640625, -0.017635345458984375, -0.0162506103515625, -0.014865875244140625, -0.01348114013671875, -0.012096405029296875, -0.010711669921875, -0.009326934814453125, -0.00794219970703125, -0.006557464599609375, -0.0051727294921875, -0.003787994384765625, -0.00240325927734375, -0.001018524169921875, 0.0003662109375, 0.001750946044921875, 0.00313568115234375, 0.004520416259765625, 0.0059051513671875, 0.007289886474609375, 0.00867462158203125, 0.010059356689453125, 0.011444091796875, 0.012828826904296875, 0.01421356201171875, 0.015598297119140625, 0.0169830322265625, 0.018367767333984375, 0.01975250244140625, 0.021137237548828125, 0.02252197265625, 0.023906707763671875, 0.02529144287109375, 0.026676177978515625, 0.0280609130859375, 0.029445648193359375, 0.03083038330078125, 0.032215118408203125, 0.033599853515625, 0.034984588623046875, 0.03636932373046875, 0.037754058837890625, 0.0391387939453125, 0.040523529052734375, 0.04190826416015625, 0.043292999267578125, 0.044677734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 17.0, 21.0, 20.0, 31.0, 36.0, 58.0, 64.0, 78.0, 98.0, 107.0, 90.0, 108.0, 77.0, 50.0, 38.0, 38.0, 22.0, 8.0, 7.0, 9.0, 7.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.462501525878906e-05, -7.263291627168655e-05, -7.064081728458405e-05, -6.864871829748154e-05, -6.665661931037903e-05, -6.466452032327652e-05, -6.267242133617401e-05, -6.06803223490715e-05, -5.8688223361968994e-05, -5.6696124374866486e-05, -5.470402538776398e-05, -5.271192640066147e-05, -5.071982741355896e-05, -4.872772842645645e-05, -4.673562943935394e-05, -4.4743530452251434e-05, -4.2751431465148926e-05, -4.075933247804642e-05, -3.876723349094391e-05, -3.67751345038414e-05, -3.478303551673889e-05, -3.279093652963638e-05, -3.0798837542533875e-05, -2.8806738555431366e-05, -2.6814639568328857e-05, -2.482254058122635e-05, -2.283044159412384e-05, -2.0838342607021332e-05, -1.8846243619918823e-05, -1.6854144632816315e-05, -1.4862045645713806e-05, -1.2869946658611298e-05, -1.0877847671508789e-05, -8.88574868440628e-06, -6.893649697303772e-06, -4.9015507102012634e-06, -2.909451723098755e-06, -9.173527359962463e-07, 1.0747462511062622e-06, 3.0668452382087708e-06, 5.058944225311279e-06, 7.051043212413788e-06, 9.043142199516296e-06, 1.1035241186618805e-05, 1.3027340173721313e-05, 1.5019439160823822e-05, 1.701153814792633e-05, 1.900363713502884e-05, 2.0995736122131348e-05, 2.2987835109233856e-05, 2.4979934096336365e-05, 2.6972033083438873e-05, 2.8964132070541382e-05, 3.095623105764389e-05, 3.29483300447464e-05, 3.494042903184891e-05, 3.6932528018951416e-05, 3.8924627006053925e-05, 4.091672599315643e-05, 4.290882498025894e-05, 4.490092396736145e-05, 4.689302295446396e-05, 4.888512194156647e-05, 5.0877220928668976e-05, 5.2869319915771484e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 10.0, 22.0, 32.0, 55.0, 74.0, 117.0, 197.0, 382.0, 953.0, 2501.0, 7923.0, 35377.0, 262362.0, 602517.0, 110522.0, 17917.0, 4567.0, 1628.0, 636.0, 302.0, 187.0, 93.0, 54.0, 30.0, 29.0, 14.0, 10.0, 6.0, 5.0, 2.0, 6.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.11566162109375, -0.11279106140136719, -0.10992050170898438, -0.10704994201660156, -0.10417938232421875, -0.10130882263183594, -0.09843826293945312, -0.09556770324707031, -0.0926971435546875, -0.08982658386230469, -0.08695602416992188, -0.08408546447753906, -0.08121490478515625, -0.07834434509277344, -0.07547378540039062, -0.07260322570800781, -0.069732666015625, -0.06686210632324219, -0.06399154663085938, -0.06112098693847656, -0.05825042724609375, -0.05537986755371094, -0.052509307861328125, -0.04963874816894531, -0.0467681884765625, -0.04389762878417969, -0.041027069091796875, -0.03815650939941406, -0.03528594970703125, -0.03241539001464844, -0.029544830322265625, -0.026674270629882812, -0.0238037109375, -0.020933151245117188, -0.018062591552734375, -0.015192031860351562, -0.01232147216796875, -0.009450912475585938, -0.006580352783203125, -0.0037097930908203125, -0.0008392333984375, 0.0020313262939453125, 0.004901885986328125, 0.0077724456787109375, 0.01064300537109375, 0.013513565063476562, 0.016384124755859375, 0.019254684448242188, 0.022125244140625, 0.024995803833007812, 0.027866363525390625, 0.030736923217773438, 0.03360748291015625, 0.03647804260253906, 0.039348602294921875, 0.04221916198730469, 0.0450897216796875, 0.04796028137207031, 0.050830841064453125, 0.05370140075683594, 0.05657196044921875, 0.05944252014160156, 0.062313079833984375, 0.06518363952636719, 0.06805419921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 1.0, 13.0, 9.0, 16.0, 9.0, 26.0, 22.0, 40.0, 44.0, 68.0, 89.0, 104.0, 103.0, 98.0, 83.0, 78.0, 56.0, 51.0, 19.0, 18.0, 17.0, 7.0, 11.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018798828125, -0.018062114715576172, -0.017325401306152344, -0.016588687896728516, -0.015851974487304688, -0.01511526107788086, -0.014378547668457031, -0.013641834259033203, -0.012905120849609375, -0.012168407440185547, -0.011431694030761719, -0.01069498062133789, -0.009958267211914062, -0.009221553802490234, -0.008484840393066406, -0.007748126983642578, -0.00701141357421875, -0.006274700164794922, -0.005537986755371094, -0.004801273345947266, -0.0040645599365234375, -0.0033278465270996094, -0.0025911331176757812, -0.0018544197082519531, -0.001117706298828125, -0.0003809928894042969, 0.00035572052001953125, 0.0010924339294433594, 0.0018291473388671875, 0.0025658607482910156, 0.0033025741577148438, 0.004039287567138672, 0.0047760009765625, 0.005512714385986328, 0.006249427795410156, 0.006986141204833984, 0.0077228546142578125, 0.00845956802368164, 0.009196281433105469, 0.009932994842529297, 0.010669708251953125, 0.011406421661376953, 0.012143135070800781, 0.01287984848022461, 0.013616561889648438, 0.014353275299072266, 0.015089988708496094, 0.015826702117919922, 0.01656341552734375, 0.017300128936767578, 0.018036842346191406, 0.018773555755615234, 0.019510269165039062, 0.02024698257446289, 0.02098369598388672, 0.021720409393310547, 0.022457122802734375, 0.023193836212158203, 0.02393054962158203, 0.02466726303100586, 0.025403976440429688, 0.026140689849853516, 0.026877403259277344, 0.027614116668701172, 0.028350830078125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 11.0, 119.0, 576.0, 286.0, 21.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.401341915130615, -4.598896026611328, -3.796450138092041, -2.994004011154175, -2.1915581226348877, -1.3891119956970215, -0.5866661071777344, 0.21577978134155273, 1.0182256698608398, 1.820671558380127, 2.623117446899414, 3.4255635738372803, 4.228009223937988, 5.030455589294434, 5.832901477813721, 6.635347366333008, 7.437793254852295, 8.240239143371582, 9.042685508728027, 9.845130920410156, 10.647577285766602, 11.450023651123047, 12.252469062805176, 13.054914474487305, 13.85736083984375, 14.659807205200195, 15.462252616882324, 16.264698028564453, 17.0671443939209, 17.869590759277344, 18.67203712463379, 19.474483489990234, 20.27692985534668, 21.079376220703125, 21.88182258605957, 22.684267044067383, 23.486713409423828, 24.289159774780273, 25.09160614013672, 25.89405059814453, 26.696496963500977, 27.498943328857422, 28.301389694213867, 29.10383415222168, 29.906280517578125, 30.70872688293457, 31.511173248291016, 32.31361770629883, 33.116065979003906, 33.91851043701172, 34.7209587097168, 35.52340316772461, 36.32585144042969, 37.1282958984375, 37.93074035644531, 38.73318862915039, 39.5356330871582, 40.338077545166016, 41.140525817871094, 41.942970275878906, 42.745418548583984, 43.5478630065918, 44.35030746459961, 45.15275573730469, 45.9552001953125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 9.0, 12.0, 8.0, 6.0, 17.0, 18.0, 15.0, 29.0, 25.0, 25.0, 40.0, 51.0, 52.0, 54.0, 64.0, 68.0, 43.0, 48.0, 53.0, 57.0, 46.0, 29.0, 44.0, 34.0, 28.0, 26.0, 16.0, 14.0, 15.0, 18.0, 13.0, 3.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.7581582069396973, -3.662524938583374, -3.56689190864563, -3.4712586402893066, -3.3756256103515625, -3.2799923419952393, -3.184359073638916, -3.088726043701172, -2.9930930137634277, -2.8974597454071045, -2.8018267154693604, -2.706193447113037, -2.610560417175293, -2.5149271488189697, -2.4192938804626465, -2.3236608505249023, -2.228027582168579, -2.132394313812256, -2.0367612838745117, -1.9411280155181885, -1.8454949855804443, -1.749861717224121, -1.6542285680770874, -1.5585954189300537, -1.46296226978302, -1.3673291206359863, -1.2716959714889526, -1.176062822341919, -1.0804295539855957, -0.9847964644432068, -0.8891632556915283, -0.7935301065444946, -0.6978969573974609, -0.6022638082504272, -0.5066306591033936, -0.4109974503517151, -0.3153643012046814, -0.2197311520576477, -0.12409794330596924, -0.028464794158935547, 0.06716835498809814, 0.16280151903629303, 0.2584346830844879, 0.354067862033844, 0.4497010111808777, 0.5453341603279114, 0.6409673690795898, 0.7366005182266235, 0.8322336673736572, 0.9278668165206909, 1.0234999656677246, 1.1191332340240479, 1.214766263961792, 1.3103995323181152, 1.406032681465149, 1.5016658306121826, 1.5972989797592163, 1.69293212890625, 1.7885652780532837, 1.8841984272003174, 1.9798316955566406, 2.0754647254943848, 2.171097993850708, 2.2667312622070312, 2.3623642921447754]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 9.0, 26.0, 26.0, 54.0, 59.0, 93.0, 159.0, 242.0, 491.0, 947.0, 2033.0, 4811.0, 12948.0, 35435.0, 94542.0, 281925.0, 398396.0, 135420.0, 50617.0, 18112.0, 6799.0, 2698.0, 1231.0, 602.0, 332.0, 215.0, 117.0, 72.0, 41.0, 34.0, 23.0, 16.0, 8.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.556640625, -2.474639892578125, -2.39263916015625, -2.310638427734375, -2.2286376953125, -2.146636962890625, -2.06463623046875, -1.982635498046875, -1.900634765625, -1.818634033203125, -1.73663330078125, -1.654632568359375, -1.5726318359375, -1.490631103515625, -1.40863037109375, -1.326629638671875, -1.24462890625, -1.162628173828125, -1.08062744140625, -0.998626708984375, -0.9166259765625, -0.834625244140625, -0.75262451171875, -0.670623779296875, -0.588623046875, -0.506622314453125, -0.42462158203125, -0.342620849609375, -0.2606201171875, -0.178619384765625, -0.09661865234375, -0.014617919921875, 0.0673828125, 0.149383544921875, 0.23138427734375, 0.313385009765625, 0.3953857421875, 0.477386474609375, 0.55938720703125, 0.641387939453125, 0.723388671875, 0.805389404296875, 0.88739013671875, 0.969390869140625, 1.0513916015625, 1.133392333984375, 1.21539306640625, 1.297393798828125, 1.37939453125, 1.461395263671875, 1.54339599609375, 1.625396728515625, 1.7073974609375, 1.789398193359375, 1.87139892578125, 1.953399658203125, 2.035400390625, 2.117401123046875, 2.19940185546875, 2.281402587890625, 2.3634033203125, 2.445404052734375, 2.52740478515625, 2.609405517578125, 2.69140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 7.0, 5.0, 14.0, 11.0, 9.0, 13.0, 12.0, 18.0, 14.0, 17.0, 28.0, 31.0, 34.0, 37.0, 43.0, 41.0, 43.0, 45.0, 43.0, 48.0, 29.0, 32.0, 31.0, 35.0, 35.0, 47.0, 33.0, 32.0, 28.0, 27.0, 25.0, 17.0, 16.0, 22.0, 12.0, 6.0, 12.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.140625, -4.0108642578125, -3.881103515625, -3.7513427734375, -3.62158203125, -3.4918212890625, -3.362060546875, -3.2322998046875, -3.1025390625, -2.9727783203125, -2.843017578125, -2.7132568359375, -2.58349609375, -2.4537353515625, -2.323974609375, -2.1942138671875, -2.064453125, -1.9346923828125, -1.804931640625, -1.6751708984375, -1.54541015625, -1.4156494140625, -1.285888671875, -1.1561279296875, -1.0263671875, -0.8966064453125, -0.766845703125, -0.6370849609375, -0.50732421875, -0.3775634765625, -0.247802734375, -0.1180419921875, 0.01171875, 0.1414794921875, 0.271240234375, 0.4010009765625, 0.53076171875, 0.6605224609375, 0.790283203125, 0.9200439453125, 1.0498046875, 1.1795654296875, 1.309326171875, 1.4390869140625, 1.56884765625, 1.6986083984375, 1.828369140625, 1.9581298828125, 2.087890625, 2.2176513671875, 2.347412109375, 2.4771728515625, 2.60693359375, 2.7366943359375, 2.866455078125, 2.9962158203125, 3.1259765625, 3.2557373046875, 3.385498046875, 3.5152587890625, 3.64501953125, 3.7747802734375, 3.904541015625, 4.0343017578125, 4.1640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 3.0, 6.0, 10.0, 10.0, 14.0, 22.0, 28.0, 44.0, 46.0, 60.0, 84.0, 155.0, 294.0, 816.0, 11174.0, 841294.0, 190479.0, 2846.0, 521.0, 217.0, 126.0, 77.0, 46.0, 29.0, 30.0, 26.0, 21.0, 19.0, 12.0, 9.0, 0.0, 6.0, 3.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.43701171875, -9.0849609375, -8.73291015625, -8.380859375, -8.02880859375, -7.6767578125, -7.32470703125, -6.97265625, -6.62060546875, -6.2685546875, -5.91650390625, -5.564453125, -5.21240234375, -4.8603515625, -4.50830078125, -4.15625, -3.80419921875, -3.4521484375, -3.10009765625, -2.748046875, -2.39599609375, -2.0439453125, -1.69189453125, -1.33984375, -0.98779296875, -0.6357421875, -0.28369140625, 0.068359375, 0.42041015625, 0.7724609375, 1.12451171875, 1.4765625, 1.82861328125, 2.1806640625, 2.53271484375, 2.884765625, 3.23681640625, 3.5888671875, 3.94091796875, 4.29296875, 4.64501953125, 4.9970703125, 5.34912109375, 5.701171875, 6.05322265625, 6.4052734375, 6.75732421875, 7.109375, 7.46142578125, 7.8134765625, 8.16552734375, 8.517578125, 8.86962890625, 9.2216796875, 9.57373046875, 9.92578125, 10.27783203125, 10.6298828125, 10.98193359375, 11.333984375, 11.68603515625, 12.0380859375, 12.39013671875, 12.7421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 5.0, 14.0, 4.0, 11.0, 8.0, 21.0, 12.0, 18.0, 25.0, 25.0, 40.0, 23.0, 34.0, 29.0, 32.0, 42.0, 33.0, 35.0, 41.0, 44.0, 38.0, 41.0, 51.0, 44.0, 34.0, 40.0, 28.0, 36.0, 37.0, 20.0, 28.0, 28.0, 13.0, 11.0, 7.0, 9.0, 10.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.92578125, -5.74365234375, -5.5615234375, -5.37939453125, -5.197265625, -5.01513671875, -4.8330078125, -4.65087890625, -4.46875, -4.28662109375, -4.1044921875, -3.92236328125, -3.740234375, -3.55810546875, -3.3759765625, -3.19384765625, -3.01171875, -2.82958984375, -2.6474609375, -2.46533203125, -2.283203125, -2.10107421875, -1.9189453125, -1.73681640625, -1.5546875, -1.37255859375, -1.1904296875, -1.00830078125, -0.826171875, -0.64404296875, -0.4619140625, -0.27978515625, -0.09765625, 0.08447265625, 0.2666015625, 0.44873046875, 0.630859375, 0.81298828125, 0.9951171875, 1.17724609375, 1.359375, 1.54150390625, 1.7236328125, 1.90576171875, 2.087890625, 2.27001953125, 2.4521484375, 2.63427734375, 2.81640625, 2.99853515625, 3.1806640625, 3.36279296875, 3.544921875, 3.72705078125, 3.9091796875, 4.09130859375, 4.2734375, 4.45556640625, 4.6376953125, 4.81982421875, 5.001953125, 5.18408203125, 5.3662109375, 5.54833984375, 5.73046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 10.0, 21.0, 38.0, 61.0, 226.0, 1090.0, 10310.0, 1003156.0, 31320.0, 1797.0, 333.0, 87.0, 31.0, 29.0, 6.0, 12.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8515625, -5.654052734375, -5.45654296875, -5.259033203125, -5.0615234375, -4.864013671875, -4.66650390625, -4.468994140625, -4.271484375, -4.073974609375, -3.87646484375, -3.678955078125, -3.4814453125, -3.283935546875, -3.08642578125, -2.888916015625, -2.69140625, -2.493896484375, -2.29638671875, -2.098876953125, -1.9013671875, -1.703857421875, -1.50634765625, -1.308837890625, -1.111328125, -0.913818359375, -0.71630859375, -0.518798828125, -0.3212890625, -0.123779296875, 0.07373046875, 0.271240234375, 0.46875, 0.666259765625, 0.86376953125, 1.061279296875, 1.2587890625, 1.456298828125, 1.65380859375, 1.851318359375, 2.048828125, 2.246337890625, 2.44384765625, 2.641357421875, 2.8388671875, 3.036376953125, 3.23388671875, 3.431396484375, 3.62890625, 3.826416015625, 4.02392578125, 4.221435546875, 4.4189453125, 4.616455078125, 4.81396484375, 5.011474609375, 5.208984375, 5.406494140625, 5.60400390625, 5.801513671875, 5.9990234375, 6.196533203125, 6.39404296875, 6.591552734375, 6.7890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 7.0, 19.0, 19.0, 44.0, 79.0, 135.0, 240.0, 211.0, 117.0, 60.0, 39.0, 12.0, 10.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005593299865722656, -0.0005432441830635071, -0.0005271583795547485, -0.00051107257604599, -0.0004949867725372314, -0.0004789009690284729, -0.00046281516551971436, -0.0004467293620109558, -0.00043064355850219727, -0.0004145577549934387, -0.0003984719514846802, -0.00038238614797592163, -0.0003663003444671631, -0.00035021454095840454, -0.000334128737449646, -0.00031804293394088745, -0.0003019571304321289, -0.00028587132692337036, -0.0002697855234146118, -0.00025369971990585327, -0.00023761391639709473, -0.00022152811288833618, -0.00020544230937957764, -0.0001893565058708191, -0.00017327070236206055, -0.000157184898853302, -0.00014109909534454346, -0.0001250132918357849, -0.00010892748832702637, -9.284168481826782e-05, -7.675588130950928e-05, -6.067007780075073e-05, -4.458427429199219e-05, -2.8498470783233643e-05, -1.2412667274475098e-05, 3.6731362342834473e-06, 1.9758939743041992e-05, 3.584474325180054e-05, 5.193054676055908e-05, 6.801635026931763e-05, 8.410215377807617e-05, 0.00010018795728683472, 0.00011627376079559326, 0.0001323595643043518, 0.00014844536781311035, 0.0001645311713218689, 0.00018061697483062744, 0.00019670277833938599, 0.00021278858184814453, 0.00022887438535690308, 0.0002449601888656616, 0.00026104599237442017, 0.0002771317958831787, 0.00029321759939193726, 0.0003093034029006958, 0.00032538920640945435, 0.0003414750099182129, 0.00035756081342697144, 0.00037364661693573, 0.0003897324204444885, 0.00040581822395324707, 0.0004219040274620056, 0.00043798983097076416, 0.0004540756344795227, 0.00047016143798828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 22.0, 29.0, 34.0, 120.0, 355.0, 1158.0, 6912.0, 870260.0, 164746.0, 3772.0, 733.0, 226.0, 88.0, 38.0, 21.0, 11.0, 0.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.45916748046875, -7.2620849609375, -7.06500244140625, -6.867919921875, -6.67083740234375, -6.4737548828125, -6.27667236328125, -6.07958984375, -5.88250732421875, -5.6854248046875, -5.48834228515625, -5.291259765625, -5.09417724609375, -4.8970947265625, -4.70001220703125, -4.5029296875, -4.30584716796875, -4.1087646484375, -3.91168212890625, -3.714599609375, -3.51751708984375, -3.3204345703125, -3.12335205078125, -2.92626953125, -2.72918701171875, -2.5321044921875, -2.33502197265625, -2.137939453125, -1.94085693359375, -1.7437744140625, -1.54669189453125, -1.349609375, -1.15252685546875, -0.9554443359375, -0.75836181640625, -0.561279296875, -0.36419677734375, -0.1671142578125, 0.02996826171875, 0.22705078125, 0.42413330078125, 0.6212158203125, 0.81829833984375, 1.015380859375, 1.21246337890625, 1.4095458984375, 1.60662841796875, 1.8037109375, 2.00079345703125, 2.1978759765625, 2.39495849609375, 2.592041015625, 2.78912353515625, 2.9862060546875, 3.18328857421875, 3.38037109375, 3.57745361328125, 3.7745361328125, 3.97161865234375, 4.168701171875, 4.36578369140625, 4.5628662109375, 4.75994873046875, 4.95703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 7.0, 14.0, 17.0, 35.0, 47.0, 50.0, 68.0, 113.0, 187.0, 142.0, 88.0, 65.0, 58.0, 32.0, 30.0, 15.0, 12.0, 4.0, 3.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.87060546875, -0.84149169921875, -0.8123779296875, -0.78326416015625, -0.754150390625, -0.72503662109375, -0.6959228515625, -0.66680908203125, -0.6376953125, -0.60858154296875, -0.5794677734375, -0.55035400390625, -0.521240234375, -0.49212646484375, -0.4630126953125, -0.43389892578125, -0.40478515625, -0.37567138671875, -0.3465576171875, -0.31744384765625, -0.288330078125, -0.25921630859375, -0.2301025390625, -0.20098876953125, -0.171875, -0.14276123046875, -0.1136474609375, -0.08453369140625, -0.055419921875, -0.02630615234375, 0.0028076171875, 0.03192138671875, 0.06103515625, 0.09014892578125, 0.1192626953125, 0.14837646484375, 0.177490234375, 0.20660400390625, 0.2357177734375, 0.26483154296875, 0.2939453125, 0.32305908203125, 0.3521728515625, 0.38128662109375, 0.410400390625, 0.43951416015625, 0.4686279296875, 0.49774169921875, 0.52685546875, 0.55596923828125, 0.5850830078125, 0.61419677734375, 0.643310546875, 0.67242431640625, 0.7015380859375, 0.73065185546875, 0.759765625, 0.78887939453125, 0.8179931640625, 0.84710693359375, 0.876220703125, 0.90533447265625, 0.9344482421875, 0.96356201171875, 0.99267578125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 9.0, 4.0, 14.0, 42.0, 65.0, 142.0, 189.0, 206.0, 147.0, 105.0, 45.0, 27.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.501060485839844, -16.01848602294922, -15.53591251373291, -15.053339004516602, -14.570765495300293, -14.088191986083984, -13.60561752319336, -13.12304401397705, -12.640470504760742, -12.157896995544434, -11.675322532653809, -11.1927490234375, -10.710175514221191, -10.227602005004883, -9.745027542114258, -9.26245403289795, -8.779879570007324, -8.297306060791016, -7.814732074737549, -7.332158088684082, -6.849584579467773, -6.367010593414307, -5.88443660736084, -5.401863098144531, -4.9192891120910645, -4.436715126037598, -3.954141616821289, -3.4715676307678223, -2.9889938831329346, -2.506420135498047, -2.02384614944458, -1.5412724018096924, -1.058699607849121, -0.5761258006095886, -0.09355199337005615, 0.3890218734741211, 0.8715956211090088, 1.3541693687438965, 1.8367433547973633, 2.319317102432251, 2.8018908500671387, 3.2844645977020264, 3.767038345336914, 4.249612331390381, 4.732186317443848, 5.214759826660156, 5.697333812713623, 6.17990779876709, 6.662481307983398, 7.145055294036865, 7.627628803253174, 8.11020278930664, 8.59277629852295, 9.075349807739258, 9.557924270629883, 10.040497779846191, 10.5230712890625, 11.005644798278809, 11.488219261169434, 11.970792770385742, 12.45336627960205, 12.93593978881836, 13.418514251708984, 13.901087760925293, 14.383662223815918]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 6.0, 6.0, 5.0, 8.0, 12.0, 10.0, 14.0, 18.0, 15.0, 19.0, 14.0, 25.0, 22.0, 29.0, 25.0, 26.0, 30.0, 37.0, 31.0, 38.0, 33.0, 49.0, 39.0, 47.0, 42.0, 35.0, 30.0, 32.0, 31.0, 35.0, 27.0, 33.0, 26.0, 18.0, 18.0, 14.0, 21.0, 18.0, 5.0, 15.0, 8.0, 13.0, 5.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.106329917907715, -7.848696708679199, -7.591063499450684, -7.333430290222168, -7.075797080993652, -6.818163871765137, -6.560531139373779, -6.302897930145264, -6.045264720916748, -5.787631511688232, -5.529998302459717, -5.272365093231201, -5.014732360839844, -4.757099151611328, -4.4994659423828125, -4.241832733154297, -3.9841995239257812, -3.7265663146972656, -3.46893310546875, -3.2113001346588135, -2.953666925430298, -2.6960337162017822, -2.4384007453918457, -2.18076753616333, -1.9231343269348145, -1.6655011177062988, -1.4078680276870728, -1.1502349376678467, -0.892601728439331, -0.6349685192108154, -0.37733542919158936, -0.11970233917236328, 0.13793182373046875, 0.3955649733543396, 0.6531981229782104, 0.9108312726020813, 1.1684644222259521, 1.4260976314544678, 1.6837307214736938, 1.94136381149292, 2.1989970207214355, 2.456630229949951, 2.714263439178467, 2.9718964099884033, 3.229529619216919, 3.4871628284454346, 3.744795799255371, 4.002429008483887, 4.260062217712402, 4.517695426940918, 4.775328636169434, 5.032961845397949, 5.290595054626465, 5.5482282638549805, 5.805860996246338, 6.0634942054748535, 6.321127414703369, 6.578760623931885, 6.8363938331604, 7.094027042388916, 7.351659774780273, 7.609292984008789, 7.866926193237305, 8.12455940246582, 8.382192611694336]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 13.0, 16.0, 23.0, 37.0, 47.0, 69.0, 86.0, 187.0, 277.0, 596.0, 2124.0, 13980.0, 215050.0, 2752885.0, 1142407.0, 57921.0, 5941.0, 1300.0, 523.0, 265.0, 187.0, 104.0, 86.0, 47.0, 44.0, 14.0, 13.0, 8.0, 9.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6875, -6.462890625, -6.23828125, -6.013671875, -5.7890625, -5.564453125, -5.33984375, -5.115234375, -4.890625, -4.666015625, -4.44140625, -4.216796875, -3.9921875, -3.767578125, -3.54296875, -3.318359375, -3.09375, -2.869140625, -2.64453125, -2.419921875, -2.1953125, -1.970703125, -1.74609375, -1.521484375, -1.296875, -1.072265625, -0.84765625, -0.623046875, -0.3984375, -0.173828125, 0.05078125, 0.275390625, 0.5, 0.724609375, 0.94921875, 1.173828125, 1.3984375, 1.623046875, 1.84765625, 2.072265625, 2.296875, 2.521484375, 2.74609375, 2.970703125, 3.1953125, 3.419921875, 3.64453125, 3.869140625, 4.09375, 4.318359375, 4.54296875, 4.767578125, 4.9921875, 5.216796875, 5.44140625, 5.666015625, 5.890625, 6.115234375, 6.33984375, 6.564453125, 6.7890625, 7.013671875, 7.23828125, 7.462890625, 7.6875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 8.0, 4.0, 10.0, 12.0, 12.0, 7.0, 12.0, 12.0, 23.0, 16.0, 22.0, 23.0, 28.0, 27.0, 29.0, 42.0, 43.0, 39.0, 35.0, 44.0, 52.0, 44.0, 37.0, 45.0, 37.0, 32.0, 30.0, 36.0, 25.0, 34.0, 31.0, 21.0, 16.0, 23.0, 12.0, 23.0, 12.0, 9.0, 5.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.591796875, -2.50201416015625, -2.4122314453125, -2.32244873046875, -2.232666015625, -2.14288330078125, -2.0531005859375, -1.96331787109375, -1.87353515625, -1.78375244140625, -1.6939697265625, -1.60418701171875, -1.514404296875, -1.42462158203125, -1.3348388671875, -1.24505615234375, -1.1552734375, -1.06549072265625, -0.9757080078125, -0.88592529296875, -0.796142578125, -0.70635986328125, -0.6165771484375, -0.52679443359375, -0.43701171875, -0.34722900390625, -0.2574462890625, -0.16766357421875, -0.077880859375, 0.01190185546875, 0.1016845703125, 0.19146728515625, 0.28125, 0.37103271484375, 0.4608154296875, 0.55059814453125, 0.640380859375, 0.73016357421875, 0.8199462890625, 0.90972900390625, 0.99951171875, 1.08929443359375, 1.1790771484375, 1.26885986328125, 1.358642578125, 1.44842529296875, 1.5382080078125, 1.62799072265625, 1.7177734375, 1.80755615234375, 1.8973388671875, 1.98712158203125, 2.076904296875, 2.16668701171875, 2.2564697265625, 2.34625244140625, 2.43603515625, 2.52581787109375, 2.6156005859375, 2.70538330078125, 2.795166015625, 2.88494873046875, 2.9747314453125, 3.06451416015625, 3.154296875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 7.0, 8.0, 11.0, 26.0, 33.0, 48.0, 78.0, 157.0, 326.0, 948.0, 3416.0, 41657.0, 3771655.0, 364936.0, 8433.0, 1558.0, 502.0, 215.0, 110.0, 64.0, 34.0, 24.0, 11.0, 4.0, 4.0, 3.0, 9.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-12.65625, -12.302001953125, -11.94775390625, -11.593505859375, -11.2392578125, -10.885009765625, -10.53076171875, -10.176513671875, -9.822265625, -9.468017578125, -9.11376953125, -8.759521484375, -8.4052734375, -8.051025390625, -7.69677734375, -7.342529296875, -6.98828125, -6.634033203125, -6.27978515625, -5.925537109375, -5.5712890625, -5.217041015625, -4.86279296875, -4.508544921875, -4.154296875, -3.800048828125, -3.44580078125, -3.091552734375, -2.7373046875, -2.383056640625, -2.02880859375, -1.674560546875, -1.3203125, -0.966064453125, -0.61181640625, -0.257568359375, 0.0966796875, 0.450927734375, 0.80517578125, 1.159423828125, 1.513671875, 1.867919921875, 2.22216796875, 2.576416015625, 2.9306640625, 3.284912109375, 3.63916015625, 3.993408203125, 4.34765625, 4.701904296875, 5.05615234375, 5.410400390625, 5.7646484375, 6.118896484375, 6.47314453125, 6.827392578125, 7.181640625, 7.535888671875, 7.89013671875, 8.244384765625, 8.5986328125, 8.952880859375, 9.30712890625, 9.661376953125, 10.015625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 13.0, 14.0, 16.0, 31.0, 48.0, 71.0, 105.0, 173.0, 259.0, 391.0, 569.0, 592.0, 537.0, 433.0, 311.0, 182.0, 97.0, 61.0, 53.0, 31.0, 26.0, 15.0, 11.0, 11.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6611328125, -1.6068267822265625, -1.552520751953125, -1.4982147216796875, -1.44390869140625, -1.3896026611328125, -1.335296630859375, -1.2809906005859375, -1.2266845703125, -1.1723785400390625, -1.118072509765625, -1.0637664794921875, -1.00946044921875, -0.9551544189453125, -0.900848388671875, -0.8465423583984375, -0.792236328125, -0.7379302978515625, -0.683624267578125, -0.6293182373046875, -0.57501220703125, -0.5207061767578125, -0.466400146484375, -0.4120941162109375, -0.3577880859375, -0.3034820556640625, -0.249176025390625, -0.1948699951171875, -0.14056396484375, -0.0862579345703125, -0.031951904296875, 0.0223541259765625, 0.07666015625, 0.1309661865234375, 0.185272216796875, 0.2395782470703125, 0.29388427734375, 0.3481903076171875, 0.402496337890625, 0.4568023681640625, 0.5111083984375, 0.5654144287109375, 0.619720458984375, 0.6740264892578125, 0.72833251953125, 0.7826385498046875, 0.836944580078125, 0.8912506103515625, 0.945556640625, 0.9998626708984375, 1.054168701171875, 1.1084747314453125, 1.16278076171875, 1.2170867919921875, 1.271392822265625, 1.3256988525390625, 1.3800048828125, 1.4343109130859375, 1.488616943359375, 1.5429229736328125, 1.59722900390625, 1.6515350341796875, 1.705841064453125, 1.7601470947265625, 1.814453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 10.0, 25.0, 36.0, 54.0, 110.0, 162.0, 200.0, 159.0, 133.0, 74.0, 32.0, 11.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.191085815429688, -9.819502830505371, -9.447918891906738, -9.076335906982422, -8.704751968383789, -8.333168983459473, -7.96158504486084, -7.590002059936523, -7.218418121337891, -6.846834659576416, -6.475251197814941, -6.103667736053467, -5.732084274291992, -5.360500812530518, -4.988917350769043, -4.617334365844727, -4.245750904083252, -3.8741674423217773, -3.5025839805603027, -3.131000518798828, -2.7594170570373535, -2.387833595275879, -2.0162503719329834, -1.6446669101715088, -1.2730834484100342, -0.9014999866485596, -0.5299165844917297, -0.1583331823348999, 0.2132502794265747, 0.5848337411880493, 0.9564170837402344, 1.328000545501709, 1.6995840072631836, 2.071167469024658, 2.442750930786133, 2.8143343925476074, 3.185917854309082, 3.5575013160705566, 3.929084539413452, 4.300667762756348, 4.6722517013549805, 5.043835163116455, 5.41541862487793, 5.787002086639404, 6.158585548400879, 6.5301690101623535, 6.901752471923828, 7.2733354568481445, 7.644918918609619, 8.016502380371094, 8.38808536529541, 8.759669303894043, 9.13125228881836, 9.502836227416992, 9.874419212341309, 10.246003150939941, 10.617586135864258, 10.989169120788574, 11.360753059387207, 11.732336044311523, 12.103919982910156, 12.475502967834473, 12.847086906433105, 13.218669891357422, 13.590253829956055]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 5.0, 7.0, 13.0, 13.0, 17.0, 14.0, 16.0, 24.0, 18.0, 26.0, 30.0, 27.0, 34.0, 42.0, 41.0, 34.0, 41.0, 39.0, 38.0, 52.0, 34.0, 34.0, 46.0, 33.0, 48.0, 25.0, 48.0, 30.0, 31.0, 35.0, 19.0, 11.0, 16.0, 20.0, 7.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.853839635848999, -3.7448890209198, -3.6359384059906006, -3.5269877910614014, -3.4180374145507812, -3.309086799621582, -3.200136184692383, -3.0911855697631836, -2.9822349548339844, -2.873284339904785, -2.764333724975586, -2.6553831100463867, -2.5464324951171875, -2.4374818801879883, -2.328531503677368, -2.219580888748169, -2.1106302738189697, -2.0016796588897705, -1.8927290439605713, -1.7837785482406616, -1.6748279333114624, -1.5658773183822632, -1.4569268226623535, -1.3479762077331543, -1.239025592803955, -1.1300749778747559, -1.0211243629455566, -0.912173867225647, -0.8032232522964478, -0.6942726373672485, -0.5853220820426941, -0.47637152671813965, -0.36742115020751953, -0.2584705650806427, -0.14951997995376587, -0.04056939482688904, 0.06838119029998779, 0.177331805229187, 0.28628236055374146, 0.3952329158782959, 0.5041835308074951, 0.6131341457366943, 0.7220847010612488, 0.8310352563858032, 0.9399858713150024, 1.0489364862442017, 1.1578869819641113, 1.2668375968933105, 1.3757882118225098, 1.484738826751709, 1.5936894416809082, 1.7026399374008179, 1.811590552330017, 1.9205411672592163, 2.029491662979126, 2.138442277908325, 2.2473928928375244, 2.3563435077667236, 2.465294122695923, 2.574244737625122, 2.683195114135742, 2.7921457290649414, 2.9010963439941406, 3.01004695892334, 3.118997573852539]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 9.0, 15.0, 29.0, 42.0, 66.0, 81.0, 145.0, 280.0, 559.0, 1260.0, 3427.0, 10854.0, 50673.0, 302321.0, 521544.0, 125601.0, 21963.0, 5837.0, 2044.0, 822.0, 422.0, 215.0, 118.0, 77.0, 46.0, 31.0, 20.0, 19.0, 8.0, 9.0, 6.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.03515625, -1.0087814331054688, -0.9824066162109375, -0.9560317993164062, -0.929656982421875, -0.9032821655273438, -0.8769073486328125, -0.8505325317382812, -0.82415771484375, -0.7977828979492188, -0.7714080810546875, -0.7450332641601562, -0.718658447265625, -0.6922836303710938, -0.6659088134765625, -0.6395339965820312, -0.6131591796875, -0.5867843627929688, -0.5604095458984375, -0.5340347290039062, -0.507659912109375, -0.48128509521484375, -0.4549102783203125, -0.42853546142578125, -0.40216064453125, -0.37578582763671875, -0.3494110107421875, -0.32303619384765625, -0.296661376953125, -0.27028656005859375, -0.2439117431640625, -0.21753692626953125, -0.191162109375, -0.16478729248046875, -0.1384124755859375, -0.11203765869140625, -0.085662841796875, -0.05928802490234375, -0.0329132080078125, -0.00653839111328125, 0.01983642578125, 0.04621124267578125, 0.0725860595703125, 0.09896087646484375, 0.125335693359375, 0.15171051025390625, 0.1780853271484375, 0.20446014404296875, 0.2308349609375, 0.25720977783203125, 0.2835845947265625, 0.30995941162109375, 0.336334228515625, 0.36270904541015625, 0.3890838623046875, 0.41545867919921875, 0.44183349609375, 0.46820831298828125, 0.4945831298828125, 0.5209579467773438, 0.547332763671875, 0.5737075805664062, 0.6000823974609375, 0.6264572143554688, 0.65283203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 6.0, 15.0, 17.0, 18.0, 18.0, 24.0, 41.0, 38.0, 56.0, 59.0, 52.0, 55.0, 40.0, 55.0, 65.0, 49.0, 65.0, 60.0, 47.0, 48.0, 46.0, 28.0, 21.0, 28.0, 13.0, 10.0, 8.0, 13.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.29296875, -4.192626953125, -4.09228515625, -3.991943359375, -3.8916015625, -3.791259765625, -3.69091796875, -3.590576171875, -3.490234375, -3.389892578125, -3.28955078125, -3.189208984375, -3.0888671875, -2.988525390625, -2.88818359375, -2.787841796875, -2.6875, -2.587158203125, -2.48681640625, -2.386474609375, -2.2861328125, -2.185791015625, -2.08544921875, -1.985107421875, -1.884765625, -1.784423828125, -1.68408203125, -1.583740234375, -1.4833984375, -1.383056640625, -1.28271484375, -1.182373046875, -1.08203125, -0.981689453125, -0.88134765625, -0.781005859375, -0.6806640625, -0.580322265625, -0.47998046875, -0.379638671875, -0.279296875, -0.178955078125, -0.07861328125, 0.021728515625, 0.1220703125, 0.222412109375, 0.32275390625, 0.423095703125, 0.5234375, 0.623779296875, 0.72412109375, 0.824462890625, 0.9248046875, 1.025146484375, 1.12548828125, 1.225830078125, 1.326171875, 1.426513671875, 1.52685546875, 1.627197265625, 1.7275390625, 1.827880859375, 1.92822265625, 2.028564453125, 2.12890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 14.0, 12.0, 21.0, 29.0, 43.0, 70.0, 142.0, 345.0, 756.0, 2001.0, 5080.0, 13355.0, 35411.0, 91939.0, 208541.0, 309473.0, 219994.0, 99493.0, 38387.0, 14308.0, 5339.0, 2132.0, 829.0, 386.0, 188.0, 85.0, 63.0, 39.0, 22.0, 14.0, 10.0, 4.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.35595703125, -0.34534454345703125, -0.3347320556640625, -0.32411956787109375, -0.313507080078125, -0.30289459228515625, -0.2922821044921875, -0.28166961669921875, -0.27105712890625, -0.26044464111328125, -0.2498321533203125, -0.23921966552734375, -0.228607177734375, -0.21799468994140625, -0.2073822021484375, -0.19676971435546875, -0.1861572265625, -0.17554473876953125, -0.1649322509765625, -0.15431976318359375, -0.143707275390625, -0.13309478759765625, -0.1224822998046875, -0.11186981201171875, -0.10125732421875, -0.09064483642578125, -0.0800323486328125, -0.06941986083984375, -0.058807373046875, -0.04819488525390625, -0.0375823974609375, -0.02696990966796875, -0.016357421875, -0.00574493408203125, 0.0048675537109375, 0.01548004150390625, 0.026092529296875, 0.03670501708984375, 0.0473175048828125, 0.05792999267578125, 0.06854248046875, 0.07915496826171875, 0.0897674560546875, 0.10037994384765625, 0.110992431640625, 0.12160491943359375, 0.1322174072265625, 0.14282989501953125, 0.1534423828125, 0.16405487060546875, 0.1746673583984375, 0.18527984619140625, 0.195892333984375, 0.20650482177734375, 0.2171173095703125, 0.22772979736328125, 0.23834228515625, 0.24895477294921875, 0.2595672607421875, 0.27017974853515625, 0.280792236328125, 0.29140472412109375, 0.3020172119140625, 0.31262969970703125, 0.3232421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 14.0, 14.0, 9.0, 23.0, 14.0, 22.0, 23.0, 27.0, 41.0, 47.0, 38.0, 47.0, 49.0, 47.0, 55.0, 45.0, 59.0, 59.0, 66.0, 61.0, 29.0, 40.0, 26.0, 35.0, 22.0, 22.0, 12.0, 15.0, 9.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39453125, -5.2103271484375, -5.026123046875, -4.8419189453125, -4.65771484375, -4.4735107421875, -4.289306640625, -4.1051025390625, -3.9208984375, -3.7366943359375, -3.552490234375, -3.3682861328125, -3.18408203125, -2.9998779296875, -2.815673828125, -2.6314697265625, -2.447265625, -2.2630615234375, -2.078857421875, -1.8946533203125, -1.71044921875, -1.5262451171875, -1.342041015625, -1.1578369140625, -0.9736328125, -0.7894287109375, -0.605224609375, -0.4210205078125, -0.23681640625, -0.0526123046875, 0.131591796875, 0.3157958984375, 0.5, 0.6842041015625, 0.868408203125, 1.0526123046875, 1.23681640625, 1.4210205078125, 1.605224609375, 1.7894287109375, 1.9736328125, 2.1578369140625, 2.342041015625, 2.5262451171875, 2.71044921875, 2.8946533203125, 3.078857421875, 3.2630615234375, 3.447265625, 3.6314697265625, 3.815673828125, 3.9998779296875, 4.18408203125, 4.3682861328125, 4.552490234375, 4.7366943359375, 4.9208984375, 5.1051025390625, 5.289306640625, 5.4735107421875, 5.65771484375, 5.8419189453125, 6.026123046875, 6.2103271484375, 6.39453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 7.0, 10.0, 17.0, 40.0, 40.0, 69.0, 91.0, 144.0, 250.0, 473.0, 834.0, 1477.0, 3041.0, 6798.0, 17031.0, 54184.0, 205972.0, 457702.0, 213646.0, 56258.0, 17294.0, 6723.0, 2935.0, 1549.0, 821.0, 427.0, 270.0, 158.0, 109.0, 51.0, 44.0, 25.0, 24.0, 11.0, 7.0, 7.0, 1.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.056365966796875, -0.05457735061645508, -0.052788734436035156, -0.051000118255615234, -0.04921150207519531, -0.04742288589477539, -0.04563426971435547, -0.04384565353393555, -0.042057037353515625, -0.0402684211730957, -0.03847980499267578, -0.03669118881225586, -0.03490257263183594, -0.033113956451416016, -0.031325340270996094, -0.029536724090576172, -0.02774810791015625, -0.025959491729736328, -0.024170875549316406, -0.022382259368896484, -0.020593643188476562, -0.01880502700805664, -0.01701641082763672, -0.015227794647216797, -0.013439178466796875, -0.011650562286376953, -0.009861946105957031, -0.00807332992553711, -0.0062847137451171875, -0.004496097564697266, -0.0027074813842773438, -0.0009188652038574219, 0.0008697509765625, 0.002658367156982422, 0.004446983337402344, 0.006235599517822266, 0.008024215698242188, 0.00981283187866211, 0.011601448059082031, 0.013390064239501953, 0.015178680419921875, 0.016967296600341797, 0.01875591278076172, 0.02054452896118164, 0.022333145141601562, 0.024121761322021484, 0.025910377502441406, 0.027698993682861328, 0.02948760986328125, 0.03127622604370117, 0.033064842224121094, 0.034853458404541016, 0.03664207458496094, 0.03843069076538086, 0.04021930694580078, 0.0420079231262207, 0.043796539306640625, 0.04558515548706055, 0.04737377166748047, 0.04916238784790039, 0.05095100402832031, 0.052739620208740234, 0.054528236389160156, 0.05631685256958008, 0.05810546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 9.0, 9.0, 13.0, 23.0, 23.0, 38.0, 44.0, 56.0, 67.0, 69.0, 94.0, 91.0, 79.0, 81.0, 76.0, 48.0, 43.0, 26.0, 30.0, 24.0, 14.0, 12.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.820657730102539e-05, -3.677047789096832e-05, -3.5334378480911255e-05, -3.389827907085419e-05, -3.246217966079712e-05, -3.102608025074005e-05, -2.9589980840682983e-05, -2.8153881430625916e-05, -2.6717782020568848e-05, -2.528168261051178e-05, -2.3845583200454712e-05, -2.2409483790397644e-05, -2.0973384380340576e-05, -1.9537284970283508e-05, -1.810118556022644e-05, -1.6665086150169373e-05, -1.5228986740112305e-05, -1.3792887330055237e-05, -1.2356787919998169e-05, -1.0920688509941101e-05, -9.484589099884033e-06, -8.048489689826965e-06, -6.6123902797698975e-06, -5.17629086971283e-06, -3.7401914596557617e-06, -2.304092049598694e-06, -8.67992639541626e-07, 5.681067705154419e-07, 2.0042061805725098e-06, 3.4403055906295776e-06, 4.8764050006866455e-06, 6.312504410743713e-06, 7.748603820800781e-06, 9.184703230857849e-06, 1.0620802640914917e-05, 1.2056902050971985e-05, 1.3493001461029053e-05, 1.492910087108612e-05, 1.636520028114319e-05, 1.7801299691200256e-05, 1.9237399101257324e-05, 2.0673498511314392e-05, 2.210959792137146e-05, 2.3545697331428528e-05, 2.4981796741485596e-05, 2.6417896151542664e-05, 2.785399556159973e-05, 2.92900949716568e-05, 3.072619438171387e-05, 3.2162293791770935e-05, 3.3598393201828e-05, 3.503449261188507e-05, 3.647059202194214e-05, 3.7906691431999207e-05, 3.9342790842056274e-05, 4.077889025211334e-05, 4.221498966217041e-05, 4.365108907222748e-05, 4.5087188482284546e-05, 4.6523287892341614e-05, 4.795938730239868e-05, 4.939548671245575e-05, 5.083158612251282e-05, 5.2267685532569885e-05, 5.370378494262695e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 8.0, 9.0, 9.0, 14.0, 23.0, 53.0, 47.0, 90.0, 141.0, 240.0, 453.0, 855.0, 1724.0, 3489.0, 8268.0, 22613.0, 83169.0, 405861.0, 401883.0, 81638.0, 22412.0, 8216.0, 3608.0, 1752.0, 792.0, 456.0, 276.0, 163.0, 95.0, 41.0, 44.0, 33.0, 22.0, 12.0, 11.0, 6.0, 8.0, 5.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07086181640625, -0.06871414184570312, -0.06656646728515625, -0.06441879272460938, -0.0622711181640625, -0.060123443603515625, -0.05797576904296875, -0.055828094482421875, -0.053680419921875, -0.051532745361328125, -0.04938507080078125, -0.047237396240234375, -0.0450897216796875, -0.042942047119140625, -0.04079437255859375, -0.038646697998046875, -0.0364990234375, -0.034351348876953125, -0.03220367431640625, -0.030055999755859375, -0.0279083251953125, -0.025760650634765625, -0.02361297607421875, -0.021465301513671875, -0.019317626953125, -0.017169952392578125, -0.01502227783203125, -0.012874603271484375, -0.0107269287109375, -0.008579254150390625, -0.00643157958984375, -0.004283905029296875, -0.00213623046875, 1.1444091796875e-05, 0.00215911865234375, 0.004306793212890625, 0.0064544677734375, 0.008602142333984375, 0.01074981689453125, 0.012897491455078125, 0.015045166015625, 0.017192840576171875, 0.01934051513671875, 0.021488189697265625, 0.0236358642578125, 0.025783538818359375, 0.02793121337890625, 0.030078887939453125, 0.0322265625, 0.034374237060546875, 0.03652191162109375, 0.038669586181640625, 0.0408172607421875, 0.042964935302734375, 0.04511260986328125, 0.047260284423828125, 0.049407958984375, 0.051555633544921875, 0.05370330810546875, 0.055850982666015625, 0.0579986572265625, 0.060146331787109375, 0.06229400634765625, 0.06444168090820312, 0.06658935546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 10.0, 6.0, 7.0, 15.0, 7.0, 16.0, 18.0, 27.0, 23.0, 40.0, 53.0, 65.0, 59.0, 87.0, 76.0, 91.0, 72.0, 64.0, 64.0, 42.0, 38.0, 22.0, 18.0, 10.0, 17.0, 7.0, 7.0, 5.0, 7.0, 4.0, 4.0, 1.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0194091796875, -0.01887190341949463, -0.018334627151489258, -0.017797350883483887, -0.017260074615478516, -0.016722798347473145, -0.016185522079467773, -0.015648245811462402, -0.015110969543457031, -0.01457369327545166, -0.014036417007446289, -0.013499140739440918, -0.012961864471435547, -0.012424588203430176, -0.011887311935424805, -0.011350035667419434, -0.010812759399414062, -0.010275483131408691, -0.00973820686340332, -0.00920093059539795, -0.008663654327392578, -0.008126378059387207, -0.007589101791381836, -0.007051825523376465, -0.006514549255371094, -0.005977272987365723, -0.0054399967193603516, -0.0049027204513549805, -0.004365444183349609, -0.0038281679153442383, -0.003290891647338867, -0.002753615379333496, -0.002216339111328125, -0.001679062843322754, -0.0011417865753173828, -0.0006045103073120117, -6.723403930664062e-05, 0.00047004222869873047, 0.0010073184967041016, 0.0015445947647094727, 0.0020818710327148438, 0.002619147300720215, 0.003156423568725586, 0.003693699836730957, 0.004230976104736328, 0.004768252372741699, 0.00530552864074707, 0.005842804908752441, 0.0063800811767578125, 0.006917357444763184, 0.007454633712768555, 0.007991909980773926, 0.008529186248779297, 0.009066462516784668, 0.009603738784790039, 0.01014101505279541, 0.010678291320800781, 0.011215567588806152, 0.011752843856811523, 0.012290120124816895, 0.012827396392822266, 0.013364672660827637, 0.013901948928833008, 0.014439225196838379, 0.01497650146484375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 9.0, 39.0, 175.0, 417.0, 297.0, 67.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.210787296295166, -6.719435214996338, -6.228082656860352, -5.736730575561523, -5.245378494262695, -4.754026412963867, -4.262673854827881, -3.7713217735290527, -3.2799694538116455, -2.7886171340942383, -2.29726505279541, -1.805912733078003, -1.3145605325698853, -0.8232083320617676, -0.33185601234436035, 0.15949606895446777, 0.650848388671875, 1.1422005891799927, 1.6335527896881104, 2.1249051094055176, 2.6162571907043457, 3.107609510421753, 3.59896183013916, 4.090313911437988, 4.581665992736816, 5.0730180740356445, 5.564370632171631, 6.055722713470459, 6.547074794769287, 7.038427352905273, 7.529779434204102, 8.02113151550293, 8.512484550476074, 9.003836631774902, 9.49518871307373, 9.986541748046875, 10.477893829345703, 10.969245910644531, 11.46059799194336, 11.951950073242188, 12.443302154541016, 12.934654235839844, 13.426006317138672, 13.9173583984375, 14.408711433410645, 14.900063514709473, 15.3914155960083, 15.882767677307129, 16.374120712280273, 16.8654727935791, 17.35682487487793, 17.848176956176758, 18.339529037475586, 18.830881118774414, 19.322235107421875, 19.813587188720703, 20.3049373626709, 20.796289443969727, 21.287641525268555, 21.778993606567383, 22.27034568786621, 22.76169776916504, 23.2530517578125, 23.744403839111328, 24.235755920410156]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 1.0, 8.0, 9.0, 15.0, 8.0, 17.0, 12.0, 23.0, 20.0, 22.0, 28.0, 35.0, 31.0, 33.0, 46.0, 44.0, 40.0, 37.0, 46.0, 42.0, 44.0, 41.0, 43.0, 33.0, 46.0, 33.0, 44.0, 37.0, 30.0, 32.0, 21.0, 10.0, 20.0, 11.0, 9.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4333488941192627, -2.3600993156433105, -2.2868497371673584, -2.2136003971099854, -2.140350818634033, -2.067101240158081, -1.993851661682129, -1.9206020832061768, -1.8473526239395142, -1.774103045463562, -1.7008535861968994, -1.6276040077209473, -1.5543544292449951, -1.4811049699783325, -1.4078553915023804, -1.3346059322357178, -1.2613563537597656, -1.1881067752838135, -1.1148573160171509, -1.0416077375411987, -0.9683582186698914, -0.895108699798584, -0.8218591213226318, -0.7486096024513245, -0.6753600835800171, -0.6021105647087097, -0.5288610458374023, -0.4556114673614502, -0.3823619484901428, -0.30911242961883545, -0.2358628809452057, -0.16261333227157593, -0.08936357498168945, -0.016114041209220886, 0.05713549256324768, 0.13038502633571625, 0.20363456010818481, 0.2768840789794922, 0.35013362765312195, 0.4233831763267517, 0.4966326951980591, 0.5698822140693665, 0.6431317329406738, 0.716381311416626, 0.7896308302879333, 0.8628803491592407, 0.9361299276351929, 1.0093793869018555, 1.0826289653778076, 1.1558785438537598, 1.2291280031204224, 1.3023775815963745, 1.375627040863037, 1.4488766193389893, 1.5221261978149414, 1.5953757762908936, 1.6686252355575562, 1.7418748140335083, 1.815124273300171, 1.888373851776123, 1.9616234302520752, 2.0348730087280273, 2.1081223487854004, 2.1813719272613525, 2.2546215057373047]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 13.0, 9.0, 17.0, 22.0, 26.0, 40.0, 51.0, 82.0, 102.0, 178.0, 336.0, 615.0, 1440.0, 3544.0, 9165.0, 24149.0, 62412.0, 222951.0, 534168.0, 120662.0, 41326.0, 16269.0, 6196.0, 2439.0, 1053.0, 511.0, 280.0, 141.0, 124.0, 66.0, 42.0, 43.0, 25.0, 13.0, 18.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.82464599609375, -2.7371826171875, -2.64971923828125, -2.562255859375, -2.47479248046875, -2.3873291015625, -2.29986572265625, -2.21240234375, -2.12493896484375, -2.0374755859375, -1.95001220703125, -1.862548828125, -1.77508544921875, -1.6876220703125, -1.60015869140625, -1.5126953125, -1.42523193359375, -1.3377685546875, -1.25030517578125, -1.162841796875, -1.07537841796875, -0.9879150390625, -0.90045166015625, -0.81298828125, -0.72552490234375, -0.6380615234375, -0.55059814453125, -0.463134765625, -0.37567138671875, -0.2882080078125, -0.20074462890625, -0.11328125, -0.02581787109375, 0.0616455078125, 0.14910888671875, 0.236572265625, 0.32403564453125, 0.4114990234375, 0.49896240234375, 0.58642578125, 0.67388916015625, 0.7613525390625, 0.84881591796875, 0.936279296875, 1.02374267578125, 1.1112060546875, 1.19866943359375, 1.2861328125, 1.37359619140625, 1.4610595703125, 1.54852294921875, 1.635986328125, 1.72344970703125, 1.8109130859375, 1.89837646484375, 1.98583984375, 2.07330322265625, 2.1607666015625, 2.24822998046875, 2.335693359375, 2.42315673828125, 2.5106201171875, 2.59808349609375, 2.685546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 4.0, 13.0, 8.0, 8.0, 13.0, 8.0, 18.0, 20.0, 23.0, 29.0, 27.0, 33.0, 34.0, 39.0, 43.0, 34.0, 51.0, 39.0, 36.0, 43.0, 47.0, 31.0, 37.0, 46.0, 44.0, 34.0, 35.0, 30.0, 31.0, 32.0, 22.0, 22.0, 9.0, 15.0, 12.0, 7.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.48828125, -4.35302734375, -4.2177734375, -4.08251953125, -3.947265625, -3.81201171875, -3.6767578125, -3.54150390625, -3.40625, -3.27099609375, -3.1357421875, -3.00048828125, -2.865234375, -2.72998046875, -2.5947265625, -2.45947265625, -2.32421875, -2.18896484375, -2.0537109375, -1.91845703125, -1.783203125, -1.64794921875, -1.5126953125, -1.37744140625, -1.2421875, -1.10693359375, -0.9716796875, -0.83642578125, -0.701171875, -0.56591796875, -0.4306640625, -0.29541015625, -0.16015625, -0.02490234375, 0.1103515625, 0.24560546875, 0.380859375, 0.51611328125, 0.6513671875, 0.78662109375, 0.921875, 1.05712890625, 1.1923828125, 1.32763671875, 1.462890625, 1.59814453125, 1.7333984375, 1.86865234375, 2.00390625, 2.13916015625, 2.2744140625, 2.40966796875, 2.544921875, 2.68017578125, 2.8154296875, 2.95068359375, 3.0859375, 3.22119140625, 3.3564453125, 3.49169921875, 3.626953125, 3.76220703125, 3.8974609375, 4.03271484375, 4.16796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 10.0, 12.0, 10.0, 15.0, 26.0, 25.0, 24.0, 40.0, 40.0, 66.0, 86.0, 96.0, 196.0, 347.0, 802.0, 6917.0, 179687.0, 833880.0, 23421.0, 1646.0, 421.0, 217.0, 126.0, 90.0, 57.0, 58.0, 38.0, 26.0, 34.0, 27.0, 14.0, 13.0, 14.0, 9.0, 10.0, 7.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-8.6328125, -8.36474609375, -8.0966796875, -7.82861328125, -7.560546875, -7.29248046875, -7.0244140625, -6.75634765625, -6.48828125, -6.22021484375, -5.9521484375, -5.68408203125, -5.416015625, -5.14794921875, -4.8798828125, -4.61181640625, -4.34375, -4.07568359375, -3.8076171875, -3.53955078125, -3.271484375, -3.00341796875, -2.7353515625, -2.46728515625, -2.19921875, -1.93115234375, -1.6630859375, -1.39501953125, -1.126953125, -0.85888671875, -0.5908203125, -0.32275390625, -0.0546875, 0.21337890625, 0.4814453125, 0.74951171875, 1.017578125, 1.28564453125, 1.5537109375, 1.82177734375, 2.08984375, 2.35791015625, 2.6259765625, 2.89404296875, 3.162109375, 3.43017578125, 3.6982421875, 3.96630859375, 4.234375, 4.50244140625, 4.7705078125, 5.03857421875, 5.306640625, 5.57470703125, 5.8427734375, 6.11083984375, 6.37890625, 6.64697265625, 6.9150390625, 7.18310546875, 7.451171875, 7.71923828125, 7.9873046875, 8.25537109375, 8.5234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 9.0, 6.0, 6.0, 7.0, 12.0, 17.0, 19.0, 18.0, 15.0, 22.0, 27.0, 32.0, 31.0, 45.0, 54.0, 49.0, 54.0, 42.0, 44.0, 58.0, 52.0, 34.0, 43.0, 30.0, 32.0, 32.0, 44.0, 30.0, 13.0, 22.0, 15.0, 14.0, 11.0, 13.0, 7.0, 3.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.1953125, -5.0299072265625, -4.864501953125, -4.6990966796875, -4.53369140625, -4.3682861328125, -4.202880859375, -4.0374755859375, -3.8720703125, -3.7066650390625, -3.541259765625, -3.3758544921875, -3.21044921875, -3.0450439453125, -2.879638671875, -2.7142333984375, -2.548828125, -2.3834228515625, -2.218017578125, -2.0526123046875, -1.88720703125, -1.7218017578125, -1.556396484375, -1.3909912109375, -1.2255859375, -1.0601806640625, -0.894775390625, -0.7293701171875, -0.56396484375, -0.3985595703125, -0.233154296875, -0.0677490234375, 0.09765625, 0.2630615234375, 0.428466796875, 0.5938720703125, 0.75927734375, 0.9246826171875, 1.090087890625, 1.2554931640625, 1.4208984375, 1.5863037109375, 1.751708984375, 1.9171142578125, 2.08251953125, 2.2479248046875, 2.413330078125, 2.5787353515625, 2.744140625, 2.9095458984375, 3.074951171875, 3.2403564453125, 3.40576171875, 3.5711669921875, 3.736572265625, 3.9019775390625, 4.0673828125, 4.2327880859375, 4.398193359375, 4.5635986328125, 4.72900390625, 4.8944091796875, 5.059814453125, 5.2252197265625, 5.390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 4.0, 8.0, 12.0, 18.0, 26.0, 25.0, 48.0, 88.0, 162.0, 313.0, 717.0, 2030.0, 11808.0, 281435.0, 726520.0, 21053.0, 2670.0, 810.0, 343.0, 192.0, 96.0, 52.0, 39.0, 23.0, 15.0, 13.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.3515625, -2.2734375, -2.1953125, -2.1171875, -2.0390625, -1.9609375, -1.8828125, -1.8046875, -1.7265625, -1.6484375, -1.5703125, -1.4921875, -1.4140625, -1.3359375, -1.2578125, -1.1796875, -1.1015625, -1.0234375, -0.9453125, -0.8671875, -0.7890625, -0.7109375, -0.6328125, -0.5546875, -0.4765625, -0.3984375, -0.3203125, -0.2421875, -0.1640625, -0.0859375, -0.0078125, 0.0703125, 0.1484375, 0.2265625, 0.3046875, 0.3828125, 0.4609375, 0.5390625, 0.6171875, 0.6953125, 0.7734375, 0.8515625, 0.9296875, 1.0078125, 1.0859375, 1.1640625, 1.2421875, 1.3203125, 1.3984375, 1.4765625, 1.5546875, 1.6328125, 1.7109375, 1.7890625, 1.8671875, 1.9453125, 2.0234375, 2.1015625, 2.1796875, 2.2578125, 2.3359375, 2.4140625, 2.4921875, 2.5703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 14.0, 42.0, 64.0, 152.0, 439.0, 153.0, 93.0, 36.0, 11.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009088516235351562, -0.0008864030241966248, -0.0008639544248580933, -0.0008415058255195618, -0.0008190572261810303, -0.0007966086268424988, -0.0007741600275039673, -0.0007517114281654358, -0.0007292628288269043, -0.0007068142294883728, -0.0006843656301498413, -0.0006619170308113098, -0.0006394684314727783, -0.0006170198321342468, -0.0005945712327957153, -0.0005721226334571838, -0.0005496740341186523, -0.0005272254347801208, -0.0005047768354415894, -0.00048232823610305786, -0.00045987963676452637, -0.0004374310374259949, -0.0004149824380874634, -0.0003925338387489319, -0.0003700852394104004, -0.0003476366400718689, -0.0003251880407333374, -0.0003027394413948059, -0.0002802908420562744, -0.0002578422427177429, -0.00023539364337921143, -0.00021294504404067993, -0.00019049644470214844, -0.00016804784536361694, -0.00014559924602508545, -0.00012315064668655396, -0.00010070204734802246, -7.825344800949097e-05, -5.580484867095947e-05, -3.335624933242798e-05, -1.0907649993896484e-05, 1.154094934463501e-05, 3.3989548683166504e-05, 5.6438148021698e-05, 7.888674736022949e-05, 0.00010133534669876099, 0.00012378394603729248, 0.00014623254537582397, 0.00016868114471435547, 0.00019112974405288696, 0.00021357834339141846, 0.00023602694272994995, 0.00025847554206848145, 0.00028092414140701294, 0.00030337274074554443, 0.00032582134008407593, 0.0003482699394226074, 0.0003707185387611389, 0.0003931671380996704, 0.0004156157374382019, 0.0004380643367767334, 0.0004605129361152649, 0.0004829615354537964, 0.0005054101347923279, 0.0005278587341308594]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 13.0, 9.0, 10.0, 22.0, 29.0, 47.0, 55.0, 54.0, 98.0, 124.0, 189.0, 312.0, 587.0, 1121.0, 3108.0, 16369.0, 320298.0, 674503.0, 24927.0, 3634.0, 1377.0, 623.0, 321.0, 188.0, 138.0, 108.0, 81.0, 56.0, 32.0, 33.0, 21.0, 16.0, 14.0, 11.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.509765625, -2.42633056640625, -2.3428955078125, -2.25946044921875, -2.176025390625, -2.09259033203125, -2.0091552734375, -1.92572021484375, -1.84228515625, -1.75885009765625, -1.6754150390625, -1.59197998046875, -1.508544921875, -1.42510986328125, -1.3416748046875, -1.25823974609375, -1.1748046875, -1.09136962890625, -1.0079345703125, -0.92449951171875, -0.841064453125, -0.75762939453125, -0.6741943359375, -0.59075927734375, -0.50732421875, -0.42388916015625, -0.3404541015625, -0.25701904296875, -0.173583984375, -0.09014892578125, -0.0067138671875, 0.07672119140625, 0.16015625, 0.24359130859375, 0.3270263671875, 0.41046142578125, 0.493896484375, 0.57733154296875, 0.6607666015625, 0.74420166015625, 0.82763671875, 0.91107177734375, 0.9945068359375, 1.07794189453125, 1.161376953125, 1.24481201171875, 1.3282470703125, 1.41168212890625, 1.4951171875, 1.57855224609375, 1.6619873046875, 1.74542236328125, 1.828857421875, 1.91229248046875, 1.9957275390625, 2.07916259765625, 2.16259765625, 2.24603271484375, 2.3294677734375, 2.41290283203125, 2.496337890625, 2.57977294921875, 2.6632080078125, 2.74664306640625, 2.830078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 15.0, 6.0, 16.0, 15.0, 25.0, 24.0, 34.0, 39.0, 48.0, 95.0, 255.0, 117.0, 52.0, 41.0, 46.0, 47.0, 34.0, 20.0, 12.0, 9.0, 8.0, 7.0, 5.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.5198822021484375, -0.498748779296875, -0.4776153564453125, -0.45648193359375, -0.4353485107421875, -0.414215087890625, -0.3930816650390625, -0.3719482421875, -0.3508148193359375, -0.329681396484375, -0.3085479736328125, -0.28741455078125, -0.2662811279296875, -0.245147705078125, -0.2240142822265625, -0.202880859375, -0.1817474365234375, -0.160614013671875, -0.1394805908203125, -0.11834716796875, -0.0972137451171875, -0.076080322265625, -0.0549468994140625, -0.0338134765625, -0.0126800537109375, 0.008453369140625, 0.0295867919921875, 0.05072021484375, 0.0718536376953125, 0.092987060546875, 0.1141204833984375, 0.13525390625, 0.1563873291015625, 0.177520751953125, 0.1986541748046875, 0.21978759765625, 0.2409210205078125, 0.262054443359375, 0.2831878662109375, 0.3043212890625, 0.3254547119140625, 0.346588134765625, 0.3677215576171875, 0.38885498046875, 0.4099884033203125, 0.431121826171875, 0.4522552490234375, 0.473388671875, 0.4945220947265625, 0.515655517578125, 0.5367889404296875, 0.55792236328125, 0.5790557861328125, 0.600189208984375, 0.6213226318359375, 0.6424560546875, 0.6635894775390625, 0.684722900390625, 0.7058563232421875, 0.72698974609375, 0.7481231689453125, 0.769256591796875, 0.7903900146484375, 0.8115234375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 14.0, 42.0, 126.0, 229.0, 291.0, 208.0, 72.0, 23.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.59986686706543, -30.915311813354492, -30.230758666992188, -29.54620361328125, -28.861650466918945, -28.177095413208008, -27.492542266845703, -26.807987213134766, -26.12343406677246, -25.438879013061523, -24.75432586669922, -24.06977081298828, -23.385217666625977, -22.70066261291504, -22.016109466552734, -21.331554412841797, -20.64699935913086, -19.962444305419922, -19.277891159057617, -18.59333610534668, -17.908782958984375, -17.224227905273438, -16.539674758911133, -15.855119705200195, -15.17056655883789, -14.48601245880127, -13.801458358764648, -13.116904258728027, -12.432350158691406, -11.747796058654785, -11.063241958618164, -10.378686904907227, -9.694134712219238, -9.009580612182617, -8.325026512145996, -7.640472412109375, -6.955918312072754, -6.271364212036133, -5.5868096351623535, -4.902255535125732, -4.217701435089111, -3.5331473350524902, -2.848593235015869, -2.164038896560669, -1.4794847965240479, -0.7949306964874268, -0.11037635803222656, 0.5741777420043945, 1.2587318420410156, 1.9432859420776367, 2.627840042114258, 3.312394380569458, 3.996948480606079, 4.681502342224121, 5.3660569190979, 6.0506110191345215, 6.735165119171143, 7.419719219207764, 8.104273796081543, 8.788827896118164, 9.473381996154785, 10.157936096191406, 10.842490196228027, 11.527044296264648, 12.21159839630127]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 4.0, 4.0, 6.0, 4.0, 12.0, 5.0, 11.0, 17.0, 18.0, 12.0, 20.0, 18.0, 22.0, 27.0, 24.0, 25.0, 28.0, 30.0, 34.0, 38.0, 32.0, 37.0, 37.0, 52.0, 37.0, 31.0, 50.0, 39.0, 36.0, 21.0, 29.0, 30.0, 33.0, 27.0, 19.0, 13.0, 24.0, 12.0, 16.0, 17.0, 7.0, 11.0, 5.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 5.0, 0.0, 1.0, 3.0], "bins": [-7.869814395904541, -7.64447021484375, -7.419126033782959, -7.193781852722168, -6.968438148498535, -6.743093967437744, -6.517749786376953, -6.292405605316162, -6.067061424255371, -5.84171724319458, -5.616373062133789, -5.391029357910156, -5.165685176849365, -4.940340995788574, -4.714996814727783, -4.489652633666992, -4.264308929443359, -4.038964748382568, -3.8136208057403564, -3.5882766246795654, -3.3629326820373535, -3.1375885009765625, -2.9122443199157715, -2.6869001388549805, -2.4615561962127686, -2.2362120151519775, -2.0108680725097656, -1.7855238914489746, -1.5601798295974731, -1.3348357677459717, -1.1094915866851807, -0.8841475248336792, -0.6588029861450195, -0.4334588944911957, -0.20811480283737183, 0.017229318618774414, 0.24257338047027588, 0.46791744232177734, 0.6932616233825684, 0.9186056852340698, 1.1439497470855713, 1.3692938089370728, 1.5946378707885742, 1.8199820518493652, 2.0453262329101562, 2.270670175552368, 2.496014356613159, 2.721358299255371, 2.946702480316162, 3.172046661376953, 3.397390604019165, 3.622734785079956, 3.848078727722168, 4.073422908782959, 4.29876708984375, 4.524111270904541, 4.749455451965332, 4.974799633026123, 5.200143814086914, 5.425487518310547, 5.650831699371338, 5.876175880432129, 6.10152006149292, 6.326864242553711, 6.552207946777344]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 1.0, 2.0, 7.0, 1.0, 7.0, 7.0, 6.0, 4.0, 14.0, 14.0, 17.0, 21.0, 20.0, 34.0, 29.0, 50.0, 63.0, 78.0, 97.0, 152.0, 217.0, 368.0, 690.0, 1629.0, 4815.0, 18821.0, 101668.0, 730872.0, 2361625.0, 821598.0, 119662.0, 21903.0, 5529.0, 1942.0, 877.0, 454.0, 265.0, 181.0, 133.0, 101.0, 64.0, 52.0, 43.0, 41.0, 23.0, 26.0, 22.0, 9.0, 11.0, 5.0, 4.0, 3.0, 0.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.26953125, -4.1383056640625, -4.007080078125, -3.8758544921875, -3.74462890625, -3.6134033203125, -3.482177734375, -3.3509521484375, -3.2197265625, -3.0885009765625, -2.957275390625, -2.8260498046875, -2.69482421875, -2.5635986328125, -2.432373046875, -2.3011474609375, -2.169921875, -2.0386962890625, -1.907470703125, -1.7762451171875, -1.64501953125, -1.5137939453125, -1.382568359375, -1.2513427734375, -1.1201171875, -0.9888916015625, -0.857666015625, -0.7264404296875, -0.59521484375, -0.4639892578125, -0.332763671875, -0.2015380859375, -0.0703125, 0.0609130859375, 0.192138671875, 0.3233642578125, 0.45458984375, 0.5858154296875, 0.717041015625, 0.8482666015625, 0.9794921875, 1.1107177734375, 1.241943359375, 1.3731689453125, 1.50439453125, 1.6356201171875, 1.766845703125, 1.8980712890625, 2.029296875, 2.1605224609375, 2.291748046875, 2.4229736328125, 2.55419921875, 2.6854248046875, 2.816650390625, 2.9478759765625, 3.0791015625, 3.2103271484375, 3.341552734375, 3.4727783203125, 3.60400390625, 3.7352294921875, 3.866455078125, 3.9976806640625, 4.12890625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 5.0, 7.0, 9.0, 11.0, 13.0, 19.0, 23.0, 22.0, 29.0, 24.0, 36.0, 33.0, 49.0, 45.0, 32.0, 47.0, 50.0, 40.0, 46.0, 51.0, 48.0, 39.0, 47.0, 40.0, 35.0, 20.0, 43.0, 15.0, 28.0, 15.0, 15.0, 17.0, 11.0, 15.0, 2.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.997833251953125, -2.90582275390625, -2.813812255859375, -2.7218017578125, -2.629791259765625, -2.53778076171875, -2.445770263671875, -2.353759765625, -2.261749267578125, -2.16973876953125, -2.077728271484375, -1.9857177734375, -1.893707275390625, -1.80169677734375, -1.709686279296875, -1.61767578125, -1.525665283203125, -1.43365478515625, -1.341644287109375, -1.2496337890625, -1.157623291015625, -1.06561279296875, -0.973602294921875, -0.881591796875, -0.789581298828125, -0.69757080078125, -0.605560302734375, -0.5135498046875, -0.421539306640625, -0.32952880859375, -0.237518310546875, -0.1455078125, -0.053497314453125, 0.03851318359375, 0.130523681640625, 0.2225341796875, 0.314544677734375, 0.40655517578125, 0.498565673828125, 0.590576171875, 0.682586669921875, 0.77459716796875, 0.866607666015625, 0.9586181640625, 1.050628662109375, 1.14263916015625, 1.234649658203125, 1.32666015625, 1.418670654296875, 1.51068115234375, 1.602691650390625, 1.6947021484375, 1.786712646484375, 1.87872314453125, 1.970733642578125, 2.062744140625, 2.154754638671875, 2.24676513671875, 2.338775634765625, 2.4307861328125, 2.522796630859375, 2.61480712890625, 2.706817626953125, 2.798828125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 12.0, 27.0, 53.0, 94.0, 202.0, 719.0, 2765.0, 52022.0, 4069586.0, 64501.0, 2990.0, 769.0, 265.0, 118.0, 54.0, 24.0, 24.0, 10.0, 11.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.2086181640625, -15.776611328125, -15.3446044921875, -14.91259765625, -14.4805908203125, -14.048583984375, -13.6165771484375, -13.1845703125, -12.7525634765625, -12.320556640625, -11.8885498046875, -11.45654296875, -11.0245361328125, -10.592529296875, -10.1605224609375, -9.728515625, -9.2965087890625, -8.864501953125, -8.4324951171875, -8.00048828125, -7.5684814453125, -7.136474609375, -6.7044677734375, -6.2724609375, -5.8404541015625, -5.408447265625, -4.9764404296875, -4.54443359375, -4.1124267578125, -3.680419921875, -3.2484130859375, -2.81640625, -2.3843994140625, -1.952392578125, -1.5203857421875, -1.08837890625, -0.6563720703125, -0.224365234375, 0.2076416015625, 0.6396484375, 1.0716552734375, 1.503662109375, 1.9356689453125, 2.36767578125, 2.7996826171875, 3.231689453125, 3.6636962890625, 4.095703125, 4.5277099609375, 4.959716796875, 5.3917236328125, 5.82373046875, 6.2557373046875, 6.687744140625, 7.1197509765625, 7.5517578125, 7.9837646484375, 8.415771484375, 8.8477783203125, 9.27978515625, 9.7117919921875, 10.143798828125, 10.5758056640625, 11.0078125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 7.0, 15.0, 17.0, 41.0, 68.0, 123.0, 228.0, 449.0, 677.0, 902.0, 647.0, 440.0, 202.0, 114.0, 56.0, 34.0, 14.0, 12.0, 6.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.221923828125, -2.14892578125, -2.075927734375, -2.0029296875, -1.929931640625, -1.85693359375, -1.783935546875, -1.7109375, -1.637939453125, -1.56494140625, -1.491943359375, -1.4189453125, -1.345947265625, -1.27294921875, -1.199951171875, -1.126953125, -1.053955078125, -0.98095703125, -0.907958984375, -0.8349609375, -0.761962890625, -0.68896484375, -0.615966796875, -0.54296875, -0.469970703125, -0.39697265625, -0.323974609375, -0.2509765625, -0.177978515625, -0.10498046875, -0.031982421875, 0.041015625, 0.114013671875, 0.18701171875, 0.260009765625, 0.3330078125, 0.406005859375, 0.47900390625, 0.552001953125, 0.625, 0.697998046875, 0.77099609375, 0.843994140625, 0.9169921875, 0.989990234375, 1.06298828125, 1.135986328125, 1.208984375, 1.281982421875, 1.35498046875, 1.427978515625, 1.5009765625, 1.573974609375, 1.64697265625, 1.719970703125, 1.79296875, 1.865966796875, 1.93896484375, 2.011962890625, 2.0849609375, 2.157958984375, 2.23095703125, 2.303955078125, 2.376953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 12.0, 17.0, 26.0, 55.0, 78.0, 103.0, 112.0, 133.0, 126.0, 107.0, 86.0, 58.0, 38.0, 23.0, 11.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.418701171875, -5.199883460998535, -4.98106575012207, -4.7622480392456055, -4.543430805206299, -4.324613094329834, -4.105795383453369, -3.8869776725769043, -3.6681599617004395, -3.4493422508239746, -3.230524778366089, -3.011707067489624, -2.792889356613159, -2.5740718841552734, -2.3552541732788086, -2.1364364624023438, -1.917618989944458, -1.6988013982772827, -1.4799836874008179, -1.2611660957336426, -1.0423483848571777, -0.8235307931900024, -0.6047132015228271, -0.3858954906463623, -0.167077898979187, 0.05173973739147186, 0.27055737376213074, 0.4893749952316284, 0.7081926465034485, 0.9270102977752686, 1.1458278894424438, 1.3646456003189087, 1.583463191986084, 1.8022807836532593, 2.0210983753204346, 2.2399160861968994, 2.4587337970733643, 2.67755126953125, 2.896368980407715, 3.1151866912841797, 3.3340044021606445, 3.5528221130371094, 3.771639585494995, 3.99045729637146, 4.209274768829346, 4.4280924797058105, 4.646910190582275, 4.86572790145874, 5.084545135498047, 5.303362846374512, 5.522180557250977, 5.740998268127441, 5.959815502166748, 6.178633213043213, 6.397450923919678, 6.616268634796143, 6.835086345672607, 7.053904056549072, 7.272721767425537, 7.491539001464844, 7.710356712341309, 7.929174423217773, 8.147992134094238, 8.366809844970703, 8.585627555847168]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 9.0, 7.0, 7.0, 17.0, 10.0, 12.0, 18.0, 18.0, 21.0, 18.0, 24.0, 28.0, 28.0, 24.0, 37.0, 27.0, 30.0, 35.0, 39.0, 46.0, 42.0, 38.0, 39.0, 41.0, 43.0, 34.0, 30.0, 34.0, 27.0, 24.0, 24.0, 34.0, 19.0, 13.0, 18.0, 16.0, 12.0, 11.0, 3.0, 8.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.8566651344299316, -2.7673861980438232, -2.678107261657715, -2.5888285636901855, -2.499549627304077, -2.4102706909179688, -2.3209917545318604, -2.231712818145752, -2.1424341201782227, -2.0531551837921143, -1.9638763666152954, -1.874597430229187, -1.7853186130523682, -1.6960396766662598, -1.6067607402801514, -1.517481803894043, -1.4282028675079346, -1.3389239311218262, -1.2496451139450073, -1.160366177558899, -1.07108736038208, -0.9818084239959717, -0.8925294876098633, -0.8032506108283997, -0.713971734046936, -0.6246928572654724, -0.5354139804840088, -0.4461350440979004, -0.35685616731643677, -0.26757729053497314, -0.17829835414886475, -0.08901947736740112, 0.00025963783264160156, 0.08953852951526642, 0.17881742119789124, 0.26809632778167725, 0.35737520456314087, 0.4466540813446045, 0.5359330177307129, 0.6252118945121765, 0.7144907712936401, 0.8037696480751038, 0.8930485248565674, 0.9823274612426758, 1.0716063976287842, 1.160885214805603, 1.2501641511917114, 1.3394429683685303, 1.4287219047546387, 1.518000841140747, 1.607279658317566, 1.6965585947036743, 1.7858374118804932, 1.8751163482666016, 1.96439528465271, 2.0536742210388184, 2.1429529190063477, 2.232231855392456, 2.3215107917785645, 2.4107894897460938, 2.500068426132202, 2.5893473625183105, 2.678626298904419, 2.7679052352905273, 2.8571841716766357]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 6.0, 14.0, 14.0, 24.0, 35.0, 53.0, 93.0, 123.0, 212.0, 326.0, 557.0, 1122.0, 2430.0, 7577.0, 45987.0, 423751.0, 495062.0, 56930.0, 8779.0, 2693.0, 1185.0, 625.0, 372.0, 199.0, 115.0, 95.0, 53.0, 41.0, 20.0, 17.0, 13.0, 10.0, 7.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1640625, -1.1265716552734375, -1.089080810546875, -1.0515899658203125, -1.01409912109375, -0.9766082763671875, -0.939117431640625, -0.9016265869140625, -0.8641357421875, -0.8266448974609375, -0.789154052734375, -0.7516632080078125, -0.71417236328125, -0.6766815185546875, -0.639190673828125, -0.6016998291015625, -0.564208984375, -0.5267181396484375, -0.489227294921875, -0.4517364501953125, -0.41424560546875, -0.3767547607421875, -0.339263916015625, -0.3017730712890625, -0.2642822265625, -0.2267913818359375, -0.189300537109375, -0.1518096923828125, -0.11431884765625, -0.0768280029296875, -0.039337158203125, -0.0018463134765625, 0.03564453125, 0.0731353759765625, 0.110626220703125, 0.1481170654296875, 0.18560791015625, 0.2230987548828125, 0.260589599609375, 0.2980804443359375, 0.3355712890625, 0.3730621337890625, 0.410552978515625, 0.4480438232421875, 0.48553466796875, 0.5230255126953125, 0.560516357421875, 0.5980072021484375, 0.635498046875, 0.6729888916015625, 0.710479736328125, 0.7479705810546875, 0.78546142578125, 0.8229522705078125, 0.860443115234375, 0.8979339599609375, 0.9354248046875, 0.9729156494140625, 1.010406494140625, 1.0478973388671875, 1.08538818359375, 1.1228790283203125, 1.160369873046875, 1.1978607177734375, 1.2353515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 11.0, 12.0, 19.0, 22.0, 25.0, 27.0, 35.0, 48.0, 44.0, 42.0, 49.0, 60.0, 65.0, 65.0, 77.0, 60.0, 53.0, 37.0, 46.0, 32.0, 40.0, 33.0, 23.0, 20.0, 13.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3671875, -3.265594482421875, -3.16400146484375, -3.062408447265625, -2.9608154296875, -2.859222412109375, -2.75762939453125, -2.656036376953125, -2.554443359375, -2.452850341796875, -2.35125732421875, -2.249664306640625, -2.1480712890625, -2.046478271484375, -1.94488525390625, -1.843292236328125, -1.74169921875, -1.640106201171875, -1.53851318359375, -1.436920166015625, -1.3353271484375, -1.233734130859375, -1.13214111328125, -1.030548095703125, -0.928955078125, -0.827362060546875, -0.72576904296875, -0.624176025390625, -0.5225830078125, -0.420989990234375, -0.31939697265625, -0.217803955078125, -0.1162109375, -0.014617919921875, 0.08697509765625, 0.188568115234375, 0.2901611328125, 0.391754150390625, 0.49334716796875, 0.594940185546875, 0.696533203125, 0.798126220703125, 0.89971923828125, 1.001312255859375, 1.1029052734375, 1.204498291015625, 1.30609130859375, 1.407684326171875, 1.50927734375, 1.610870361328125, 1.71246337890625, 1.814056396484375, 1.9156494140625, 2.017242431640625, 2.11883544921875, 2.220428466796875, 2.322021484375, 2.423614501953125, 2.52520751953125, 2.626800537109375, 2.7283935546875, 2.829986572265625, 2.93157958984375, 3.033172607421875, 3.134765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 7.0, 18.0, 17.0, 26.0, 47.0, 58.0, 134.0, 248.0, 520.0, 1160.0, 2703.0, 6628.0, 16532.0, 41915.0, 104469.0, 225969.0, 307163.0, 197135.0, 86311.0, 34412.0, 13598.0, 5367.0, 2235.0, 987.0, 432.0, 176.0, 105.0, 58.0, 36.0, 27.0, 10.0, 14.0, 5.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353515625, -0.3422584533691406, -0.33100128173828125, -0.3197441101074219, -0.3084869384765625, -0.2972297668457031, -0.28597259521484375, -0.2747154235839844, -0.263458251953125, -0.2522010803222656, -0.24094390869140625, -0.22968673706054688, -0.2184295654296875, -0.20717239379882812, -0.19591522216796875, -0.18465805053710938, -0.17340087890625, -0.16214370727539062, -0.15088653564453125, -0.13962936401367188, -0.1283721923828125, -0.11711502075195312, -0.10585784912109375, -0.09460067749023438, -0.083343505859375, -0.07208633422851562, -0.06082916259765625, -0.049571990966796875, -0.0383148193359375, -0.027057647705078125, -0.01580047607421875, -0.004543304443359375, 0.0067138671875, 0.017971038818359375, 0.02922821044921875, 0.040485382080078125, 0.0517425537109375, 0.06299972534179688, 0.07425689697265625, 0.08551406860351562, 0.096771240234375, 0.10802841186523438, 0.11928558349609375, 0.13054275512695312, 0.1417999267578125, 0.15305709838867188, 0.16431427001953125, 0.17557144165039062, 0.18682861328125, 0.19808578491210938, 0.20934295654296875, 0.22060012817382812, 0.2318572998046875, 0.24311447143554688, 0.25437164306640625, 0.2656288146972656, 0.276885986328125, 0.2881431579589844, 0.29940032958984375, 0.3106575012207031, 0.3219146728515625, 0.3331718444824219, 0.34442901611328125, 0.3556861877441406, 0.366943359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 9.0, 8.0, 16.0, 17.0, 18.0, 18.0, 28.0, 39.0, 20.0, 47.0, 50.0, 40.0, 43.0, 38.0, 58.0, 42.0, 56.0, 62.0, 40.0, 44.0, 39.0, 34.0, 29.0, 29.0, 29.0, 24.0, 18.0, 18.0, 16.0, 7.0, 8.0, 7.0, 8.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.34375, -5.161376953125, -4.97900390625, -4.796630859375, -4.6142578125, -4.431884765625, -4.24951171875, -4.067138671875, -3.884765625, -3.702392578125, -3.52001953125, -3.337646484375, -3.1552734375, -2.972900390625, -2.79052734375, -2.608154296875, -2.42578125, -2.243408203125, -2.06103515625, -1.878662109375, -1.6962890625, -1.513916015625, -1.33154296875, -1.149169921875, -0.966796875, -0.784423828125, -0.60205078125, -0.419677734375, -0.2373046875, -0.054931640625, 0.12744140625, 0.309814453125, 0.4921875, 0.674560546875, 0.85693359375, 1.039306640625, 1.2216796875, 1.404052734375, 1.58642578125, 1.768798828125, 1.951171875, 2.133544921875, 2.31591796875, 2.498291015625, 2.6806640625, 2.863037109375, 3.04541015625, 3.227783203125, 3.41015625, 3.592529296875, 3.77490234375, 3.957275390625, 4.1396484375, 4.322021484375, 4.50439453125, 4.686767578125, 4.869140625, 5.051513671875, 5.23388671875, 5.416259765625, 5.5986328125, 5.781005859375, 5.96337890625, 6.145751953125, 6.328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 10.0, 14.0, 18.0, 19.0, 28.0, 52.0, 83.0, 125.0, 228.0, 365.0, 738.0, 1679.0, 5237.0, 22231.0, 159083.0, 649585.0, 176556.0, 23787.0, 5360.0, 1773.0, 725.0, 331.0, 206.0, 99.0, 67.0, 56.0, 34.0, 25.0, 13.0, 4.0, 10.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08782958984375, -0.08495235443115234, -0.08207511901855469, -0.07919788360595703, -0.07632064819335938, -0.07344341278076172, -0.07056617736816406, -0.0676889419555664, -0.06481170654296875, -0.061934471130371094, -0.05905723571777344, -0.05618000030517578, -0.053302764892578125, -0.05042552947998047, -0.04754829406738281, -0.044671058654785156, -0.0417938232421875, -0.038916587829589844, -0.03603935241699219, -0.03316211700439453, -0.030284881591796875, -0.02740764617919922, -0.024530410766601562, -0.021653175354003906, -0.01877593994140625, -0.015898704528808594, -0.013021469116210938, -0.010144233703613281, -0.007266998291015625, -0.004389762878417969, -0.0015125274658203125, 0.0013647079467773438, 0.004241943359375, 0.007119178771972656, 0.009996414184570312, 0.012873649597167969, 0.015750885009765625, 0.01862812042236328, 0.021505355834960938, 0.024382591247558594, 0.02725982666015625, 0.030137062072753906, 0.03301429748535156, 0.03589153289794922, 0.038768768310546875, 0.04164600372314453, 0.04452323913574219, 0.047400474548339844, 0.0502777099609375, 0.053154945373535156, 0.05603218078613281, 0.05890941619873047, 0.061786651611328125, 0.06466388702392578, 0.06754112243652344, 0.0704183578491211, 0.07329559326171875, 0.0761728286743164, 0.07905006408691406, 0.08192729949951172, 0.08480453491210938, 0.08768177032470703, 0.09055900573730469, 0.09343624114990234, 0.0963134765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 1.0, 10.0, 10.0, 33.0, 20.0, 32.0, 42.0, 63.0, 73.0, 69.0, 102.0, 80.0, 79.0, 85.0, 77.0, 51.0, 51.0, 34.0, 21.0, 21.0, 9.0, 11.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.568431854248047e-05, -6.410665810108185e-05, -6.252899765968323e-05, -6.095133721828461e-05, -5.9373676776885986e-05, -5.7796016335487366e-05, -5.6218355894088745e-05, -5.4640695452690125e-05, -5.3063035011291504e-05, -5.148537456989288e-05, -4.990771412849426e-05, -4.833005368709564e-05, -4.675239324569702e-05, -4.51747328042984e-05, -4.359707236289978e-05, -4.201941192150116e-05, -4.044175148010254e-05, -3.886409103870392e-05, -3.72864305973053e-05, -3.570877015590668e-05, -3.413110971450806e-05, -3.2553449273109436e-05, -3.0975788831710815e-05, -2.9398128390312195e-05, -2.7820467948913574e-05, -2.6242807507514954e-05, -2.4665147066116333e-05, -2.3087486624717712e-05, -2.1509826183319092e-05, -1.993216574192047e-05, -1.835450530052185e-05, -1.677684485912323e-05, -1.519918441772461e-05, -1.3621523976325989e-05, -1.2043863534927368e-05, -1.0466203093528748e-05, -8.888542652130127e-06, -7.310882210731506e-06, -5.733221769332886e-06, -4.155561327934265e-06, -2.5779008865356445e-06, -1.000240445137024e-06, 5.774199962615967e-07, 2.1550804376602173e-06, 3.732740879058838e-06, 5.3104013204574585e-06, 6.888061761856079e-06, 8.4657222032547e-06, 1.004338264465332e-05, 1.1621043086051941e-05, 1.3198703527450562e-05, 1.4776363968849182e-05, 1.6354024410247803e-05, 1.7931684851646423e-05, 1.9509345293045044e-05, 2.1087005734443665e-05, 2.2664666175842285e-05, 2.4242326617240906e-05, 2.5819987058639526e-05, 2.7397647500038147e-05, 2.8975307941436768e-05, 3.055296838283539e-05, 3.213062882423401e-05, 3.370828926563263e-05, 3.528594970703125e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 8.0, 7.0, 26.0, 28.0, 28.0, 54.0, 60.0, 139.0, 215.0, 414.0, 806.0, 1746.0, 4089.0, 13977.0, 77615.0, 634669.0, 270234.0, 31633.0, 7545.0, 2628.0, 1254.0, 582.0, 260.0, 175.0, 134.0, 68.0, 35.0, 31.0, 21.0, 24.0, 14.0, 5.0, 3.0, 8.0, 1.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10968017578125, -0.10652542114257812, -0.10337066650390625, -0.10021591186523438, -0.0970611572265625, -0.09390640258789062, -0.09075164794921875, -0.08759689331054688, -0.084442138671875, -0.08128738403320312, -0.07813262939453125, -0.07497787475585938, -0.0718231201171875, -0.06866836547851562, -0.06551361083984375, -0.062358856201171875, -0.0592041015625, -0.056049346923828125, -0.05289459228515625, -0.049739837646484375, -0.0465850830078125, -0.043430328369140625, -0.04027557373046875, -0.037120819091796875, -0.033966064453125, -0.030811309814453125, -0.02765655517578125, -0.024501800537109375, -0.0213470458984375, -0.018192291259765625, -0.01503753662109375, -0.011882781982421875, -0.00872802734375, -0.005573272705078125, -0.00241851806640625, 0.000736236572265625, 0.0038909912109375, 0.007045745849609375, 0.01020050048828125, 0.013355255126953125, 0.016510009765625, 0.019664764404296875, 0.02281951904296875, 0.025974273681640625, 0.0291290283203125, 0.032283782958984375, 0.03543853759765625, 0.038593292236328125, 0.041748046875, 0.044902801513671875, 0.04805755615234375, 0.051212310791015625, 0.0543670654296875, 0.057521820068359375, 0.06067657470703125, 0.06383132934570312, 0.066986083984375, 0.07014083862304688, 0.07329559326171875, 0.07645034790039062, 0.0796051025390625, 0.08275985717773438, 0.08591461181640625, 0.08906936645507812, 0.09222412109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 3.0, 3.0, 9.0, 4.0, 5.0, 5.0, 10.0, 11.0, 13.0, 21.0, 31.0, 34.0, 38.0, 64.0, 97.0, 103.0, 123.0, 111.0, 64.0, 64.0, 51.0, 29.0, 23.0, 18.0, 15.0, 7.0, 9.0, 8.0, 10.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02783203125, -0.02710556983947754, -0.026379108428955078, -0.025652647018432617, -0.024926185607910156, -0.024199724197387695, -0.023473262786865234, -0.022746801376342773, -0.022020339965820312, -0.02129387855529785, -0.02056741714477539, -0.01984095573425293, -0.01911449432373047, -0.018388032913208008, -0.017661571502685547, -0.016935110092163086, -0.016208648681640625, -0.015482187271118164, -0.014755725860595703, -0.014029264450073242, -0.013302803039550781, -0.01257634162902832, -0.01184988021850586, -0.011123418807983398, -0.010396957397460938, -0.009670495986938477, -0.008944034576416016, -0.008217573165893555, -0.007491111755371094, -0.006764650344848633, -0.006038188934326172, -0.005311727523803711, -0.00458526611328125, -0.003858804702758789, -0.003132343292236328, -0.002405881881713867, -0.0016794204711914062, -0.0009529590606689453, -0.00022649765014648438, 0.0004999637603759766, 0.0012264251708984375, 0.0019528865814208984, 0.0026793479919433594, 0.0034058094024658203, 0.004132270812988281, 0.004858732223510742, 0.005585193634033203, 0.006311655044555664, 0.007038116455078125, 0.007764577865600586, 0.008491039276123047, 0.009217500686645508, 0.009943962097167969, 0.01067042350769043, 0.01139688491821289, 0.012123346328735352, 0.012849807739257812, 0.013576269149780273, 0.014302730560302734, 0.015029191970825195, 0.015755653381347656, 0.016482114791870117, 0.017208576202392578, 0.01793503761291504, 0.0186614990234375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 15.0, 41.0, 163.0, 278.0, 309.0, 152.0, 47.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.976794242858887, -5.603147983551025, -5.229501724243164, -4.855855941772461, -4.4822096824646, -4.108563423156738, -3.734917402267456, -3.361271381378174, -2.9876251220703125, -2.613978862762451, -2.240332841873169, -1.8666867017745972, -1.4930405616760254, -1.1193944215774536, -0.7457482814788818, -0.3721022605895996, 0.0015439987182617188, 0.3751901388168335, 0.7488362789154053, 1.122482419013977, 1.4961285591125488, 1.8697746992111206, 2.2434208393096924, 2.6170668601989746, 2.990713119506836, 3.3643593788146973, 3.7380053997039795, 4.111651420593262, 4.485297679901123, 4.858943939208984, 5.2325897216796875, 5.606235980987549, 5.979883193969727, 6.353529453277588, 6.727175712585449, 7.100821495056152, 7.474467754364014, 7.848114013671875, 8.221759796142578, 8.595405578613281, 8.9690523147583, 9.342698097229004, 9.716344833374023, 10.089990615844727, 10.46363639831543, 10.83728313446045, 11.210928916931152, 11.584575653076172, 11.958221435546875, 12.331867218017578, 12.705513954162598, 13.0791597366333, 13.45280647277832, 13.826452255249023, 14.200098037719727, 14.57374382019043, 14.94739055633545, 15.321036338806152, 15.694683074951172, 16.068328857421875, 16.441974639892578, 16.81562042236328, 17.189268112182617, 17.56291389465332, 17.936559677124023]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 3.0, 10.0, 14.0, 16.0, 17.0, 20.0, 31.0, 27.0, 40.0, 42.0, 46.0, 47.0, 49.0, 61.0, 57.0, 76.0, 60.0, 63.0, 46.0, 53.0, 36.0, 45.0, 38.0, 19.0, 24.0, 18.0, 12.0, 11.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923027515411377, -2.825361728668213, -2.727695941925049, -2.6300299167633057, -2.5323641300201416, -2.4346983432769775, -2.3370323181152344, -2.2393665313720703, -2.1417007446289062, -2.044034957885742, -1.9463690519332886, -1.848703145980835, -1.751037359237671, -1.6533715724945068, -1.5557056665420532, -1.4580397605895996, -1.3603739738464355, -1.2627081871032715, -1.1650422811508179, -1.0673763751983643, -0.9697105884552002, -0.8720447421073914, -0.7743788957595825, -0.6767130494117737, -0.5790472030639648, -0.481381356716156, -0.38371551036834717, -0.28604966402053833, -0.1883838176727295, -0.09071797132492065, 0.006947875022888184, 0.10461372137069702, 0.20227980613708496, 0.2999456524848938, 0.39761149883270264, 0.4952773451805115, 0.5929431915283203, 0.6906090378761292, 0.788274884223938, 0.8859407305717468, 0.9836065769195557, 1.0812723636627197, 1.1789382696151733, 1.276604175567627, 1.374269962310791, 1.471935749053955, 1.5696016550064087, 1.6672675609588623, 1.7649333477020264, 1.8625991344451904, 1.960265040397644, 2.0579309463500977, 2.1555967330932617, 2.253262519836426, 2.35092830657959, 2.448594331741333, 2.546260118484497, 2.643925905227661, 2.7415919303894043, 2.8392577171325684, 2.9369235038757324, 3.0345892906188965, 3.1322550773620605, 3.2299211025238037, 3.3275868892669678]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 7.0, 4.0, 6.0, 14.0, 17.0, 24.0, 43.0, 68.0, 113.0, 221.0, 402.0, 966.0, 3184.0, 16053.0, 113985.0, 701135.0, 181444.0, 24184.0, 4397.0, 1179.0, 511.0, 253.0, 132.0, 77.0, 58.0, 24.0, 19.0, 13.0, 8.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.8936767578125, -3.728759765625, -3.5638427734375, -3.39892578125, -3.2340087890625, -3.069091796875, -2.9041748046875, -2.7392578125, -2.5743408203125, -2.409423828125, -2.2445068359375, -2.07958984375, -1.9146728515625, -1.749755859375, -1.5848388671875, -1.419921875, -1.2550048828125, -1.090087890625, -0.9251708984375, -0.76025390625, -0.5953369140625, -0.430419921875, -0.2655029296875, -0.1005859375, 0.0643310546875, 0.229248046875, 0.3941650390625, 0.55908203125, 0.7239990234375, 0.888916015625, 1.0538330078125, 1.21875, 1.3836669921875, 1.548583984375, 1.7135009765625, 1.87841796875, 2.0433349609375, 2.208251953125, 2.3731689453125, 2.5380859375, 2.7030029296875, 2.867919921875, 3.0328369140625, 3.19775390625, 3.3626708984375, 3.527587890625, 3.6925048828125, 3.857421875, 4.0223388671875, 4.187255859375, 4.3521728515625, 4.51708984375, 4.6820068359375, 4.846923828125, 5.0118408203125, 5.1767578125, 5.3416748046875, 5.506591796875, 5.6715087890625, 5.83642578125, 6.0013427734375, 6.166259765625, 6.3311767578125, 6.49609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 3.0, 6.0, 7.0, 14.0, 12.0, 18.0, 20.0, 38.0, 30.0, 39.0, 41.0, 40.0, 43.0, 42.0, 55.0, 56.0, 59.0, 71.0, 56.0, 44.0, 51.0, 43.0, 41.0, 27.0, 24.0, 41.0, 18.0, 11.0, 15.0, 9.0, 8.0, 8.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.720703125, -3.560638427734375, -3.40057373046875, -3.240509033203125, -3.0804443359375, -2.920379638671875, -2.76031494140625, -2.600250244140625, -2.440185546875, -2.280120849609375, -2.12005615234375, -1.959991455078125, -1.7999267578125, -1.639862060546875, -1.47979736328125, -1.319732666015625, -1.15966796875, -0.999603271484375, -0.83953857421875, -0.679473876953125, -0.5194091796875, -0.359344482421875, -0.19927978515625, -0.039215087890625, 0.120849609375, 0.280914306640625, 0.44097900390625, 0.601043701171875, 0.7611083984375, 0.921173095703125, 1.08123779296875, 1.241302490234375, 1.4013671875, 1.561431884765625, 1.72149658203125, 1.881561279296875, 2.0416259765625, 2.201690673828125, 2.36175537109375, 2.521820068359375, 2.681884765625, 2.841949462890625, 3.00201416015625, 3.162078857421875, 3.3221435546875, 3.482208251953125, 3.64227294921875, 3.802337646484375, 3.96240234375, 4.122467041015625, 4.28253173828125, 4.442596435546875, 4.6026611328125, 4.762725830078125, 4.92279052734375, 5.082855224609375, 5.242919921875, 5.402984619140625, 5.56304931640625, 5.723114013671875, 5.8831787109375, 6.043243408203125, 6.20330810546875, 6.363372802734375, 6.5234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 8.0, 11.0, 16.0, 10.0, 14.0, 24.0, 26.0, 47.0, 52.0, 57.0, 108.0, 119.0, 193.0, 349.0, 935.0, 5564.0, 105909.0, 874440.0, 55423.0, 3490.0, 738.0, 344.0, 191.0, 104.0, 81.0, 75.0, 41.0, 37.0, 24.0, 22.0, 13.0, 12.0, 12.0, 13.0, 6.0, 11.0, 5.0, 2.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.3046875, -9.0418701171875, -8.779052734375, -8.5162353515625, -8.25341796875, -7.9906005859375, -7.727783203125, -7.4649658203125, -7.2021484375, -6.9393310546875, -6.676513671875, -6.4136962890625, -6.15087890625, -5.8880615234375, -5.625244140625, -5.3624267578125, -5.099609375, -4.8367919921875, -4.573974609375, -4.3111572265625, -4.04833984375, -3.7855224609375, -3.522705078125, -3.2598876953125, -2.9970703125, -2.7342529296875, -2.471435546875, -2.2086181640625, -1.94580078125, -1.6829833984375, -1.420166015625, -1.1573486328125, -0.89453125, -0.6317138671875, -0.368896484375, -0.1060791015625, 0.15673828125, 0.4195556640625, 0.682373046875, 0.9451904296875, 1.2080078125, 1.4708251953125, 1.733642578125, 1.9964599609375, 2.25927734375, 2.5220947265625, 2.784912109375, 3.0477294921875, 3.310546875, 3.5733642578125, 3.836181640625, 4.0989990234375, 4.36181640625, 4.6246337890625, 4.887451171875, 5.1502685546875, 5.4130859375, 5.6759033203125, 5.938720703125, 6.2015380859375, 6.46435546875, 6.7271728515625, 6.989990234375, 7.2528076171875, 7.515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 6.0, 10.0, 9.0, 12.0, 13.0, 14.0, 23.0, 27.0, 30.0, 37.0, 40.0, 41.0, 41.0, 47.0, 67.0, 53.0, 51.0, 55.0, 63.0, 50.0, 37.0, 43.0, 32.0, 27.0, 27.0, 25.0, 19.0, 15.0, 15.0, 17.0, 11.0, 5.0, 7.0, 3.0, 3.0, 8.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.65545654296875, -4.4866943359375, -4.31793212890625, -4.149169921875, -3.98040771484375, -3.8116455078125, -3.64288330078125, -3.47412109375, -3.30535888671875, -3.1365966796875, -2.96783447265625, -2.799072265625, -2.63031005859375, -2.4615478515625, -2.29278564453125, -2.1240234375, -1.95526123046875, -1.7864990234375, -1.61773681640625, -1.448974609375, -1.28021240234375, -1.1114501953125, -0.94268798828125, -0.77392578125, -0.60516357421875, -0.4364013671875, -0.26763916015625, -0.098876953125, 0.06988525390625, 0.2386474609375, 0.40740966796875, 0.576171875, 0.74493408203125, 0.9136962890625, 1.08245849609375, 1.251220703125, 1.41998291015625, 1.5887451171875, 1.75750732421875, 1.92626953125, 2.09503173828125, 2.2637939453125, 2.43255615234375, 2.601318359375, 2.77008056640625, 2.9388427734375, 3.10760498046875, 3.2763671875, 3.44512939453125, 3.6138916015625, 3.78265380859375, 3.951416015625, 4.12017822265625, 4.2889404296875, 4.45770263671875, 4.62646484375, 4.79522705078125, 4.9639892578125, 5.13275146484375, 5.301513671875, 5.47027587890625, 5.6390380859375, 5.80780029296875, 5.9765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 2.0, 7.0, 10.0, 5.0, 16.0, 20.0, 22.0, 30.0, 39.0, 56.0, 84.0, 155.0, 404.0, 1242.0, 8198.0, 167927.0, 829644.0, 36298.0, 3131.0, 657.0, 220.0, 133.0, 73.0, 48.0, 27.0, 23.0, 25.0, 12.0, 9.0, 10.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.11328125, -3.03192138671875, -2.9505615234375, -2.86920166015625, -2.787841796875, -2.70648193359375, -2.6251220703125, -2.54376220703125, -2.46240234375, -2.38104248046875, -2.2996826171875, -2.21832275390625, -2.136962890625, -2.05560302734375, -1.9742431640625, -1.89288330078125, -1.8115234375, -1.73016357421875, -1.6488037109375, -1.56744384765625, -1.486083984375, -1.40472412109375, -1.3233642578125, -1.24200439453125, -1.16064453125, -1.07928466796875, -0.9979248046875, -0.91656494140625, -0.835205078125, -0.75384521484375, -0.6724853515625, -0.59112548828125, -0.509765625, -0.42840576171875, -0.3470458984375, -0.26568603515625, -0.184326171875, -0.10296630859375, -0.0216064453125, 0.05975341796875, 0.14111328125, 0.22247314453125, 0.3038330078125, 0.38519287109375, 0.466552734375, 0.54791259765625, 0.6292724609375, 0.71063232421875, 0.7919921875, 0.87335205078125, 0.9547119140625, 1.03607177734375, 1.117431640625, 1.19879150390625, 1.2801513671875, 1.36151123046875, 1.44287109375, 1.52423095703125, 1.6055908203125, 1.68695068359375, 1.768310546875, 1.84967041015625, 1.9310302734375, 2.01239013671875, 2.09375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 14.0, 15.0, 18.0, 22.0, 36.0, 56.0, 91.0, 141.0, 200.0, 120.0, 87.0, 42.0, 43.0, 17.0, 25.0, 21.0, 9.0, 12.0, 6.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003714561462402344, -0.00036202557384967804, -0.0003525950014591217, -0.00034316442906856537, -0.00033373385667800903, -0.0003243032842874527, -0.00031487271189689636, -0.00030544213950634, -0.0002960115671157837, -0.00028658099472522736, -0.000277150422334671, -0.0002677198499441147, -0.00025828927755355835, -0.000248858705163002, -0.00023942813277244568, -0.00022999756038188934, -0.000220566987991333, -0.00021113641560077667, -0.00020170584321022034, -0.000192275270819664, -0.00018284469842910767, -0.00017341412603855133, -0.000163983553647995, -0.00015455298125743866, -0.00014512240886688232, -0.000135691836476326, -0.00012626126408576965, -0.00011683069169521332, -0.00010740011930465698, -9.796954691410065e-05, -8.853897452354431e-05, -7.910840213298798e-05, -6.967782974243164e-05, -6.0247257351875305e-05, -5.081668496131897e-05, -4.1386112570762634e-05, -3.19555401802063e-05, -2.2524967789649963e-05, -1.3094395399093628e-05, -3.6638230085372925e-06, 5.766749382019043e-06, 1.5197321772575378e-05, 2.4627894163131714e-05, 3.405846655368805e-05, 4.3489038944244385e-05, 5.291961133480072e-05, 6.235018372535706e-05, 7.178075611591339e-05, 8.121132850646973e-05, 9.064190089702606e-05, 0.0001000724732875824, 0.00010950304567813873, 0.00011893361806869507, 0.0001283641904592514, 0.00013779476284980774, 0.00014722533524036407, 0.0001566559076309204, 0.00016608648002147675, 0.00017551705241203308, 0.00018494762480258942, 0.00019437819719314575, 0.0002038087695837021, 0.00021323934197425842, 0.00022266991436481476, 0.0002321004867553711]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 4.0, 8.0, 11.0, 27.0, 40.0, 83.0, 137.0, 299.0, 621.0, 1518.0, 5102.0, 92043.0, 900594.0, 42092.0, 3588.0, 1271.0, 507.0, 269.0, 129.0, 80.0, 49.0, 25.0, 12.0, 8.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.630859375, -2.53118896484375, -2.4315185546875, -2.33184814453125, -2.232177734375, -2.13250732421875, -2.0328369140625, -1.93316650390625, -1.83349609375, -1.73382568359375, -1.6341552734375, -1.53448486328125, -1.434814453125, -1.33514404296875, -1.2354736328125, -1.13580322265625, -1.0361328125, -0.93646240234375, -0.8367919921875, -0.73712158203125, -0.637451171875, -0.53778076171875, -0.4381103515625, -0.33843994140625, -0.23876953125, -0.13909912109375, -0.0394287109375, 0.06024169921875, 0.159912109375, 0.25958251953125, 0.3592529296875, 0.45892333984375, 0.55859375, 0.65826416015625, 0.7579345703125, 0.85760498046875, 0.957275390625, 1.05694580078125, 1.1566162109375, 1.25628662109375, 1.35595703125, 1.45562744140625, 1.5552978515625, 1.65496826171875, 1.754638671875, 1.85430908203125, 1.9539794921875, 2.05364990234375, 2.1533203125, 2.25299072265625, 2.3526611328125, 2.45233154296875, 2.552001953125, 2.65167236328125, 2.7513427734375, 2.85101318359375, 2.95068359375, 3.05035400390625, 3.1500244140625, 3.24969482421875, 3.349365234375, 3.44903564453125, 3.5487060546875, 3.64837646484375, 3.748046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 12.0, 15.0, 21.0, 27.0, 33.0, 53.0, 73.0, 118.0, 215.0, 151.0, 84.0, 73.0, 37.0, 31.0, 26.0, 7.0, 11.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0966796875, -1.066864013671875, -1.03704833984375, -1.007232666015625, -0.9774169921875, -0.947601318359375, -0.91778564453125, -0.887969970703125, -0.858154296875, -0.828338623046875, -0.79852294921875, -0.768707275390625, -0.7388916015625, -0.709075927734375, -0.67926025390625, -0.649444580078125, -0.61962890625, -0.589813232421875, -0.55999755859375, -0.530181884765625, -0.5003662109375, -0.470550537109375, -0.44073486328125, -0.410919189453125, -0.381103515625, -0.351287841796875, -0.32147216796875, -0.291656494140625, -0.2618408203125, -0.232025146484375, -0.20220947265625, -0.172393798828125, -0.142578125, -0.112762451171875, -0.08294677734375, -0.053131103515625, -0.0233154296875, 0.006500244140625, 0.03631591796875, 0.066131591796875, 0.095947265625, 0.125762939453125, 0.15557861328125, 0.185394287109375, 0.2152099609375, 0.245025634765625, 0.27484130859375, 0.304656982421875, 0.33447265625, 0.364288330078125, 0.39410400390625, 0.423919677734375, 0.4537353515625, 0.483551025390625, 0.51336669921875, 0.543182373046875, 0.572998046875, 0.602813720703125, 0.63262939453125, 0.662445068359375, 0.6922607421875, 0.722076416015625, 0.75189208984375, 0.781707763671875, 0.8115234375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 14.0, 51.0, 126.0, 228.0, 301.0, 176.0, 90.0, 18.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.715049743652344, -34.04909896850586, -33.383148193359375, -32.71719741821289, -32.05125045776367, -31.385299682617188, -30.719348907470703, -30.05339813232422, -29.387447357177734, -28.72149658203125, -28.0555477142334, -27.389596939086914, -26.72364616394043, -26.057697296142578, -25.391746520996094, -24.72579574584961, -24.059846878051758, -23.393896102905273, -22.727947235107422, -22.061996459960938, -21.396045684814453, -20.73009490966797, -20.064146041870117, -19.398195266723633, -18.73224639892578, -18.066295623779297, -17.400346755981445, -16.73439598083496, -16.068445205688477, -15.402495384216309, -14.73654556274414, -14.070594787597656, -13.404645919799805, -12.738696098327637, -12.072745323181152, -11.406795501708984, -10.7408447265625, -10.074894905090332, -9.408945083618164, -8.74299430847168, -8.077043533325195, -7.411093235015869, -6.745142936706543, -6.079193115234375, -5.413242816925049, -4.747292518615723, -4.081342697143555, -3.4153923988342285, -2.7494425773620605, -2.0834922790527344, -1.4175422191619873, -0.7515920400619507, -0.08564186096191406, 0.5803084373474121, 1.2462584972381592, 1.9122085571289062, 2.5781588554382324, 3.2441091537475586, 3.9100592136383057, 4.576009273529053, 5.241959571838379, 5.907909870147705, 6.573860168457031, 7.239809989929199, 7.905760288238525]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 4.0, 13.0, 7.0, 18.0, 14.0, 16.0, 30.0, 21.0, 36.0, 39.0, 37.0, 31.0, 54.0, 46.0, 43.0, 53.0, 52.0, 54.0, 46.0, 37.0, 34.0, 51.0, 38.0, 35.0, 26.0, 23.0, 25.0, 23.0, 22.0, 12.0, 14.0, 10.0, 12.0, 8.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.119431495666504, -9.839310646057129, -9.559189796447754, -9.279069900512695, -8.99894905090332, -8.718828201293945, -8.43870735168457, -8.158586502075195, -7.87846565246582, -7.598344802856445, -7.3182244300842285, -7.0381035804748535, -6.7579827308654785, -6.477862358093262, -6.197741508483887, -5.917620658874512, -5.637500286102295, -5.35737943649292, -5.077259063720703, -4.797138214111328, -4.517017364501953, -4.236896514892578, -3.9567761421203613, -3.6766552925109863, -3.3965346813201904, -3.1164140701293945, -2.8362932205200195, -2.5561726093292236, -2.2760519981384277, -1.9959311485290527, -1.7158105373382568, -1.4356898069381714, -1.1555685997009277, -0.8754478693008423, -0.5953271985054016, -0.31520652770996094, -0.03508579730987549, 0.24503493309020996, 0.5251555442810059, 0.8052762746810913, 1.0853970050811768, 1.3655177354812622, 1.6456384658813477, 1.9257590770721436, 2.2058796882629395, 2.4860005378723145, 2.7661211490631104, 3.0462417602539062, 3.3263626098632812, 3.606483221054077, 3.886604070663452, 4.166724681854248, 4.446845531463623, 4.72696590423584, 5.007086753845215, 5.28720760345459, 5.567328453063965, 5.84744930267334, 6.127569675445557, 6.407690525054932, 6.687811374664307, 6.967931747436523, 7.248052597045898, 7.528173446655273, 7.80829381942749]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 9.0, 9.0, 7.0, 32.0, 24.0, 34.0, 57.0, 79.0, 122.0, 195.0, 334.0, 601.0, 1400.0, 3229.0, 10335.0, 43885.0, 264170.0, 1637340.0, 1829886.0, 330362.0, 53606.0, 11979.0, 3581.0, 1346.0, 621.0, 345.0, 246.0, 153.0, 91.0, 75.0, 35.0, 34.0, 18.0, 15.0, 10.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.822265625, -3.7030029296875, -3.583740234375, -3.4644775390625, -3.34521484375, -3.2259521484375, -3.106689453125, -2.9874267578125, -2.8681640625, -2.7489013671875, -2.629638671875, -2.5103759765625, -2.39111328125, -2.2718505859375, -2.152587890625, -2.0333251953125, -1.9140625, -1.7947998046875, -1.675537109375, -1.5562744140625, -1.43701171875, -1.3177490234375, -1.198486328125, -1.0792236328125, -0.9599609375, -0.8406982421875, -0.721435546875, -0.6021728515625, -0.48291015625, -0.3636474609375, -0.244384765625, -0.1251220703125, -0.005859375, 0.1134033203125, 0.232666015625, 0.3519287109375, 0.47119140625, 0.5904541015625, 0.709716796875, 0.8289794921875, 0.9482421875, 1.0675048828125, 1.186767578125, 1.3060302734375, 1.42529296875, 1.5445556640625, 1.663818359375, 1.7830810546875, 1.90234375, 2.0216064453125, 2.140869140625, 2.2601318359375, 2.37939453125, 2.4986572265625, 2.617919921875, 2.7371826171875, 2.8564453125, 2.9757080078125, 3.094970703125, 3.2142333984375, 3.33349609375, 3.4527587890625, 3.572021484375, 3.6912841796875, 3.810546875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 6.0, 12.0, 10.0, 7.0, 4.0, 14.0, 23.0, 14.0, 31.0, 37.0, 33.0, 38.0, 35.0, 36.0, 39.0, 42.0, 45.0, 48.0, 59.0, 43.0, 49.0, 38.0, 50.0, 41.0, 37.0, 34.0, 27.0, 17.0, 24.0, 25.0, 14.0, 11.0, 16.0, 8.0, 8.0, 12.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.060546875, -2.975982666015625, -2.89141845703125, -2.806854248046875, -2.7222900390625, -2.637725830078125, -2.55316162109375, -2.468597412109375, -2.384033203125, -2.299468994140625, -2.21490478515625, -2.130340576171875, -2.0457763671875, -1.961212158203125, -1.87664794921875, -1.792083740234375, -1.70751953125, -1.622955322265625, -1.53839111328125, -1.453826904296875, -1.3692626953125, -1.284698486328125, -1.20013427734375, -1.115570068359375, -1.031005859375, -0.946441650390625, -0.86187744140625, -0.777313232421875, -0.6927490234375, -0.608184814453125, -0.52362060546875, -0.439056396484375, -0.3544921875, -0.269927978515625, -0.18536376953125, -0.100799560546875, -0.0162353515625, 0.068328857421875, 0.15289306640625, 0.237457275390625, 0.322021484375, 0.406585693359375, 0.49114990234375, 0.575714111328125, 0.6602783203125, 0.744842529296875, 0.82940673828125, 0.913970947265625, 0.99853515625, 1.083099365234375, 1.16766357421875, 1.252227783203125, 1.3367919921875, 1.421356201171875, 1.50592041015625, 1.590484619140625, 1.675048828125, 1.759613037109375, 1.84417724609375, 1.928741455078125, 2.0133056640625, 2.097869873046875, 2.18243408203125, 2.266998291015625, 2.3515625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 14.0, 15.0, 30.0, 63.0, 167.0, 438.0, 2030.0, 78376.0, 4092602.0, 18708.0, 1262.0, 327.0, 104.0, 48.0, 30.0, 21.0, 17.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.890625, -12.361572265625, -11.83251953125, -11.303466796875, -10.7744140625, -10.245361328125, -9.71630859375, -9.187255859375, -8.658203125, -8.129150390625, -7.60009765625, -7.071044921875, -6.5419921875, -6.012939453125, -5.48388671875, -4.954833984375, -4.42578125, -3.896728515625, -3.36767578125, -2.838623046875, -2.3095703125, -1.780517578125, -1.25146484375, -0.722412109375, -0.193359375, 0.335693359375, 0.86474609375, 1.393798828125, 1.9228515625, 2.451904296875, 2.98095703125, 3.510009765625, 4.0390625, 4.568115234375, 5.09716796875, 5.626220703125, 6.1552734375, 6.684326171875, 7.21337890625, 7.742431640625, 8.271484375, 8.800537109375, 9.32958984375, 9.858642578125, 10.3876953125, 10.916748046875, 11.44580078125, 11.974853515625, 12.50390625, 13.032958984375, 13.56201171875, 14.091064453125, 14.6201171875, 15.149169921875, 15.67822265625, 16.207275390625, 16.736328125, 17.265380859375, 17.79443359375, 18.323486328125, 18.8525390625, 19.381591796875, 19.91064453125, 20.439697265625, 20.96875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 6.0, 12.0, 14.0, 33.0, 30.0, 44.0, 100.0, 126.0, 235.0, 343.0, 480.0, 627.0, 617.0, 471.0, 332.0, 215.0, 130.0, 78.0, 46.0, 33.0, 19.0, 17.0, 12.0, 13.0, 7.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.009765625, -1.956878662109375, -1.90399169921875, -1.851104736328125, -1.7982177734375, -1.745330810546875, -1.69244384765625, -1.639556884765625, -1.586669921875, -1.533782958984375, -1.48089599609375, -1.428009033203125, -1.3751220703125, -1.322235107421875, -1.26934814453125, -1.216461181640625, -1.16357421875, -1.110687255859375, -1.05780029296875, -1.004913330078125, -0.9520263671875, -0.899139404296875, -0.84625244140625, -0.793365478515625, -0.740478515625, -0.687591552734375, -0.63470458984375, -0.581817626953125, -0.5289306640625, -0.476043701171875, -0.42315673828125, -0.370269775390625, -0.3173828125, -0.264495849609375, -0.21160888671875, -0.158721923828125, -0.1058349609375, -0.052947998046875, -6.103515625e-05, 0.052825927734375, 0.105712890625, 0.158599853515625, 0.21148681640625, 0.264373779296875, 0.3172607421875, 0.370147705078125, 0.42303466796875, 0.475921630859375, 0.52880859375, 0.581695556640625, 0.63458251953125, 0.687469482421875, 0.7403564453125, 0.793243408203125, 0.84613037109375, 0.899017333984375, 0.951904296875, 1.004791259765625, 1.05767822265625, 1.110565185546875, 1.1634521484375, 1.216339111328125, 1.26922607421875, 1.322113037109375, 1.375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 16.0, 7.0, 18.0, 18.0, 22.0, 23.0, 37.0, 51.0, 60.0, 56.0, 56.0, 80.0, 48.0, 63.0, 55.0, 72.0, 56.0, 55.0, 48.0, 33.0, 29.0, 23.0, 21.0, 17.0, 15.0, 11.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.885334014892578, -2.769831418991089, -2.6543288230895996, -2.5388262271881104, -2.423323631286621, -2.307821035385132, -2.1923184394836426, -2.0768158435821533, -1.961313247680664, -1.8458106517791748, -1.7303080558776855, -1.6148054599761963, -1.499302864074707, -1.3838002681732178, -1.2682976722717285, -1.1527950763702393, -1.0372925996780396, -0.9217900037765503, -0.806287407875061, -0.6907848119735718, -0.5752822160720825, -0.45977967977523804, -0.3442770838737488, -0.22877448797225952, -0.11327189207077026, 0.002230696380138397, 0.11773328483104706, 0.23323586583137512, 0.3487384617328644, 0.46424102783203125, 0.5797436237335205, 0.6952462196350098, 0.810748815536499, 0.9262514114379883, 1.0417540073394775, 1.1572566032409668, 1.272759199142456, 1.3882617950439453, 1.5037643909454346, 1.6192669868469238, 1.734769582748413, 1.8502721786499023, 1.9657747745513916, 2.081277370452881, 2.19677996635437, 2.3122825622558594, 2.4277851581573486, 2.543287754058838, 2.658790111541748, 2.7742927074432373, 2.8897953033447266, 3.005297899246216, 3.120800495147705, 3.2363030910491943, 3.3518056869506836, 3.467308282852173, 3.582810878753662, 3.6983134746551514, 3.8138160705566406, 3.92931866645813, 4.044821262359619, 4.160323619842529, 4.275826454162598, 4.391328811645508, 4.506831645965576]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 2.0, 8.0, 6.0, 12.0, 7.0, 10.0, 11.0, 27.0, 28.0, 20.0, 30.0, 35.0, 32.0, 26.0, 26.0, 29.0, 44.0, 31.0, 31.0, 46.0, 49.0, 52.0, 32.0, 35.0, 48.0, 45.0, 32.0, 24.0, 28.0, 33.0, 20.0, 19.0, 21.0, 19.0, 18.0, 12.0, 10.0, 8.0, 4.0, 6.0, 5.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.797264814376831, -2.7073681354522705, -2.617471218109131, -2.5275745391845703, -2.4376778602600098, -2.347781181335449, -2.2578842639923096, -2.167987585067749, -2.0780909061431885, -1.9881941080093384, -1.8982974290847778, -1.8084006309509277, -1.7185039520263672, -1.628607153892517, -1.538710355758667, -1.4488136768341064, -1.3589168787002563, -1.2690200805664062, -1.1791234016418457, -1.0892266035079956, -0.9993299245834351, -0.909433126449585, -0.8195363879203796, -0.7296396493911743, -0.639742910861969, -0.5498461723327637, -0.45994943380355835, -0.37005266547203064, -0.2801559269428253, -0.19025918841362, -0.10036242008209229, -0.010465681552886963, 0.07943105697631836, 0.16932779550552368, 0.259224534034729, 0.3491213023662567, 0.43901804089546204, 0.5289148092269897, 0.6188115477561951, 0.7087082862854004, 0.7986050248146057, 0.888501763343811, 0.9783985018730164, 1.0682952404022217, 1.1581920385360718, 1.2480887174606323, 1.3379855155944824, 1.427882194519043, 1.517778992652893, 1.6076757907867432, 1.6975724697113037, 1.7874692678451538, 1.8773659467697144, 1.9672627449035645, 2.057159423828125, 2.1470561027526855, 2.236953020095825, 2.3268496990203857, 2.4167466163635254, 2.506643295288086, 2.5965399742126465, 2.686436653137207, 2.7763335704803467, 2.8662302494049072, 2.9561269283294678]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 1.0, 7.0, 11.0, 17.0, 25.0, 30.0, 43.0, 65.0, 110.0, 177.0, 311.0, 585.0, 1211.0, 3285.0, 11150.0, 62418.0, 481101.0, 420489.0, 52173.0, 9887.0, 2964.0, 1185.0, 553.0, 281.0, 155.0, 113.0, 72.0, 46.0, 27.0, 20.0, 12.0, 17.0, 4.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.1058197021484375, -1.075897216796875, -1.0459747314453125, -1.01605224609375, -0.9861297607421875, -0.956207275390625, -0.9262847900390625, -0.8963623046875, -0.8664398193359375, -0.836517333984375, -0.8065948486328125, -0.77667236328125, -0.7467498779296875, -0.716827392578125, -0.6869049072265625, -0.656982421875, -0.6270599365234375, -0.597137451171875, -0.5672149658203125, -0.53729248046875, -0.5073699951171875, -0.477447509765625, -0.4475250244140625, -0.4176025390625, -0.3876800537109375, -0.357757568359375, -0.3278350830078125, -0.29791259765625, -0.2679901123046875, -0.238067626953125, -0.2081451416015625, -0.17822265625, -0.1483001708984375, -0.118377685546875, -0.0884552001953125, -0.05853271484375, -0.0286102294921875, 0.001312255859375, 0.0312347412109375, 0.0611572265625, 0.0910797119140625, 0.121002197265625, 0.1509246826171875, 0.18084716796875, 0.2107696533203125, 0.240692138671875, 0.2706146240234375, 0.300537109375, 0.3304595947265625, 0.360382080078125, 0.3903045654296875, 0.42022705078125, 0.4501495361328125, 0.480072021484375, 0.5099945068359375, 0.5399169921875, 0.5698394775390625, 0.599761962890625, 0.6296844482421875, 0.65960693359375, 0.6895294189453125, 0.719451904296875, 0.7493743896484375, 0.779296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 11.0, 13.0, 21.0, 25.0, 25.0, 38.0, 33.0, 53.0, 42.0, 42.0, 45.0, 54.0, 67.0, 48.0, 67.0, 54.0, 47.0, 46.0, 46.0, 32.0, 29.0, 27.0, 27.0, 19.0, 20.0, 17.0, 9.0, 8.0, 7.0, 2.0, 4.0, 4.0, 3.0], "bins": [-3.2734375, -3.19915771484375, -3.1248779296875, -3.05059814453125, -2.976318359375, -2.90203857421875, -2.8277587890625, -2.75347900390625, -2.67919921875, -2.60491943359375, -2.5306396484375, -2.45635986328125, -2.382080078125, -2.30780029296875, -2.2335205078125, -2.15924072265625, -2.0849609375, -2.01068115234375, -1.9364013671875, -1.86212158203125, -1.787841796875, -1.71356201171875, -1.6392822265625, -1.56500244140625, -1.49072265625, -1.41644287109375, -1.3421630859375, -1.26788330078125, -1.193603515625, -1.11932373046875, -1.0450439453125, -0.97076416015625, -0.896484375, -0.82220458984375, -0.7479248046875, -0.67364501953125, -0.599365234375, -0.52508544921875, -0.4508056640625, -0.37652587890625, -0.30224609375, -0.22796630859375, -0.1536865234375, -0.07940673828125, -0.005126953125, 0.06915283203125, 0.1434326171875, 0.21771240234375, 0.2919921875, 0.36627197265625, 0.4405517578125, 0.51483154296875, 0.589111328125, 0.66339111328125, 0.7376708984375, 0.81195068359375, 0.88623046875, 0.96051025390625, 1.0347900390625, 1.10906982421875, 1.183349609375, 1.25762939453125, 1.3319091796875, 1.40618896484375, 1.48046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 11.0, 9.0, 23.0, 23.0, 49.0, 77.0, 139.0, 323.0, 729.0, 1348.0, 3206.0, 7203.0, 16597.0, 38677.0, 89203.0, 191784.0, 293611.0, 218346.0, 104987.0, 45727.0, 20072.0, 8796.0, 3971.0, 1778.0, 889.0, 408.0, 235.0, 122.0, 64.0, 39.0, 24.0, 11.0, 15.0, 10.0, 9.0, 6.0, 4.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2347412109375, -0.2265338897705078, -0.21832656860351562, -0.21011924743652344, -0.20191192626953125, -0.19370460510253906, -0.18549728393554688, -0.1772899627685547, -0.1690826416015625, -0.1608753204345703, -0.15266799926757812, -0.14446067810058594, -0.13625335693359375, -0.12804603576660156, -0.11983871459960938, -0.11163139343261719, -0.103424072265625, -0.09521675109863281, -0.08700942993164062, -0.07880210876464844, -0.07059478759765625, -0.06238746643066406, -0.054180145263671875, -0.04597282409667969, -0.0377655029296875, -0.029558181762695312, -0.021350860595703125, -0.013143539428710938, -0.00493621826171875, 0.0032711029052734375, 0.011478424072265625, 0.019685745239257812, 0.02789306640625, 0.03610038757324219, 0.044307708740234375, 0.05251502990722656, 0.06072235107421875, 0.06892967224121094, 0.07713699340820312, 0.08534431457519531, 0.0935516357421875, 0.10175895690917969, 0.10996627807617188, 0.11817359924316406, 0.12638092041015625, 0.13458824157714844, 0.14279556274414062, 0.1510028839111328, 0.159210205078125, 0.1674175262451172, 0.17562484741210938, 0.18383216857910156, 0.19203948974609375, 0.20024681091308594, 0.20845413208007812, 0.2166614532470703, 0.2248687744140625, 0.2330760955810547, 0.24128341674804688, 0.24949073791503906, 0.25769805908203125, 0.26590538024902344, 0.2741127014160156, 0.2823200225830078, 0.29052734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 4.0, 0.0, 1.0, 7.0, 6.0, 8.0, 12.0, 8.0, 10.0, 9.0, 25.0, 17.0, 27.0, 25.0, 13.0, 39.0, 34.0, 46.0, 30.0, 41.0, 53.0, 50.0, 53.0, 59.0, 50.0, 49.0, 34.0, 44.0, 27.0, 20.0, 31.0, 16.0, 18.0, 16.0, 18.0, 11.0, 14.0, 16.0, 10.0, 8.0, 10.0, 5.0, 3.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.599609375, -3.476837158203125, -3.35406494140625, -3.231292724609375, -3.1085205078125, -2.985748291015625, -2.86297607421875, -2.740203857421875, -2.617431640625, -2.494659423828125, -2.37188720703125, -2.249114990234375, -2.1263427734375, -2.003570556640625, -1.88079833984375, -1.758026123046875, -1.63525390625, -1.512481689453125, -1.38970947265625, -1.266937255859375, -1.1441650390625, -1.021392822265625, -0.89862060546875, -0.775848388671875, -0.653076171875, -0.530303955078125, -0.40753173828125, -0.284759521484375, -0.1619873046875, -0.039215087890625, 0.08355712890625, 0.206329345703125, 0.3291015625, 0.451873779296875, 0.57464599609375, 0.697418212890625, 0.8201904296875, 0.942962646484375, 1.06573486328125, 1.188507080078125, 1.311279296875, 1.434051513671875, 1.55682373046875, 1.679595947265625, 1.8023681640625, 1.925140380859375, 2.04791259765625, 2.170684814453125, 2.29345703125, 2.416229248046875, 2.53900146484375, 2.661773681640625, 2.7845458984375, 2.907318115234375, 3.03009033203125, 3.152862548828125, 3.275634765625, 3.398406982421875, 3.52117919921875, 3.643951416015625, 3.7667236328125, 3.889495849609375, 4.01226806640625, 4.135040283203125, 4.2578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 5.0, 13.0, 16.0, 24.0, 20.0, 52.0, 70.0, 91.0, 153.0, 218.0, 331.0, 524.0, 904.0, 1547.0, 3261.0, 7438.0, 19437.0, 64078.0, 251919.0, 470479.0, 160842.0, 41784.0, 13903.0, 5466.0, 2498.0, 1306.0, 780.0, 486.0, 280.0, 196.0, 134.0, 89.0, 51.0, 59.0, 36.0, 16.0, 16.0, 8.0, 12.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05615234375, -0.05441570281982422, -0.05267906188964844, -0.050942420959472656, -0.049205780029296875, -0.047469139099121094, -0.04573249816894531, -0.04399585723876953, -0.04225921630859375, -0.04052257537841797, -0.03878593444824219, -0.037049293518066406, -0.035312652587890625, -0.033576011657714844, -0.03183937072753906, -0.03010272979736328, -0.0283660888671875, -0.02662944793701172, -0.024892807006835938, -0.023156166076660156, -0.021419525146484375, -0.019682884216308594, -0.017946243286132812, -0.01620960235595703, -0.01447296142578125, -0.012736320495605469, -0.010999679565429688, -0.009263038635253906, -0.007526397705078125, -0.005789756774902344, -0.0040531158447265625, -0.0023164749145507812, -0.000579833984375, 0.0011568069458007812, 0.0028934478759765625, 0.004630088806152344, 0.006366729736328125, 0.008103370666503906, 0.009840011596679688, 0.011576652526855469, 0.01331329345703125, 0.015049934387207031, 0.016786575317382812, 0.018523216247558594, 0.020259857177734375, 0.021996498107910156, 0.023733139038085938, 0.02546977996826172, 0.0272064208984375, 0.02894306182861328, 0.030679702758789062, 0.032416343688964844, 0.034152984619140625, 0.035889625549316406, 0.03762626647949219, 0.03936290740966797, 0.04109954833984375, 0.04283618927001953, 0.04457283020019531, 0.046309471130371094, 0.048046112060546875, 0.049782752990722656, 0.05151939392089844, 0.05325603485107422, 0.05499267578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 10.0, 8.0, 13.0, 16.0, 25.0, 27.0, 37.0, 41.0, 65.0, 72.0, 86.0, 106.0, 92.0, 72.0, 82.0, 51.0, 56.0, 28.0, 27.0, 31.0, 12.0, 8.0, 14.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4226646423339844e-05, -4.296936094760895e-05, -4.171207547187805e-05, -4.0454789996147156e-05, -3.919750452041626e-05, -3.7940219044685364e-05, -3.668293356895447e-05, -3.542564809322357e-05, -3.4168362617492676e-05, -3.291107714176178e-05, -3.1653791666030884e-05, -3.0396506190299988e-05, -2.9139220714569092e-05, -2.7881935238838196e-05, -2.66246497631073e-05, -2.5367364287376404e-05, -2.4110078811645508e-05, -2.2852793335914612e-05, -2.1595507860183716e-05, -2.033822238445282e-05, -1.9080936908721924e-05, -1.7823651432991028e-05, -1.6566365957260132e-05, -1.5309080481529236e-05, -1.405179500579834e-05, -1.2794509530067444e-05, -1.1537224054336548e-05, -1.0279938578605652e-05, -9.022653102874756e-06, -7.76536762714386e-06, -6.508082151412964e-06, -5.250796675682068e-06, -3.993511199951172e-06, -2.736225724220276e-06, -1.4789402484893799e-06, -2.2165477275848389e-07, 1.0356307029724121e-06, 2.292916178703308e-06, 3.550201654434204e-06, 4.8074871301651e-06, 6.064772605895996e-06, 7.322058081626892e-06, 8.579343557357788e-06, 9.836629033088684e-06, 1.109391450881958e-05, 1.2351199984550476e-05, 1.3608485460281372e-05, 1.4865770936012268e-05, 1.6123056411743164e-05, 1.738034188747406e-05, 1.8637627363204956e-05, 1.9894912838935852e-05, 2.1152198314666748e-05, 2.2409483790397644e-05, 2.366676926612854e-05, 2.4924054741859436e-05, 2.6181340217590332e-05, 2.7438625693321228e-05, 2.8695911169052124e-05, 2.995319664478302e-05, 3.1210482120513916e-05, 3.246776759624481e-05, 3.372505307197571e-05, 3.4982338547706604e-05, 3.62396240234375e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 10.0, 14.0, 16.0, 20.0, 25.0, 34.0, 63.0, 69.0, 140.0, 170.0, 291.0, 512.0, 922.0, 1787.0, 3678.0, 8834.0, 27183.0, 135481.0, 640895.0, 177511.0, 32274.0, 10164.0, 4045.0, 1982.0, 965.0, 533.0, 332.0, 197.0, 124.0, 76.0, 60.0, 43.0, 26.0, 14.0, 19.0, 14.0, 7.0, 4.0, 6.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0797119140625, -0.07701587677001953, -0.07431983947753906, -0.0716238021850586, -0.06892776489257812, -0.06623172760009766, -0.06353569030761719, -0.06083965301513672, -0.05814361572265625, -0.05544757843017578, -0.05275154113769531, -0.050055503845214844, -0.047359466552734375, -0.044663429260253906, -0.04196739196777344, -0.03927135467529297, -0.0365753173828125, -0.03387928009033203, -0.031183242797851562, -0.028487205505371094, -0.025791168212890625, -0.023095130920410156, -0.020399093627929688, -0.01770305633544922, -0.01500701904296875, -0.012310981750488281, -0.009614944458007812, -0.006918907165527344, -0.004222869873046875, -0.0015268325805664062, 0.0011692047119140625, 0.0038652420043945312, 0.006561279296875, 0.009257316589355469, 0.011953353881835938, 0.014649391174316406, 0.017345428466796875, 0.020041465759277344, 0.022737503051757812, 0.02543354034423828, 0.02812957763671875, 0.03082561492919922, 0.03352165222167969, 0.036217689514160156, 0.038913726806640625, 0.041609764099121094, 0.04430580139160156, 0.04700183868408203, 0.0496978759765625, 0.05239391326904297, 0.05508995056152344, 0.057785987854003906, 0.060482025146484375, 0.06317806243896484, 0.06587409973144531, 0.06857013702392578, 0.07126617431640625, 0.07396221160888672, 0.07665824890136719, 0.07935428619384766, 0.08205032348632812, 0.0847463607788086, 0.08744239807128906, 0.09013843536376953, 0.09283447265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 2.0, 9.0, 4.0, 16.0, 17.0, 16.0, 16.0, 22.0, 26.0, 36.0, 41.0, 73.0, 93.0, 99.0, 102.0, 99.0, 72.0, 54.0, 42.0, 28.0, 23.0, 19.0, 14.0, 16.0, 12.0, 7.0, 10.0, 8.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014923095703125, -0.014391422271728516, -0.013859748840332031, -0.013328075408935547, -0.012796401977539062, -0.012264728546142578, -0.011733055114746094, -0.01120138168334961, -0.010669708251953125, -0.01013803482055664, -0.009606361389160156, -0.009074687957763672, -0.008543014526367188, -0.008011341094970703, -0.007479667663574219, -0.006947994232177734, -0.00641632080078125, -0.005884647369384766, -0.005352973937988281, -0.004821300506591797, -0.0042896270751953125, -0.003757953643798828, -0.0032262802124023438, -0.0026946067810058594, -0.002162933349609375, -0.0016312599182128906, -0.0010995864868164062, -0.0005679130554199219, -3.62396240234375e-05, 0.0004954338073730469, 0.0010271072387695312, 0.0015587806701660156, 0.0020904541015625, 0.0026221275329589844, 0.0031538009643554688, 0.003685474395751953, 0.0042171478271484375, 0.004748821258544922, 0.005280494689941406, 0.005812168121337891, 0.006343841552734375, 0.006875514984130859, 0.007407188415527344, 0.007938861846923828, 0.008470535278320312, 0.009002208709716797, 0.009533882141113281, 0.010065555572509766, 0.01059722900390625, 0.011128902435302734, 0.011660575866699219, 0.012192249298095703, 0.012723922729492188, 0.013255596160888672, 0.013787269592285156, 0.01431894302368164, 0.014850616455078125, 0.01538228988647461, 0.015913963317871094, 0.016445636749267578, 0.016977310180664062, 0.017508983612060547, 0.01804065704345703, 0.018572330474853516, 0.01910400390625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 8.0, 12.0, 19.0, 22.0, 23.0, 26.0, 43.0, 67.0, 49.0, 63.0, 71.0, 58.0, 71.0, 60.0, 61.0, 51.0, 59.0, 70.0, 34.0, 29.0, 25.0, 20.0, 17.0, 9.0, 10.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.701707363128662, -1.6349502801895142, -1.5681931972503662, -1.5014361143112183, -1.4346790313720703, -1.3679219484329224, -1.3011648654937744, -1.2344077825546265, -1.1676506996154785, -1.1008936166763306, -1.0341365337371826, -0.9673794507980347, -0.9006223678588867, -0.8338652849197388, -0.7671082019805908, -0.7003511190414429, -0.6335940361022949, -0.566836953163147, -0.500079870223999, -0.4333227872848511, -0.3665657043457031, -0.2998086214065552, -0.23305153846740723, -0.16629445552825928, -0.09953737258911133, -0.03278028964996338, 0.03397679328918457, 0.10073387622833252, 0.16749095916748047, 0.23424804210662842, 0.30100512504577637, 0.3677622079849243, 0.43451905250549316, 0.5012761354446411, 0.5680332183837891, 0.634790301322937, 0.701547384262085, 0.7683044672012329, 0.8350615501403809, 0.9018186330795288, 0.9685757160186768, 1.0353327989578247, 1.1020898818969727, 1.1688469648361206, 1.2356040477752686, 1.3023611307144165, 1.3691182136535645, 1.4358752965927124, 1.5026323795318604, 1.5693894624710083, 1.6361465454101562, 1.7029036283493042, 1.7696607112884521, 1.8364177942276, 1.903174877166748, 1.969931960105896, 2.036689043045044, 2.1034460067749023, 2.17020320892334, 2.2369604110717773, 2.3037173748016357, 2.370474338531494, 2.4372315406799316, 2.503988742828369, 2.5707457065582275]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 12.0, 10.0, 9.0, 13.0, 18.0, 34.0, 26.0, 37.0, 43.0, 42.0, 27.0, 37.0, 52.0, 43.0, 36.0, 63.0, 63.0, 41.0, 46.0, 61.0, 37.0, 34.0, 32.0, 28.0, 31.0, 25.0, 19.0, 22.0, 10.0, 10.0, 6.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2764792442321777, -2.2122318744659424, -2.147984504699707, -2.0837371349334717, -2.0194897651672363, -1.955242395401001, -1.8909951448440552, -1.8267477750778198, -1.7625004053115845, -1.6982530355453491, -1.6340056657791138, -1.5697582960128784, -1.5055110454559326, -1.4412636756896973, -1.377016305923462, -1.3127689361572266, -1.2485215663909912, -1.1842741966247559, -1.1200268268585205, -1.0557794570922852, -0.9915321469306946, -0.9272847771644592, -0.8630374670028687, -0.7987900972366333, -0.734542727470398, -0.6702953577041626, -0.6060479879379272, -0.5418006777763367, -0.4775533080101013, -0.41330593824386597, -0.349058598279953, -0.28481125831604004, -0.22056400775909424, -0.15631665289402008, -0.09206929802894592, -0.027821943163871765, 0.03642541170120239, 0.10067278146743774, 0.1649201214313507, 0.22916746139526367, 0.293414831161499, 0.3576622009277344, 0.42190954089164734, 0.4861568808555603, 0.5504042506217957, 0.614651620388031, 0.6788989305496216, 0.7431463003158569, 0.8073936700820923, 0.8716410398483276, 0.935888409614563, 1.0001357793807983, 1.0643830299377441, 1.1286303997039795, 1.1928777694702148, 1.2571251392364502, 1.3213725090026855, 1.385619878768921, 1.4498672485351562, 1.5141146183013916, 1.578361988067627, 1.6426093578338623, 1.706856608390808, 1.7711039781570435, 1.8353513479232788]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 7.0, 10.0, 12.0, 24.0, 25.0, 49.0, 52.0, 75.0, 118.0, 143.0, 263.0, 360.0, 683.0, 1189.0, 2346.0, 4772.0, 10085.0, 21725.0, 45270.0, 94712.0, 191025.0, 293911.0, 195298.0, 96951.0, 46772.0, 21947.0, 10464.0, 4869.0, 2306.0, 1252.0, 636.0, 369.0, 276.0, 168.0, 124.0, 70.0, 55.0, 35.0, 29.0, 25.0, 14.0, 9.0, 5.0, 6.0, 10.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.787109375, -1.7265625, -1.666015625, -1.60546875, -1.544921875, -1.484375, -1.423828125, -1.36328125, -1.302734375, -1.2421875, -1.181640625, -1.12109375, -1.060546875, -1.0, -0.939453125, -0.87890625, -0.818359375, -0.7578125, -0.697265625, -0.63671875, -0.576171875, -0.515625, -0.455078125, -0.39453125, -0.333984375, -0.2734375, -0.212890625, -0.15234375, -0.091796875, -0.03125, 0.029296875, 0.08984375, 0.150390625, 0.2109375, 0.271484375, 0.33203125, 0.392578125, 0.453125, 0.513671875, 0.57421875, 0.634765625, 0.6953125, 0.755859375, 0.81640625, 0.876953125, 0.9375, 0.998046875, 1.05859375, 1.119140625, 1.1796875, 1.240234375, 1.30078125, 1.361328125, 1.421875, 1.482421875, 1.54296875, 1.603515625, 1.6640625, 1.724609375, 1.78515625, 1.845703125, 1.90625, 1.966796875, 2.02734375, 2.087890625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 1.0, 8.0, 12.0, 12.0, 13.0, 13.0, 19.0, 22.0, 23.0, 24.0, 33.0, 33.0, 43.0, 29.0, 37.0, 47.0, 39.0, 50.0, 35.0, 43.0, 49.0, 30.0, 36.0, 40.0, 43.0, 43.0, 29.0, 28.0, 23.0, 31.0, 21.0, 18.0, 7.0, 9.0, 8.0, 12.0, 6.0, 8.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.501953125, -3.39471435546875, -3.2874755859375, -3.18023681640625, -3.072998046875, -2.96575927734375, -2.8585205078125, -2.75128173828125, -2.64404296875, -2.53680419921875, -2.4295654296875, -2.32232666015625, -2.215087890625, -2.10784912109375, -2.0006103515625, -1.89337158203125, -1.7861328125, -1.67889404296875, -1.5716552734375, -1.46441650390625, -1.357177734375, -1.24993896484375, -1.1427001953125, -1.03546142578125, -0.92822265625, -0.82098388671875, -0.7137451171875, -0.60650634765625, -0.499267578125, -0.39202880859375, -0.2847900390625, -0.17755126953125, -0.0703125, 0.03692626953125, 0.1441650390625, 0.25140380859375, 0.358642578125, 0.46588134765625, 0.5731201171875, 0.68035888671875, 0.78759765625, 0.89483642578125, 1.0020751953125, 1.10931396484375, 1.216552734375, 1.32379150390625, 1.4310302734375, 1.53826904296875, 1.6455078125, 1.75274658203125, 1.8599853515625, 1.96722412109375, 2.074462890625, 2.18170166015625, 2.2889404296875, 2.39617919921875, 2.50341796875, 2.61065673828125, 2.7178955078125, 2.82513427734375, 2.932373046875, 3.03961181640625, 3.1468505859375, 3.25408935546875, 3.361328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 8.0, 5.0, 12.0, 10.0, 13.0, 21.0, 25.0, 37.0, 43.0, 56.0, 72.0, 108.0, 151.0, 272.0, 462.0, 1100.0, 4462.0, 26549.0, 171740.0, 613166.0, 193225.0, 29465.0, 5074.0, 1164.0, 442.0, 243.0, 165.0, 119.0, 88.0, 54.0, 37.0, 32.0, 36.0, 18.0, 17.0, 10.0, 12.0, 12.0, 5.0, 2.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.91796875, -4.77130126953125, -4.6246337890625, -4.47796630859375, -4.331298828125, -4.18463134765625, -4.0379638671875, -3.89129638671875, -3.74462890625, -3.59796142578125, -3.4512939453125, -3.30462646484375, -3.157958984375, -3.01129150390625, -2.8646240234375, -2.71795654296875, -2.5712890625, -2.42462158203125, -2.2779541015625, -2.13128662109375, -1.984619140625, -1.83795166015625, -1.6912841796875, -1.54461669921875, -1.39794921875, -1.25128173828125, -1.1046142578125, -0.95794677734375, -0.811279296875, -0.66461181640625, -0.5179443359375, -0.37127685546875, -0.224609375, -0.07794189453125, 0.0687255859375, 0.21539306640625, 0.362060546875, 0.50872802734375, 0.6553955078125, 0.80206298828125, 0.94873046875, 1.09539794921875, 1.2420654296875, 1.38873291015625, 1.535400390625, 1.68206787109375, 1.8287353515625, 1.97540283203125, 2.1220703125, 2.26873779296875, 2.4154052734375, 2.56207275390625, 2.708740234375, 2.85540771484375, 3.0020751953125, 3.14874267578125, 3.29541015625, 3.44207763671875, 3.5887451171875, 3.73541259765625, 3.882080078125, 4.02874755859375, 4.1754150390625, 4.32208251953125, 4.46875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 6.0, 7.0, 8.0, 7.0, 20.0, 19.0, 20.0, 17.0, 22.0, 37.0, 41.0, 49.0, 57.0, 65.0, 50.0, 76.0, 60.0, 55.0, 60.0, 51.0, 61.0, 39.0, 27.0, 27.0, 21.0, 16.0, 12.0, 9.0, 17.0, 6.0, 6.0, 8.0, 3.0, 3.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9921875, -4.834228515625, -4.67626953125, -4.518310546875, -4.3603515625, -4.202392578125, -4.04443359375, -3.886474609375, -3.728515625, -3.570556640625, -3.41259765625, -3.254638671875, -3.0966796875, -2.938720703125, -2.78076171875, -2.622802734375, -2.46484375, -2.306884765625, -2.14892578125, -1.990966796875, -1.8330078125, -1.675048828125, -1.51708984375, -1.359130859375, -1.201171875, -1.043212890625, -0.88525390625, -0.727294921875, -0.5693359375, -0.411376953125, -0.25341796875, -0.095458984375, 0.0625, 0.220458984375, 0.37841796875, 0.536376953125, 0.6943359375, 0.852294921875, 1.01025390625, 1.168212890625, 1.326171875, 1.484130859375, 1.64208984375, 1.800048828125, 1.9580078125, 2.115966796875, 2.27392578125, 2.431884765625, 2.58984375, 2.747802734375, 2.90576171875, 3.063720703125, 3.2216796875, 3.379638671875, 3.53759765625, 3.695556640625, 3.853515625, 4.011474609375, 4.16943359375, 4.327392578125, 4.4853515625, 4.643310546875, 4.80126953125, 4.959228515625, 5.1171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 5.0, 12.0, 15.0, 25.0, 36.0, 62.0, 104.0, 207.0, 516.0, 1637.0, 8586.0, 91655.0, 746567.0, 180825.0, 14659.0, 2356.0, 680.0, 267.0, 128.0, 62.0, 38.0, 23.0, 23.0, 17.0, 9.0, 6.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.7021484375, -1.646575927734375, -1.59100341796875, -1.535430908203125, -1.4798583984375, -1.424285888671875, -1.36871337890625, -1.313140869140625, -1.257568359375, -1.201995849609375, -1.14642333984375, -1.090850830078125, -1.0352783203125, -0.979705810546875, -0.92413330078125, -0.868560791015625, -0.81298828125, -0.757415771484375, -0.70184326171875, -0.646270751953125, -0.5906982421875, -0.535125732421875, -0.47955322265625, -0.423980712890625, -0.368408203125, -0.312835693359375, -0.25726318359375, -0.201690673828125, -0.1461181640625, -0.090545654296875, -0.03497314453125, 0.020599365234375, 0.076171875, 0.131744384765625, 0.18731689453125, 0.242889404296875, 0.2984619140625, 0.354034423828125, 0.40960693359375, 0.465179443359375, 0.520751953125, 0.576324462890625, 0.63189697265625, 0.687469482421875, 0.7430419921875, 0.798614501953125, 0.85418701171875, 0.909759521484375, 0.96533203125, 1.020904541015625, 1.07647705078125, 1.132049560546875, 1.1876220703125, 1.243194580078125, 1.29876708984375, 1.354339599609375, 1.409912109375, 1.465484619140625, 1.52105712890625, 1.576629638671875, 1.6322021484375, 1.687774658203125, 1.74334716796875, 1.798919677734375, 1.8544921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 8.0, 12.0, 14.0, 14.0, 14.0, 19.0, 31.0, 22.0, 47.0, 31.0, 45.0, 52.0, 69.0, 88.0, 100.0, 86.0, 72.0, 49.0, 32.0, 23.0, 24.0, 28.0, 19.0, 20.0, 5.0, 10.0, 13.0, 5.0, 6.0, 8.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00014162063598632812, -0.00013682246208190918, -0.00013202428817749023, -0.0001272261142730713, -0.00012242794036865234, -0.0001176297664642334, -0.00011283159255981445, -0.00010803341865539551, -0.00010323524475097656, -9.843707084655762e-05, -9.363889694213867e-05, -8.884072303771973e-05, -8.404254913330078e-05, -7.924437522888184e-05, -7.444620132446289e-05, -6.964802742004395e-05, -6.4849853515625e-05, -6.0051679611206055e-05, -5.525350570678711e-05, -5.0455331802368164e-05, -4.565715789794922e-05, -4.0858983993530273e-05, -3.606081008911133e-05, -3.126263618469238e-05, -2.6464462280273438e-05, -2.1666288375854492e-05, -1.6868114471435547e-05, -1.2069940567016602e-05, -7.271766662597656e-06, -2.473592758178711e-06, 2.3245811462402344e-06, 7.12275505065918e-06, 1.1920928955078125e-05, 1.671910285949707e-05, 2.1517276763916016e-05, 2.631545066833496e-05, 3.1113624572753906e-05, 3.591179847717285e-05, 4.07099723815918e-05, 4.550814628601074e-05, 5.030632019042969e-05, 5.510449409484863e-05, 5.990266799926758e-05, 6.470084190368652e-05, 6.949901580810547e-05, 7.429718971252441e-05, 7.909536361694336e-05, 8.38935375213623e-05, 8.869171142578125e-05, 9.34898853302002e-05, 9.828805923461914e-05, 0.00010308623313903809, 0.00010788440704345703, 0.00011268258094787598, 0.00011748075485229492, 0.00012227892875671387, 0.0001270771026611328, 0.00013187527656555176, 0.0001366734504699707, 0.00014147162437438965, 0.0001462697982788086, 0.00015106797218322754, 0.00015586614608764648, 0.00016066431999206543, 0.00016546249389648438]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 17.0, 13.0, 17.0, 27.0, 55.0, 100.0, 260.0, 545.0, 1238.0, 3273.0, 15084.0, 192305.0, 739539.0, 83216.0, 8629.0, 2509.0, 914.0, 371.0, 217.0, 78.0, 52.0, 23.0, 24.0, 13.0, 3.0, 5.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.009765625, -1.94354248046875, -1.8773193359375, -1.81109619140625, -1.744873046875, -1.67864990234375, -1.6124267578125, -1.54620361328125, -1.47998046875, -1.41375732421875, -1.3475341796875, -1.28131103515625, -1.215087890625, -1.14886474609375, -1.0826416015625, -1.01641845703125, -0.9501953125, -0.88397216796875, -0.8177490234375, -0.75152587890625, -0.685302734375, -0.61907958984375, -0.5528564453125, -0.48663330078125, -0.42041015625, -0.35418701171875, -0.2879638671875, -0.22174072265625, -0.155517578125, -0.08929443359375, -0.0230712890625, 0.04315185546875, 0.109375, 0.17559814453125, 0.2418212890625, 0.30804443359375, 0.374267578125, 0.44049072265625, 0.5067138671875, 0.57293701171875, 0.63916015625, 0.70538330078125, 0.7716064453125, 0.83782958984375, 0.904052734375, 0.97027587890625, 1.0364990234375, 1.10272216796875, 1.1689453125, 1.23516845703125, 1.3013916015625, 1.36761474609375, 1.433837890625, 1.50006103515625, 1.5662841796875, 1.63250732421875, 1.69873046875, 1.76495361328125, 1.8311767578125, 1.89739990234375, 1.963623046875, 2.02984619140625, 2.0960693359375, 2.16229248046875, 2.228515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 6.0, 10.0, 12.0, 27.0, 33.0, 22.0, 63.0, 79.0, 91.0, 120.0, 120.0, 108.0, 77.0, 62.0, 45.0, 34.0, 21.0, 13.0, 10.0, 10.0, 5.0, 3.0, 8.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7763671875, -0.7542724609375, -0.732177734375, -0.7100830078125, -0.68798828125, -0.6658935546875, -0.643798828125, -0.6217041015625, -0.599609375, -0.5775146484375, -0.555419921875, -0.5333251953125, -0.51123046875, -0.4891357421875, -0.467041015625, -0.4449462890625, -0.4228515625, -0.4007568359375, -0.378662109375, -0.3565673828125, -0.33447265625, -0.3123779296875, -0.290283203125, -0.2681884765625, -0.24609375, -0.2239990234375, -0.201904296875, -0.1798095703125, -0.15771484375, -0.1356201171875, -0.113525390625, -0.0914306640625, -0.0693359375, -0.0472412109375, -0.025146484375, -0.0030517578125, 0.01904296875, 0.0411376953125, 0.063232421875, 0.0853271484375, 0.107421875, 0.1295166015625, 0.151611328125, 0.1737060546875, 0.19580078125, 0.2178955078125, 0.239990234375, 0.2620849609375, 0.2841796875, 0.3062744140625, 0.328369140625, 0.3504638671875, 0.37255859375, 0.3946533203125, 0.416748046875, 0.4388427734375, 0.4609375, 0.4830322265625, 0.505126953125, 0.5272216796875, 0.54931640625, 0.5714111328125, 0.593505859375, 0.6156005859375, 0.6376953125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 16.0, 63.0, 113.0, 196.0, 216.0, 186.0, 138.0, 59.0, 16.0, 6.0, 1.0], "bins": [-27.351041793823242, -26.875194549560547, -26.39934730529785, -25.92350196838379, -25.447654724121094, -24.9718074798584, -24.495960235595703, -24.02011489868164, -23.544267654418945, -23.06842041015625, -22.592573165893555, -22.116727828979492, -21.640880584716797, -21.1650333404541, -20.689186096191406, -20.213340759277344, -19.73749351501465, -19.261646270751953, -18.785799026489258, -18.309953689575195, -17.8341064453125, -17.358259201049805, -16.88241195678711, -16.406566619873047, -15.930718421936035, -15.45487117767334, -14.979024887084961, -14.503177642822266, -14.027331352233887, -13.551484107971191, -13.075637817382812, -12.599790573120117, -12.123944282531738, -11.648097038269043, -11.172250747680664, -10.696403503417969, -10.22055721282959, -9.744709968566895, -9.268863677978516, -8.79301643371582, -8.317170143127441, -7.841323375701904, -7.365476608276367, -6.88962984085083, -6.413783073425293, -5.937935829162598, -5.462089538574219, -4.986242294311523, -4.5103960037231445, -4.034549236297607, -3.5587024688720703, -3.082855701446533, -2.607008934020996, -2.13116192817688, -1.6553151607513428, -1.1794683933258057, -0.7036213874816895, -0.22777459025382996, 0.24807220697402954, 0.7239190340042114, 1.1997658014297485, 1.6756126880645752, 2.1514594554901123, 2.6273062229156494, 3.1031529903411865]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 8.0, 5.0, 14.0, 10.0, 12.0, 28.0, 17.0, 22.0, 25.0, 29.0, 22.0, 30.0, 37.0, 40.0, 37.0, 48.0, 33.0, 43.0, 40.0, 41.0, 46.0, 43.0, 48.0, 39.0, 40.0, 32.0, 23.0, 38.0, 32.0, 33.0, 15.0, 17.0, 9.0, 7.0, 9.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.472193241119385, -6.257626533508301, -6.043060302734375, -5.828493595123291, -5.613926887512207, -5.399360656738281, -5.184793949127197, -4.970227241516113, -4.7556610107421875, -4.5410943031311035, -4.326528072357178, -4.111961364746094, -3.8973946571350098, -3.682828187942505, -3.46826171875, -3.253695011138916, -3.039128303527832, -2.824561834335327, -2.609995126724243, -2.3954286575317383, -2.1808619499206543, -1.9662954807281494, -1.7517290115356445, -1.53716242313385, -1.3225958347320557, -1.1080292463302612, -0.8934627175331116, -0.6788961887359619, -0.4643296003341675, -0.24976301193237305, -0.035196542739868164, 0.17937004566192627, 0.3939371109008789, 0.6085036993026733, 0.823070228099823, 1.0376367568969727, 1.252203345298767, 1.4667699337005615, 1.6813364028930664, 1.8959029912948608, 2.1104695796966553, 2.32503604888916, 2.539602756500244, 2.754169225692749, 2.968735694885254, 3.183302402496338, 3.3978688716888428, 3.6124353408813477, 3.8270020484924316, 4.041568756103516, 4.256134986877441, 4.470701694488525, 4.685268402099609, 4.899834632873535, 5.114401340484619, 5.328968048095703, 5.543534278869629, 5.758100986480713, 5.972667217254639, 6.187233924865723, 6.401800632476807, 6.616367340087891, 6.830933570861816, 7.0455002784729, 7.260066986083984]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 14.0, 8.0, 15.0, 20.0, 19.0, 23.0, 37.0, 41.0, 58.0, 76.0, 96.0, 120.0, 182.0, 230.0, 438.0, 1016.0, 2907.0, 12268.0, 99758.0, 1530906.0, 2320168.0, 199783.0, 19300.0, 3997.0, 1191.0, 548.0, 302.0, 183.0, 136.0, 70.0, 64.0, 65.0, 50.0, 40.0, 36.0, 30.0, 22.0, 11.0, 11.0, 9.0, 4.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.24609375, -5.09234619140625, -4.9385986328125, -4.78485107421875, -4.631103515625, -4.47735595703125, -4.3236083984375, -4.16986083984375, -4.01611328125, -3.86236572265625, -3.7086181640625, -3.55487060546875, -3.401123046875, -3.24737548828125, -3.0936279296875, -2.93988037109375, -2.7861328125, -2.63238525390625, -2.4786376953125, -2.32489013671875, -2.171142578125, -2.01739501953125, -1.8636474609375, -1.70989990234375, -1.55615234375, -1.40240478515625, -1.2486572265625, -1.09490966796875, -0.941162109375, -0.78741455078125, -0.6336669921875, -0.47991943359375, -0.326171875, -0.17242431640625, -0.0186767578125, 0.13507080078125, 0.288818359375, 0.44256591796875, 0.5963134765625, 0.75006103515625, 0.90380859375, 1.05755615234375, 1.2113037109375, 1.36505126953125, 1.518798828125, 1.67254638671875, 1.8262939453125, 1.98004150390625, 2.1337890625, 2.28753662109375, 2.4412841796875, 2.59503173828125, 2.748779296875, 2.90252685546875, 3.0562744140625, 3.21002197265625, 3.36376953125, 3.51751708984375, 3.6712646484375, 3.82501220703125, 3.978759765625, 4.13250732421875, 4.2862548828125, 4.44000244140625, 4.59375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 3.0, 2.0, 9.0, 15.0, 11.0, 13.0, 11.0, 17.0, 18.0, 22.0, 26.0, 23.0, 19.0, 27.0, 31.0, 35.0, 35.0, 37.0, 39.0, 31.0, 30.0, 40.0, 39.0, 44.0, 26.0, 39.0, 41.0, 33.0, 25.0, 31.0, 23.0, 26.0, 24.0, 18.0, 26.0, 18.0, 18.0, 11.0, 11.0, 9.0, 9.0, 7.0, 4.0, 3.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-1.919921875, -1.8626861572265625, -1.805450439453125, -1.7482147216796875, -1.69097900390625, -1.6337432861328125, -1.576507568359375, -1.5192718505859375, -1.4620361328125, -1.4048004150390625, -1.347564697265625, -1.2903289794921875, -1.23309326171875, -1.1758575439453125, -1.118621826171875, -1.0613861083984375, -1.004150390625, -0.9469146728515625, -0.889678955078125, -0.8324432373046875, -0.77520751953125, -0.7179718017578125, -0.660736083984375, -0.6035003662109375, -0.5462646484375, -0.4890289306640625, -0.431793212890625, -0.3745574951171875, -0.31732177734375, -0.2600860595703125, -0.202850341796875, -0.1456146240234375, -0.08837890625, -0.0311431884765625, 0.026092529296875, 0.0833282470703125, 0.14056396484375, 0.1977996826171875, 0.255035400390625, 0.3122711181640625, 0.3695068359375, 0.4267425537109375, 0.483978271484375, 0.5412139892578125, 0.59844970703125, 0.6556854248046875, 0.712921142578125, 0.7701568603515625, 0.827392578125, 0.8846282958984375, 0.941864013671875, 0.9990997314453125, 1.05633544921875, 1.1135711669921875, 1.170806884765625, 1.2280426025390625, 1.2852783203125, 1.3425140380859375, 1.399749755859375, 1.4569854736328125, 1.51422119140625, 1.5714569091796875, 1.628692626953125, 1.6859283447265625, 1.7431640625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 15.0, 16.0, 35.0, 74.0, 197.0, 430.0, 1247.0, 5602.0, 348848.0, 3812643.0, 21723.0, 2258.0, 670.0, 235.0, 127.0, 45.0, 30.0, 27.0, 18.0, 5.0, 7.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.2158203125, -11.869140625, -11.5224609375, -11.17578125, -10.8291015625, -10.482421875, -10.1357421875, -9.7890625, -9.4423828125, -9.095703125, -8.7490234375, -8.40234375, -8.0556640625, -7.708984375, -7.3623046875, -7.015625, -6.6689453125, -6.322265625, -5.9755859375, -5.62890625, -5.2822265625, -4.935546875, -4.5888671875, -4.2421875, -3.8955078125, -3.548828125, -3.2021484375, -2.85546875, -2.5087890625, -2.162109375, -1.8154296875, -1.46875, -1.1220703125, -0.775390625, -0.4287109375, -0.08203125, 0.2646484375, 0.611328125, 0.9580078125, 1.3046875, 1.6513671875, 1.998046875, 2.3447265625, 2.69140625, 3.0380859375, 3.384765625, 3.7314453125, 4.078125, 4.4248046875, 4.771484375, 5.1181640625, 5.46484375, 5.8115234375, 6.158203125, 6.5048828125, 6.8515625, 7.1982421875, 7.544921875, 7.8916015625, 8.23828125, 8.5849609375, 8.931640625, 9.2783203125, 9.625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 10.0, 8.0, 6.0, 18.0, 38.0, 53.0, 121.0, 207.0, 378.0, 604.0, 764.0, 711.0, 498.0, 309.0, 168.0, 84.0, 48.0, 24.0, 11.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6494140625, -1.5901031494140625, -1.530792236328125, -1.4714813232421875, -1.41217041015625, -1.3528594970703125, -1.293548583984375, -1.2342376708984375, -1.1749267578125, -1.1156158447265625, -1.056304931640625, -0.9969940185546875, -0.93768310546875, -0.8783721923828125, -0.819061279296875, -0.7597503662109375, -0.700439453125, -0.6411285400390625, -0.581817626953125, -0.5225067138671875, -0.46319580078125, -0.4038848876953125, -0.344573974609375, -0.2852630615234375, -0.2259521484375, -0.1666412353515625, -0.107330322265625, -0.0480194091796875, 0.01129150390625, 0.0706024169921875, 0.129913330078125, 0.1892242431640625, 0.24853515625, 0.3078460693359375, 0.367156982421875, 0.4264678955078125, 0.48577880859375, 0.5450897216796875, 0.604400634765625, 0.6637115478515625, 0.7230224609375, 0.7823333740234375, 0.841644287109375, 0.9009552001953125, 0.96026611328125, 1.0195770263671875, 1.078887939453125, 1.1381988525390625, 1.197509765625, 1.2568206787109375, 1.316131591796875, 1.3754425048828125, 1.43475341796875, 1.4940643310546875, 1.553375244140625, 1.6126861572265625, 1.6719970703125, 1.7313079833984375, 1.790618896484375, 1.8499298095703125, 1.90924072265625, 1.9685516357421875, 2.027862548828125, 2.0871734619140625, 2.146484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 4.0, 10.0, 7.0, 7.0, 12.0, 19.0, 10.0, 16.0, 19.0, 17.0, 22.0, 39.0, 34.0, 35.0, 35.0, 36.0, 32.0, 53.0, 39.0, 32.0, 38.0, 50.0, 39.0, 45.0, 48.0, 35.0, 34.0, 33.0, 30.0, 28.0, 34.0, 25.0, 15.0, 13.0, 13.0, 14.0, 7.0, 7.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7215549945831299, -1.6502245664596558, -1.5788942575454712, -1.507563829421997, -1.436233401298523, -1.3649029731750488, -1.2935726642608643, -1.2222422361373901, -1.150911808013916, -1.079581379890442, -1.0082510709762573, -0.9369206428527832, -0.8655902147293091, -0.7942598462104797, -0.7229294776916504, -0.6515990495681763, -0.5802687406539917, -0.5089383721351624, -0.43760794401168823, -0.3662775754928589, -0.29494717717170715, -0.22361677885055542, -0.15228641033172607, -0.08095601201057434, -0.009625613689422607, 0.06170477718114853, 0.13303516805171967, 0.2043655514717102, 0.27569594979286194, 0.34702634811401367, 0.418356716632843, 0.48968711495399475, 0.5610175132751465, 0.6323478817939758, 0.70367830991745, 0.7750086784362793, 0.8463391065597534, 0.9176694750785828, 0.9889998435974121, 1.0603302717208862, 1.1316606998443604, 1.2029911279678345, 1.274321436882019, 1.3456518650054932, 1.4169822931289673, 1.4883127212524414, 1.559643030166626, 1.6309734582901, 1.7023037672042847, 1.7736341953277588, 1.8449645042419434, 1.9162949323654175, 1.9876253604888916, 2.058955669403076, 2.13028621673584, 2.2016165256500244, 2.272946834564209, 2.3442771434783936, 2.4156076908111572, 2.486937999725342, 2.5582683086395264, 2.62959885597229, 2.7009291648864746, 2.772259473800659, 2.843590021133423]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 7.0, 1.0, 5.0, 4.0, 1.0, 8.0, 5.0, 3.0, 6.0, 8.0, 3.0, 15.0, 13.0, 15.0, 14.0, 19.0, 21.0, 15.0, 18.0, 17.0, 27.0, 23.0, 32.0, 35.0, 43.0, 29.0, 42.0, 34.0, 40.0, 38.0, 40.0, 34.0, 34.0, 24.0, 36.0, 44.0, 31.0, 25.0, 29.0, 20.0, 18.0, 28.0, 17.0, 13.0, 13.0, 12.0, 9.0, 6.0, 7.0, 9.0, 2.0, 4.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.1947810649871826, -2.127588987350464, -2.060397148132324, -1.9932050704956055, -1.9260129928588867, -1.8588210344314575, -1.7916290760040283, -1.7244369983673096, -1.6572449207305908, -1.5900529623031616, -1.5228608846664429, -1.4556689262390137, -1.388476848602295, -1.3212848901748657, -1.2540929317474365, -1.1869008541107178, -1.1197088956832886, -1.0525169372558594, -0.9853248596191406, -0.9181329011917114, -0.8509408235549927, -0.7837488651275635, -0.7165568470954895, -0.6493648290634155, -0.5821728110313416, -0.5149807929992676, -0.4477887749671936, -0.380596786737442, -0.31340476870536804, -0.24621275067329407, -0.17902076244354248, -0.1118287444114685, -0.04463672637939453, 0.022555284202098846, 0.08974729478359222, 0.156939297914505, 0.22413131594657898, 0.29132333397865295, 0.35851532220840454, 0.4257073402404785, 0.4928993582725525, 0.5600913763046265, 0.6272833943367004, 0.6944754123687744, 0.7616673707962036, 0.8288594484329224, 0.8960514068603516, 0.9632434248924255, 1.0304354429244995, 1.0976274013519287, 1.1648194789886475, 1.2320114374160767, 1.2992035150527954, 1.3663954734802246, 1.4335875511169434, 1.5007795095443726, 1.5679714679718018, 1.635163426399231, 1.7023555040359497, 1.769547462463379, 1.8367395401000977, 1.9039314985275269, 1.971123456954956, 2.038315534591675, 2.1055076122283936]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 6.0, 10.0, 7.0, 13.0, 20.0, 20.0, 32.0, 39.0, 52.0, 62.0, 93.0, 138.0, 151.0, 193.0, 311.0, 454.0, 641.0, 1335.0, 4154.0, 30724.0, 342504.0, 581207.0, 74473.0, 7473.0, 1815.0, 822.0, 491.0, 350.0, 233.0, 186.0, 125.0, 83.0, 78.0, 64.0, 45.0, 38.0, 26.0, 22.0, 17.0, 8.0, 7.0, 5.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.94287109375, -0.9144515991210938, -0.8860321044921875, -0.8576126098632812, -0.829193115234375, -0.8007736206054688, -0.7723541259765625, -0.7439346313476562, -0.71551513671875, -0.6870956420898438, -0.6586761474609375, -0.6302566528320312, -0.601837158203125, -0.5734176635742188, -0.5449981689453125, -0.5165786743164062, -0.4881591796875, -0.45973968505859375, -0.4313201904296875, -0.40290069580078125, -0.374481201171875, -0.34606170654296875, -0.3176422119140625, -0.28922271728515625, -0.26080322265625, -0.23238372802734375, -0.2039642333984375, -0.17554473876953125, -0.147125244140625, -0.11870574951171875, -0.0902862548828125, -0.06186676025390625, -0.033447265625, -0.00502777099609375, 0.0233917236328125, 0.05181121826171875, 0.080230712890625, 0.10865020751953125, 0.1370697021484375, 0.16548919677734375, 0.19390869140625, 0.22232818603515625, 0.2507476806640625, 0.27916717529296875, 0.307586669921875, 0.33600616455078125, 0.3644256591796875, 0.39284515380859375, 0.4212646484375, 0.44968414306640625, 0.4781036376953125, 0.5065231323242188, 0.534942626953125, 0.5633621215820312, 0.5917816162109375, 0.6202011108398438, 0.64862060546875, 0.6770401000976562, 0.7054595947265625, 0.7338790893554688, 0.762298583984375, 0.7907180786132812, 0.8191375732421875, 0.8475570678710938, 0.8759765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 7.0, 1.0, 3.0, 6.0, 15.0, 10.0, 16.0, 17.0, 10.0, 16.0, 21.0, 32.0, 22.0, 27.0, 26.0, 32.0, 44.0, 31.0, 37.0, 34.0, 44.0, 43.0, 42.0, 47.0, 32.0, 41.0, 37.0, 43.0, 38.0, 21.0, 22.0, 28.0, 35.0, 14.0, 17.0, 16.0, 12.0, 6.0, 12.0, 7.0, 6.0, 5.0, 10.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.50390625, -1.4547576904296875, -1.405609130859375, -1.3564605712890625, -1.30731201171875, -1.2581634521484375, -1.209014892578125, -1.1598663330078125, -1.1107177734375, -1.0615692138671875, -1.012420654296875, -0.9632720947265625, -0.91412353515625, -0.8649749755859375, -0.815826416015625, -0.7666778564453125, -0.717529296875, -0.6683807373046875, -0.619232177734375, -0.5700836181640625, -0.52093505859375, -0.4717864990234375, -0.422637939453125, -0.3734893798828125, -0.3243408203125, -0.2751922607421875, -0.226043701171875, -0.1768951416015625, -0.12774658203125, -0.0785980224609375, -0.029449462890625, 0.0196990966796875, 0.06884765625, 0.1179962158203125, 0.167144775390625, 0.2162933349609375, 0.26544189453125, 0.3145904541015625, 0.363739013671875, 0.4128875732421875, 0.4620361328125, 0.5111846923828125, 0.560333251953125, 0.6094818115234375, 0.65863037109375, 0.7077789306640625, 0.756927490234375, 0.8060760498046875, 0.855224609375, 0.9043731689453125, 0.953521728515625, 1.0026702880859375, 1.05181884765625, 1.1009674072265625, 1.150115966796875, 1.1992645263671875, 1.2484130859375, 1.2975616455078125, 1.346710205078125, 1.3958587646484375, 1.44500732421875, 1.4941558837890625, 1.543304443359375, 1.5924530029296875, 1.6416015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 4.0, 6.0, 11.0, 15.0, 16.0, 34.0, 61.0, 87.0, 183.0, 304.0, 620.0, 1223.0, 2540.0, 5317.0, 11307.0, 24020.0, 49941.0, 100125.0, 178558.0, 238797.0, 200273.0, 118500.0, 60328.0, 28932.0, 13993.0, 6666.0, 3254.0, 1576.0, 809.0, 461.0, 234.0, 129.0, 86.0, 44.0, 37.0, 27.0, 13.0, 13.0, 9.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2113037109375, -0.20392417907714844, -0.19654464721679688, -0.1891651153564453, -0.18178558349609375, -0.1744060516357422, -0.16702651977539062, -0.15964698791503906, -0.1522674560546875, -0.14488792419433594, -0.13750839233398438, -0.1301288604736328, -0.12274932861328125, -0.11536979675292969, -0.10799026489257812, -0.10061073303222656, -0.093231201171875, -0.08585166931152344, -0.07847213745117188, -0.07109260559082031, -0.06371307373046875, -0.05633354187011719, -0.048954010009765625, -0.04157447814941406, -0.0341949462890625, -0.026815414428710938, -0.019435882568359375, -0.012056350708007812, -0.00467681884765625, 0.0027027130126953125, 0.010082244873046875, 0.017461776733398438, 0.02484130859375, 0.03222084045410156, 0.039600372314453125, 0.04697990417480469, 0.05435943603515625, 0.06173896789550781, 0.06911849975585938, 0.07649803161621094, 0.0838775634765625, 0.09125709533691406, 0.09863662719726562, 0.10601615905761719, 0.11339569091796875, 0.12077522277832031, 0.12815475463867188, 0.13553428649902344, 0.142913818359375, 0.15029335021972656, 0.15767288208007812, 0.1650524139404297, 0.17243194580078125, 0.1798114776611328, 0.18719100952148438, 0.19457054138183594, 0.2019500732421875, 0.20932960510253906, 0.21670913696289062, 0.2240886688232422, 0.23146820068359375, 0.2388477325439453, 0.24622726440429688, 0.25360679626464844, 0.260986328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 7.0, 5.0, 10.0, 14.0, 18.0, 10.0, 21.0, 25.0, 24.0, 25.0, 32.0, 33.0, 42.0, 28.0, 41.0, 48.0, 43.0, 37.0, 53.0, 54.0, 32.0, 33.0, 53.0, 34.0, 42.0, 22.0, 34.0, 23.0, 21.0, 15.0, 23.0, 12.0, 19.0, 8.0, 8.0, 10.0, 11.0, 4.0, 0.0, 6.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.7421875, -3.61822509765625, -3.4942626953125, -3.37030029296875, -3.246337890625, -3.12237548828125, -2.9984130859375, -2.87445068359375, -2.75048828125, -2.62652587890625, -2.5025634765625, -2.37860107421875, -2.254638671875, -2.13067626953125, -2.0067138671875, -1.88275146484375, -1.7587890625, -1.63482666015625, -1.5108642578125, -1.38690185546875, -1.262939453125, -1.13897705078125, -1.0150146484375, -0.89105224609375, -0.76708984375, -0.64312744140625, -0.5191650390625, -0.39520263671875, -0.271240234375, -0.14727783203125, -0.0233154296875, 0.10064697265625, 0.224609375, 0.34857177734375, 0.4725341796875, 0.59649658203125, 0.720458984375, 0.84442138671875, 0.9683837890625, 1.09234619140625, 1.21630859375, 1.34027099609375, 1.4642333984375, 1.58819580078125, 1.712158203125, 1.83612060546875, 1.9600830078125, 2.08404541015625, 2.2080078125, 2.33197021484375, 2.4559326171875, 2.57989501953125, 2.703857421875, 2.82781982421875, 2.9517822265625, 3.07574462890625, 3.19970703125, 3.32366943359375, 3.4476318359375, 3.57159423828125, 3.695556640625, 3.81951904296875, 3.9434814453125, 4.06744384765625, 4.19140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 9.0, 9.0, 13.0, 22.0, 30.0, 49.0, 54.0, 61.0, 115.0, 173.0, 267.0, 439.0, 779.0, 1342.0, 3009.0, 10045.0, 50601.0, 430687.0, 475877.0, 56725.0, 11185.0, 3382.0, 1583.0, 792.0, 480.0, 280.0, 155.0, 123.0, 79.0, 37.0, 36.0, 44.0, 19.0, 13.0, 14.0, 6.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11688232421875, -0.1129903793334961, -0.10909843444824219, -0.10520648956298828, -0.10131454467773438, -0.09742259979248047, -0.09353065490722656, -0.08963871002197266, -0.08574676513671875, -0.08185482025146484, -0.07796287536621094, -0.07407093048095703, -0.07017898559570312, -0.06628704071044922, -0.06239509582519531, -0.058503150939941406, -0.0546112060546875, -0.050719261169433594, -0.04682731628417969, -0.04293537139892578, -0.039043426513671875, -0.03515148162841797, -0.03125953674316406, -0.027367591857910156, -0.02347564697265625, -0.019583702087402344, -0.015691757202148438, -0.011799812316894531, -0.007907867431640625, -0.004015922546386719, -0.0001239776611328125, 0.0037679672241210938, 0.007659912109375, 0.011551856994628906, 0.015443801879882812, 0.01933574676513672, 0.023227691650390625, 0.02711963653564453, 0.031011581420898438, 0.034903526306152344, 0.03879547119140625, 0.042687416076660156, 0.04657936096191406, 0.05047130584716797, 0.054363250732421875, 0.05825519561767578, 0.06214714050292969, 0.0660390853881836, 0.0699310302734375, 0.0738229751586914, 0.07771492004394531, 0.08160686492919922, 0.08549880981445312, 0.08939075469970703, 0.09328269958496094, 0.09717464447021484, 0.10106658935546875, 0.10495853424072266, 0.10885047912597656, 0.11274242401123047, 0.11663436889648438, 0.12052631378173828, 0.12441825866699219, 0.1283102035522461, 0.1322021484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 11.0, 27.0, 50.0, 68.0, 96.0, 136.0, 162.0, 135.0, 101.0, 97.0, 53.0, 26.0, 19.0, 5.0, 9.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0001443624496459961, -0.0001411382108926773, -0.00013791397213935852, -0.00013468973338603973, -0.00013146549463272095, -0.00012824125587940216, -0.00012501701712608337, -0.00012179277837276459, -0.0001185685396194458, -0.00011534430086612701, -0.00011212006211280823, -0.00010889582335948944, -0.00010567158460617065, -0.00010244734585285187, -9.922310709953308e-05, -9.59988683462143e-05, -9.277462959289551e-05, -8.955039083957672e-05, -8.632615208625793e-05, -8.310191333293915e-05, -7.987767457962036e-05, -7.665343582630157e-05, -7.342919707298279e-05, -7.0204958319664e-05, -6.698071956634521e-05, -6.375648081302643e-05, -6.053224205970764e-05, -5.7308003306388855e-05, -5.408376455307007e-05, -5.085952579975128e-05, -4.7635287046432495e-05, -4.441104829311371e-05, -4.118680953979492e-05, -3.7962570786476135e-05, -3.473833203315735e-05, -3.151409327983856e-05, -2.8289854526519775e-05, -2.506561577320099e-05, -2.1841377019882202e-05, -1.8617138266563416e-05, -1.539289951324463e-05, -1.2168660759925842e-05, -8.944422006607056e-06, -5.720183253288269e-06, -2.4959444999694824e-06, 7.282942533493042e-07, 3.952533006668091e-06, 7.1767717599868774e-06, 1.0401010513305664e-05, 1.362524926662445e-05, 1.6849488019943237e-05, 2.0073726773262024e-05, 2.329796552658081e-05, 2.6522204279899597e-05, 2.9746443033218384e-05, 3.297068178653717e-05, 3.619492053985596e-05, 3.9419159293174744e-05, 4.264339804649353e-05, 4.586763679981232e-05, 4.9091875553131104e-05, 5.231611430644989e-05, 5.554035305976868e-05, 5.876459181308746e-05, 6.198883056640625e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 9.0, 13.0, 14.0, 21.0, 31.0, 75.0, 90.0, 135.0, 224.0, 382.0, 619.0, 1164.0, 2024.0, 3571.0, 6515.0, 12323.0, 24708.0, 54786.0, 161422.0, 494048.0, 175596.0, 57590.0, 25635.0, 12663.0, 6642.0, 3609.0, 2010.0, 1090.0, 627.0, 365.0, 200.0, 130.0, 76.0, 37.0, 33.0, 22.0, 15.0, 13.0, 4.0, 4.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09375, -0.0905752182006836, -0.08740043640136719, -0.08422565460205078, -0.08105087280273438, -0.07787609100341797, -0.07470130920410156, -0.07152652740478516, -0.06835174560546875, -0.06517696380615234, -0.06200218200683594, -0.05882740020751953, -0.055652618408203125, -0.05247783660888672, -0.04930305480957031, -0.046128273010253906, -0.0429534912109375, -0.039778709411621094, -0.03660392761230469, -0.03342914581298828, -0.030254364013671875, -0.02707958221435547, -0.023904800415039062, -0.020730018615722656, -0.01755523681640625, -0.014380455017089844, -0.011205673217773438, -0.008030891418457031, -0.004856109619140625, -0.0016813278198242188, 0.0014934539794921875, 0.004668235778808594, 0.007843017578125, 0.011017799377441406, 0.014192581176757812, 0.01736736297607422, 0.020542144775390625, 0.02371692657470703, 0.026891708374023438, 0.030066490173339844, 0.03324127197265625, 0.036416053771972656, 0.03959083557128906, 0.04276561737060547, 0.045940399169921875, 0.04911518096923828, 0.05228996276855469, 0.055464744567871094, 0.0586395263671875, 0.061814308166503906, 0.06498908996582031, 0.06816387176513672, 0.07133865356445312, 0.07451343536376953, 0.07768821716308594, 0.08086299896240234, 0.08403778076171875, 0.08721256256103516, 0.09038734436035156, 0.09356212615966797, 0.09673690795898438, 0.09991168975830078, 0.10308647155761719, 0.1062612533569336, 0.10943603515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 8.0, 7.0, 7.0, 4.0, 13.0, 10.0, 7.0, 14.0, 20.0, 17.0, 25.0, 29.0, 32.0, 36.0, 44.0, 80.0, 117.0, 122.0, 97.0, 78.0, 31.0, 39.0, 21.0, 29.0, 15.0, 12.0, 11.0, 12.0, 9.0, 12.0, 4.0, 6.0, 7.0, 3.0, 10.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0379638671875, -0.03681802749633789, -0.03567218780517578, -0.03452634811401367, -0.03338050842285156, -0.03223466873168945, -0.031088829040527344, -0.029942989349365234, -0.028797149658203125, -0.027651309967041016, -0.026505470275878906, -0.025359630584716797, -0.024213790893554688, -0.023067951202392578, -0.02192211151123047, -0.02077627182006836, -0.01963043212890625, -0.01848459243774414, -0.01733875274658203, -0.016192913055419922, -0.015047073364257812, -0.013901233673095703, -0.012755393981933594, -0.011609554290771484, -0.010463714599609375, -0.009317874908447266, -0.008172035217285156, -0.007026195526123047, -0.0058803558349609375, -0.004734516143798828, -0.0035886764526367188, -0.0024428367614746094, -0.0012969970703125, -0.00015115737915039062, 0.0009946823120117188, 0.002140522003173828, 0.0032863616943359375, 0.004432201385498047, 0.005578041076660156, 0.006723880767822266, 0.007869720458984375, 0.009015560150146484, 0.010161399841308594, 0.011307239532470703, 0.012453079223632812, 0.013598918914794922, 0.014744758605957031, 0.01589059829711914, 0.01703643798828125, 0.01818227767944336, 0.01932811737060547, 0.020473957061767578, 0.021619796752929688, 0.022765636444091797, 0.023911476135253906, 0.025057315826416016, 0.026203155517578125, 0.027348995208740234, 0.028494834899902344, 0.029640674591064453, 0.030786514282226562, 0.03193235397338867, 0.03307819366455078, 0.03422403335571289, 0.035369873046875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 7.0, 7.0, 16.0, 24.0, 19.0, 20.0, 21.0, 31.0, 34.0, 50.0, 37.0, 50.0, 43.0, 44.0, 56.0, 52.0, 52.0, 59.0, 49.0, 43.0, 50.0, 38.0, 41.0, 40.0, 23.0, 26.0, 13.0, 13.0, 11.0, 5.0, 6.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6552765369415283, -1.6028623580932617, -1.5504481792449951, -1.498033881187439, -1.4456197023391724, -1.3932055234909058, -1.3407912254333496, -1.288377046585083, -1.2359628677368164, -1.1835486888885498, -1.1311345100402832, -1.078720211982727, -1.0263060331344604, -0.9738918542861938, -0.9214776158332825, -0.8690633773803711, -0.8166491985321045, -0.7642350196838379, -0.7118207812309265, -0.6594065427780151, -0.6069923639297485, -0.5545781850814819, -0.5021639466285706, -0.44974973797798157, -0.3973355293273926, -0.3449213206768036, -0.2925071120262146, -0.2400929033756256, -0.18767869472503662, -0.13526448607444763, -0.08285027742385864, -0.030436068773269653, 0.021978139877319336, 0.07439234852790833, 0.12680655717849731, 0.1792207658290863, 0.2316349744796753, 0.2840491831302643, 0.33646339178085327, 0.38887760043144226, 0.44129180908203125, 0.49370601773262024, 0.5461202263832092, 0.5985344648361206, 0.6509486436843872, 0.7033628225326538, 0.7557770609855652, 0.8081912994384766, 0.8606054782867432, 0.9130196571350098, 0.9654338955879211, 1.0178481340408325, 1.0702623128890991, 1.1226764917373657, 1.1750907897949219, 1.2275049686431885, 1.279919147491455, 1.3323333263397217, 1.3847475051879883, 1.4371618032455444, 1.489575982093811, 1.5419901609420776, 1.5944044589996338, 1.6468186378479004, 1.699232816696167]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 3.0, 4.0, 3.0, 8.0, 8.0, 7.0, 13.0, 10.0, 13.0, 13.0, 19.0, 17.0, 13.0, 25.0, 18.0, 27.0, 28.0, 24.0, 28.0, 32.0, 34.0, 40.0, 44.0, 31.0, 31.0, 49.0, 33.0, 38.0, 26.0, 41.0, 35.0, 34.0, 32.0, 22.0, 19.0, 23.0, 27.0, 17.0, 14.0, 10.0, 17.0, 12.0, 3.0, 7.0, 12.0, 4.0, 4.0, 5.0, 4.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2711260318756104, -1.2295622825622559, -1.187998652458191, -1.1464349031448364, -1.1048712730407715, -1.063307523727417, -1.0217437744140625, -0.9801800847053528, -0.9386163949966431, -0.8970527052879333, -0.8554890155792236, -0.8139252662658691, -0.7723615765571594, -0.7307978868484497, -0.6892341375350952, -0.6476704478263855, -0.6061067581176758, -0.5645430684089661, -0.5229793787002563, -0.48141562938690186, -0.43985193967819214, -0.3982882499694824, -0.3567245304584503, -0.3151608109474182, -0.2735971212387085, -0.23203341662883759, -0.19046971201896667, -0.14890600740909576, -0.10734230279922485, -0.06577859818935394, -0.024214893579483032, 0.017348825931549072, 0.05891263484954834, 0.10047633945941925, 0.14204004406929016, 0.18360374867916107, 0.22516745328903198, 0.2667311429977417, 0.3082948625087738, 0.3498585820198059, 0.3914222717285156, 0.43298596143722534, 0.47454968094825745, 0.5161134004592896, 0.5576770901679993, 0.599240779876709, 0.6408045291900635, 0.6823682188987732, 0.7239319086074829, 0.7654955983161926, 0.8070592880249023, 0.8486230373382568, 0.8901867270469666, 0.9317504167556763, 0.9733141660690308, 1.0148777961730957, 1.0564415454864502, 1.0980052947998047, 1.1395689249038696, 1.1811326742172241, 1.222696304321289, 1.2642600536346436, 1.305823802947998, 1.3473875522613525, 1.3889511823654175]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 8.0, 7.0, 11.0, 13.0, 22.0, 22.0, 30.0, 47.0, 57.0, 90.0, 94.0, 140.0, 226.0, 304.0, 457.0, 814.0, 1458.0, 2592.0, 4705.0, 9090.0, 18215.0, 36226.0, 71433.0, 130497.0, 199966.0, 220859.0, 160039.0, 92886.0, 47856.0, 24220.0, 12004.0, 6117.0, 3230.0, 1819.0, 1053.0, 654.0, 385.0, 262.0, 174.0, 129.0, 73.0, 65.0, 38.0, 37.0, 36.0, 23.0, 22.0, 13.0, 9.0, 7.0, 9.0, 5.0, 3.0, 2.0, 3.0], "bins": [-2.060546875, -2.00030517578125, -1.9400634765625, -1.87982177734375, -1.819580078125, -1.75933837890625, -1.6990966796875, -1.63885498046875, -1.57861328125, -1.51837158203125, -1.4581298828125, -1.39788818359375, -1.337646484375, -1.27740478515625, -1.2171630859375, -1.15692138671875, -1.0966796875, -1.03643798828125, -0.9761962890625, -0.91595458984375, -0.855712890625, -0.79547119140625, -0.7352294921875, -0.67498779296875, -0.61474609375, -0.55450439453125, -0.4942626953125, -0.43402099609375, -0.373779296875, -0.31353759765625, -0.2532958984375, -0.19305419921875, -0.1328125, -0.07257080078125, -0.0123291015625, 0.04791259765625, 0.108154296875, 0.16839599609375, 0.2286376953125, 0.28887939453125, 0.34912109375, 0.40936279296875, 0.4696044921875, 0.52984619140625, 0.590087890625, 0.65032958984375, 0.7105712890625, 0.77081298828125, 0.8310546875, 0.89129638671875, 0.9515380859375, 1.01177978515625, 1.072021484375, 1.13226318359375, 1.1925048828125, 1.25274658203125, 1.31298828125, 1.37322998046875, 1.4334716796875, 1.49371337890625, 1.553955078125, 1.61419677734375, 1.6744384765625, 1.73468017578125, 1.794921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 9.0, 5.0, 6.0, 4.0, 11.0, 9.0, 11.0, 20.0, 17.0, 16.0, 19.0, 27.0, 27.0, 28.0, 29.0, 34.0, 26.0, 36.0, 39.0, 27.0, 33.0, 43.0, 47.0, 42.0, 38.0, 51.0, 34.0, 31.0, 28.0, 28.0, 21.0, 24.0, 34.0, 23.0, 15.0, 14.0, 13.0, 9.0, 9.0, 9.0, 12.0, 5.0, 9.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.48828125, -2.41522216796875, -2.3421630859375, -2.26910400390625, -2.196044921875, -2.12298583984375, -2.0499267578125, -1.97686767578125, -1.90380859375, -1.83074951171875, -1.7576904296875, -1.68463134765625, -1.611572265625, -1.53851318359375, -1.4654541015625, -1.39239501953125, -1.3193359375, -1.24627685546875, -1.1732177734375, -1.10015869140625, -1.027099609375, -0.95404052734375, -0.8809814453125, -0.80792236328125, -0.73486328125, -0.66180419921875, -0.5887451171875, -0.51568603515625, -0.442626953125, -0.36956787109375, -0.2965087890625, -0.22344970703125, -0.150390625, -0.07733154296875, -0.0042724609375, 0.06878662109375, 0.141845703125, 0.21490478515625, 0.2879638671875, 0.36102294921875, 0.43408203125, 0.50714111328125, 0.5802001953125, 0.65325927734375, 0.726318359375, 0.79937744140625, 0.8724365234375, 0.94549560546875, 1.0185546875, 1.09161376953125, 1.1646728515625, 1.23773193359375, 1.310791015625, 1.38385009765625, 1.4569091796875, 1.52996826171875, 1.60302734375, 1.67608642578125, 1.7491455078125, 1.82220458984375, 1.895263671875, 1.96832275390625, 2.0413818359375, 2.11444091796875, 2.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 8.0, 9.0, 8.0, 20.0, 16.0, 18.0, 31.0, 51.0, 70.0, 129.0, 230.0, 365.0, 721.0, 1727.0, 5212.0, 18450.0, 75947.0, 288450.0, 439141.0, 162912.0, 39443.0, 10142.0, 3013.0, 1137.0, 533.0, 264.0, 173.0, 92.0, 81.0, 56.0, 25.0, 23.0, 16.0, 6.0, 12.0, 6.0, 2.0, 4.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.27728271484375, -4.1405029296875, -4.00372314453125, -3.866943359375, -3.73016357421875, -3.5933837890625, -3.45660400390625, -3.31982421875, -3.18304443359375, -3.0462646484375, -2.90948486328125, -2.772705078125, -2.63592529296875, -2.4991455078125, -2.36236572265625, -2.2255859375, -2.08880615234375, -1.9520263671875, -1.81524658203125, -1.678466796875, -1.54168701171875, -1.4049072265625, -1.26812744140625, -1.13134765625, -0.99456787109375, -0.8577880859375, -0.72100830078125, -0.584228515625, -0.44744873046875, -0.3106689453125, -0.17388916015625, -0.037109375, 0.09967041015625, 0.2364501953125, 0.37322998046875, 0.510009765625, 0.64678955078125, 0.7835693359375, 0.92034912109375, 1.05712890625, 1.19390869140625, 1.3306884765625, 1.46746826171875, 1.604248046875, 1.74102783203125, 1.8778076171875, 2.01458740234375, 2.1513671875, 2.28814697265625, 2.4249267578125, 2.56170654296875, 2.698486328125, 2.83526611328125, 2.9720458984375, 3.10882568359375, 3.24560546875, 3.38238525390625, 3.5191650390625, 3.65594482421875, 3.792724609375, 3.92950439453125, 4.0662841796875, 4.20306396484375, 4.33984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 7.0, 7.0, 9.0, 11.0, 11.0, 15.0, 16.0, 16.0, 23.0, 21.0, 23.0, 29.0, 34.0, 37.0, 38.0, 29.0, 42.0, 42.0, 50.0, 48.0, 40.0, 45.0, 54.0, 37.0, 34.0, 35.0, 35.0, 37.0, 30.0, 22.0, 26.0, 22.0, 10.0, 9.0, 14.0, 17.0, 4.0, 9.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.076171875, -2.98394775390625, -2.8917236328125, -2.79949951171875, -2.707275390625, -2.61505126953125, -2.5228271484375, -2.43060302734375, -2.33837890625, -2.24615478515625, -2.1539306640625, -2.06170654296875, -1.969482421875, -1.87725830078125, -1.7850341796875, -1.69281005859375, -1.6005859375, -1.50836181640625, -1.4161376953125, -1.32391357421875, -1.231689453125, -1.13946533203125, -1.0472412109375, -0.95501708984375, -0.86279296875, -0.77056884765625, -0.6783447265625, -0.58612060546875, -0.493896484375, -0.40167236328125, -0.3094482421875, -0.21722412109375, -0.125, -0.03277587890625, 0.0594482421875, 0.15167236328125, 0.243896484375, 0.33612060546875, 0.4283447265625, 0.52056884765625, 0.61279296875, 0.70501708984375, 0.7972412109375, 0.88946533203125, 0.981689453125, 1.07391357421875, 1.1661376953125, 1.25836181640625, 1.3505859375, 1.44281005859375, 1.5350341796875, 1.62725830078125, 1.719482421875, 1.81170654296875, 1.9039306640625, 1.99615478515625, 2.08837890625, 2.18060302734375, 2.2728271484375, 2.36505126953125, 2.457275390625, 2.54949951171875, 2.6417236328125, 2.73394775390625, 2.826171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 1.0, 3.0, 3.0, 9.0, 15.0, 29.0, 38.0, 45.0, 84.0, 194.0, 316.0, 596.0, 1236.0, 2579.0, 5802.0, 13992.0, 36254.0, 93159.0, 210795.0, 355619.0, 191133.0, 82554.0, 31944.0, 12301.0, 5178.0, 2287.0, 1125.0, 586.0, 295.0, 155.0, 83.0, 56.0, 24.0, 23.0, 20.0, 14.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5356216430664062, -0.5180206298828125, -0.5004196166992188, -0.482818603515625, -0.46521759033203125, -0.4476165771484375, -0.43001556396484375, -0.41241455078125, -0.39481353759765625, -0.3772125244140625, -0.35961151123046875, -0.342010498046875, -0.32440948486328125, -0.3068084716796875, -0.28920745849609375, -0.2716064453125, -0.25400543212890625, -0.2364044189453125, -0.21880340576171875, -0.201202392578125, -0.18360137939453125, -0.1660003662109375, -0.14839935302734375, -0.13079833984375, -0.11319732666015625, -0.0955963134765625, -0.07799530029296875, -0.060394287109375, -0.04279327392578125, -0.0251922607421875, -0.00759124755859375, 0.010009765625, 0.02761077880859375, 0.0452117919921875, 0.06281280517578125, 0.080413818359375, 0.09801483154296875, 0.1156158447265625, 0.13321685791015625, 0.15081787109375, 0.16841888427734375, 0.1860198974609375, 0.20362091064453125, 0.221221923828125, 0.23882293701171875, 0.2564239501953125, 0.27402496337890625, 0.2916259765625, 0.30922698974609375, 0.3268280029296875, 0.34442901611328125, 0.362030029296875, 0.37963104248046875, 0.3972320556640625, 0.41483306884765625, 0.43243408203125, 0.45003509521484375, 0.4676361083984375, 0.48523712158203125, 0.502838134765625, 0.5204391479492188, 0.5380401611328125, 0.5556411743164062, 0.5732421875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 5.0, 5.0, 7.0, 8.0, 17.0, 13.0, 24.0, 15.0, 22.0, 26.0, 41.0, 50.0, 39.0, 56.0, 71.0, 85.0, 99.0, 70.0, 67.0, 43.0, 41.0, 22.0, 29.0, 31.0, 18.0, 21.0, 16.0, 9.0, 10.0, 10.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011259317398071289, -0.00010884646326303482, -0.00010509975254535675, -0.00010135304182767868, -9.760633111000061e-05, -9.385962039232254e-05, -9.011290967464447e-05, -8.63661989569664e-05, -8.261948823928833e-05, -7.887277752161026e-05, -7.512606680393219e-05, -7.137935608625412e-05, -6.763264536857605e-05, -6.388593465089798e-05, -6.013922393321991e-05, -5.639251321554184e-05, -5.264580249786377e-05, -4.88990917801857e-05, -4.515238106250763e-05, -4.140567034482956e-05, -3.765895962715149e-05, -3.391224890947342e-05, -3.016553819179535e-05, -2.641882747411728e-05, -2.267211675643921e-05, -1.892540603876114e-05, -1.5178695321083069e-05, -1.1431984603404999e-05, -7.685273885726929e-06, -3.938563168048859e-06, -1.9185245037078857e-07, 3.5548582673072815e-06, 7.3015689849853516e-06, 1.1048279702663422e-05, 1.4794990420341492e-05, 1.8541701138019562e-05, 2.2288411855697632e-05, 2.6035122573375702e-05, 2.9781833291053772e-05, 3.352854400873184e-05, 3.727525472640991e-05, 4.102196544408798e-05, 4.476867616176605e-05, 4.851538687944412e-05, 5.226209759712219e-05, 5.600880831480026e-05, 5.975551903247833e-05, 6.35022297501564e-05, 6.724894046783447e-05, 7.099565118551254e-05, 7.474236190319061e-05, 7.848907262086868e-05, 8.223578333854675e-05, 8.598249405622482e-05, 8.972920477390289e-05, 9.347591549158096e-05, 9.722262620925903e-05, 0.0001009693369269371, 0.00010471604764461517, 0.00010846275836229324, 0.00011220946907997131, 0.00011595617979764938, 0.00011970289051532745, 0.00012344960123300552, 0.0001271963119506836]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 11.0, 16.0, 18.0, 24.0, 28.0, 55.0, 65.0, 103.0, 104.0, 141.0, 196.0, 306.0, 451.0, 650.0, 1047.0, 1682.0, 3328.0, 6821.0, 17371.0, 50643.0, 160878.0, 418060.0, 253953.0, 84229.0, 27243.0, 10342.0, 4560.0, 2318.0, 1342.0, 778.0, 534.0, 371.0, 233.0, 191.0, 127.0, 95.0, 51.0, 55.0, 41.0, 25.0, 12.0, 19.0, 10.0, 11.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.8837890625, -0.8575820922851562, -0.8313751220703125, -0.8051681518554688, -0.778961181640625, -0.7527542114257812, -0.7265472412109375, -0.7003402709960938, -0.67413330078125, -0.6479263305664062, -0.6217193603515625, -0.5955123901367188, -0.569305419921875, -0.5430984497070312, -0.5168914794921875, -0.49068450927734375, -0.4644775390625, -0.43827056884765625, -0.4120635986328125, -0.38585662841796875, -0.359649658203125, -0.33344268798828125, -0.3072357177734375, -0.28102874755859375, -0.25482177734375, -0.22861480712890625, -0.2024078369140625, -0.17620086669921875, -0.149993896484375, -0.12378692626953125, -0.0975799560546875, -0.07137298583984375, -0.045166015625, -0.01895904541015625, 0.0072479248046875, 0.03345489501953125, 0.059661865234375, 0.08586883544921875, 0.1120758056640625, 0.13828277587890625, 0.16448974609375, 0.19069671630859375, 0.2169036865234375, 0.24311065673828125, 0.269317626953125, 0.29552459716796875, 0.3217315673828125, 0.34793853759765625, 0.3741455078125, 0.40035247802734375, 0.4265594482421875, 0.45276641845703125, 0.478973388671875, 0.5051803588867188, 0.5313873291015625, 0.5575942993164062, 0.58380126953125, 0.6100082397460938, 0.6362152099609375, 0.6624221801757812, 0.688629150390625, 0.7148361206054688, 0.7410430908203125, 0.7672500610351562, 0.79345703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 10.0, 6.0, 13.0, 15.0, 25.0, 36.0, 37.0, 52.0, 79.0, 88.0, 151.0, 117.0, 82.0, 65.0, 50.0, 41.0, 44.0, 14.0, 13.0, 18.0, 8.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.642578125, -0.6255722045898438, -0.6085662841796875, -0.5915603637695312, -0.574554443359375, -0.5575485229492188, -0.5405426025390625, -0.5235366821289062, -0.50653076171875, -0.48952484130859375, -0.4725189208984375, -0.45551300048828125, -0.438507080078125, -0.42150115966796875, -0.4044952392578125, -0.38748931884765625, -0.3704833984375, -0.35347747802734375, -0.3364715576171875, -0.31946563720703125, -0.302459716796875, -0.28545379638671875, -0.2684478759765625, -0.25144195556640625, -0.23443603515625, -0.21743011474609375, -0.2004241943359375, -0.18341827392578125, -0.166412353515625, -0.14940643310546875, -0.1324005126953125, -0.11539459228515625, -0.098388671875, -0.08138275146484375, -0.0643768310546875, -0.04737091064453125, -0.030364990234375, -0.01335906982421875, 0.0036468505859375, 0.02065277099609375, 0.03765869140625, 0.05466461181640625, 0.0716705322265625, 0.08867645263671875, 0.105682373046875, 0.12268829345703125, 0.1396942138671875, 0.15670013427734375, 0.1737060546875, 0.19071197509765625, 0.2077178955078125, 0.22472381591796875, 0.241729736328125, 0.25873565673828125, 0.2757415771484375, 0.29274749755859375, 0.30975341796875, 0.32675933837890625, 0.3437652587890625, 0.36077117919921875, 0.377777099609375, 0.39478302001953125, 0.4117889404296875, 0.42879486083984375, 0.44580078125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 14.0, 18.0, 22.0, 37.0, 29.0, 46.0, 53.0, 69.0, 66.0, 87.0, 78.0, 82.0, 70.0, 67.0, 61.0, 48.0, 35.0, 35.0, 24.0, 17.0, 12.0, 7.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5778732299804688, -3.433126449584961, -3.288379669189453, -3.1436328887939453, -2.9988861083984375, -2.8541393280029297, -2.709392786026001, -2.564646005630493, -2.4198992252349854, -2.2751524448394775, -2.1304056644439697, -1.9856590032577515, -1.8409122228622437, -1.6961654424667358, -1.5514187812805176, -1.4066720008850098, -1.261925220489502, -1.1171784400939941, -0.9724317193031311, -0.8276849985122681, -0.6829382181167603, -0.5381914377212524, -0.3934447169303894, -0.24869799613952637, -0.10395121574401855, 0.04079553484916687, 0.1855422854423523, 0.3302890360355377, 0.47503578662872314, 0.619782567024231, 0.764529287815094, 0.909276008605957, 1.0540223121643066, 1.1987690925598145, 1.3435158729553223, 1.4882625341415405, 1.6330093145370483, 1.7777560949325562, 1.9225027561187744, 2.0672495365142822, 2.21199631690979, 2.356743097305298, 2.5014898777008057, 2.6462366580963135, 2.790983200073242, 2.93572998046875, 3.080476760864258, 3.2252235412597656, 3.3699703216552734, 3.5147171020507812, 3.659463882446289, 3.804210662841797, 3.9489574432373047, 4.0937042236328125, 4.23845100402832, 4.383197784423828, 4.527944564819336, 4.672691345214844, 4.817438125610352, 4.962184906005859, 5.106931686401367, 5.251678466796875, 5.396425247192383, 5.541172027587891, 5.68591833114624]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 9.0, 9.0, 22.0, 10.0, 14.0, 19.0, 18.0, 26.0, 30.0, 27.0, 31.0, 24.0, 40.0, 30.0, 43.0, 44.0, 40.0, 44.0, 40.0, 43.0, 44.0, 53.0, 23.0, 37.0, 37.0, 14.0, 31.0, 19.0, 28.0, 18.0, 21.0, 19.0, 16.0, 15.0, 8.0, 9.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.603392601013184, -4.45352029800415, -4.303647994995117, -4.153775691986084, -4.003903388977051, -3.8540310859680176, -3.7041587829589844, -3.554286479949951, -3.404414176940918, -3.2545418739318848, -3.1046695709228516, -2.9547972679138184, -2.804924964904785, -2.655052661895752, -2.5051803588867188, -2.3553080558776855, -2.2054355144500732, -2.05556321144104, -1.9056909084320068, -1.7558186054229736, -1.6059463024139404, -1.4560739994049072, -1.3062015771865845, -1.1563292741775513, -1.006456971168518, -0.8565846681594849, -0.7067123651504517, -0.5568400025367737, -0.4069676995277405, -0.2570953965187073, -0.1072230339050293, 0.042649269104003906, 0.1925215721130371, 0.3423938751220703, 0.4922662079334259, 0.6421385407447815, 0.7920108437538147, 0.9418831467628479, 1.0917555093765259, 1.241627812385559, 1.3915001153945923, 1.5413724184036255, 1.6912447214126587, 1.8411171436309814, 1.9909894466400146, 2.140861749649048, 2.290734052658081, 2.4406063556671143, 2.5904786586761475, 2.7403509616851807, 2.890223264694214, 3.040095567703247, 3.1899678707122803, 3.3398401737213135, 3.489712715148926, 3.639585018157959, 3.789457321166992, 3.9393296241760254, 4.089201927185059, 4.239074230194092, 4.388946533203125, 4.538818836212158, 4.688691139221191, 4.838563442230225, 4.988435745239258]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 23.0, 25.0, 17.0, 26.0, 50.0, 57.0, 70.0, 114.0, 158.0, 285.0, 379.0, 608.0, 926.0, 1418.0, 1996.0, 2778.0, 3827.0, 5062.0, 1011780.0, 5696.0, 4437.0, 3354.0, 2346.0, 1730.0, 1122.0, 778.0, 533.0, 309.0, 214.0, 130.0, 92.0, 75.0, 41.0, 27.0, 33.0, 21.0, 19.0, 10.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.396050453186035, -4.261873722076416, -4.127696514129639, -3.9935197830200195, -3.8593428134918213, -3.725165843963623, -3.590989112854004, -3.4568121433258057, -3.3226351737976074, -3.188458204269409, -3.054281234741211, -2.920104503631592, -2.7859275341033936, -2.6517505645751953, -2.517573833465576, -2.383396863937378, -2.2492198944091797, -2.1150429248809814, -1.9808660745620728, -1.846689224243164, -1.7125122547149658, -1.5783352851867676, -1.4441584348678589, -1.3099815845489502, -1.175804615020752, -1.0416276454925537, -0.907450795173645, -0.7732738852500916, -0.6390969753265381, -0.5049200654029846, -0.37074315547943115, -0.23656624555587769, -0.10238933563232422, 0.03178757429122925, 0.16596448421478271, 0.3001413941383362, 0.43431830406188965, 0.5684952139854431, 0.7026721239089966, 0.83684903383255, 0.9710259437561035, 1.1052029132843018, 1.2393797636032104, 1.3735566139221191, 1.5077335834503174, 1.6419105529785156, 1.7760874032974243, 1.910264253616333, 2.0444412231445312, 2.1786181926727295, 2.3127951622009277, 2.446971893310547, 2.581148862838745, 2.7153258323669434, 2.8495025634765625, 2.9836795330047607, 3.117856502532959, 3.2520334720611572, 3.3862104415893555, 3.5203871726989746, 3.654564142227173, 3.788741111755371, 3.9229178428649902, 4.057095050811768, 4.191271781921387]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 13.0, 17.0, 12.0, 30.0, 84.0, 172.0, 568.0, 1994.0, 12188.0, 202732.0, 51230040.0, 18953.0, 2525.0, 617.0, 215.0, 103.0, 57.0, 35.0, 19.0, 10.0, 15.0, 10.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.3125, -21.517032623291016, -20.72156524658203, -19.926097869873047, -19.130630493164062, -18.335161209106445, -17.53969383239746, -16.744226455688477, -15.948759078979492, -15.153291702270508, -14.357824325561523, -13.562355995178223, -12.766888618469238, -11.971421241760254, -11.175952911376953, -10.380485534667969, -9.585018157958984, -8.78955078125, -7.994082927703857, -7.198615074157715, -6.4031476974487305, -5.607680320739746, -4.8122124671936035, -4.016744613647461, -3.2212772369384766, -2.425809621810913, -1.6303420066833496, -0.8348743915557861, -0.039406776428222656, 0.7560608386993408, 1.5515284538269043, 2.346996307373047, 3.142465591430664, 3.9379332065582275, 4.733400821685791, 5.528868675231934, 6.324336051940918, 7.119803428649902, 7.915271282196045, 8.710739135742188, 9.506206512451172, 10.301673889160156, 11.09714126586914, 11.892609596252441, 12.688076972961426, 13.48354434967041, 14.279012680053711, 15.074480056762695, 15.86994743347168, 16.665414810180664, 17.46088218688965, 18.256349563598633, 19.05181884765625, 19.847286224365234, 20.64275360107422, 21.438220977783203, 22.233688354492188, 23.029155731201172, 23.824623107910156, 24.62009048461914, 25.415557861328125, 26.211027145385742, 27.006494522094727, 27.80196189880371, 28.597429275512695]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 13.0, 23.0, 29.0, 51.0, 76.0, 114.0, 173.0, 322.0, 496.0, 738.0, 1229.0, 2046.0, 3253.0, 5317.0, 8471.0, 13764.0, 22545.0, 36844.0, 60496.0, 97897.0, 152356.0, 228561.0, 320699.0, 407698.0, 3584658.0, 403366.0, 316463.0, 225475.0, 149588.0, 95631.0, 59263.0, 36937.0, 22229.0, 13417.0, 8189.0, 5036.0, 2916.0, 1953.0, 1127.0, 753.0, 465.0, 276.0, 197.0, 116.0, 64.0, 34.0, 32.0, 18.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.0185546875, -0.988128662109375, -0.95770263671875, -0.927276611328125, -0.8968505859375, -0.866424560546875, -0.83599853515625, -0.805572509765625, -0.775146484375, -0.744720458984375, -0.71429443359375, -0.683868408203125, -0.6534423828125, -0.623016357421875, -0.59259033203125, -0.562164306640625, -0.53173828125, -0.501312255859375, -0.47088623046875, -0.440460205078125, -0.4100341796875, -0.379608154296875, -0.34918212890625, -0.318756103515625, -0.288330078125, -0.257904052734375, -0.22747802734375, -0.197052001953125, -0.1666259765625, -0.136199951171875, -0.10577392578125, -0.075347900390625, -0.044921875, -0.014495849609375, 0.01593017578125, 0.046356201171875, 0.0767822265625, 0.107208251953125, 0.13763427734375, 0.168060302734375, 0.198486328125, 0.228912353515625, 0.25933837890625, 0.289764404296875, 0.3201904296875, 0.350616455078125, 0.38104248046875, 0.411468505859375, 0.44189453125, 0.472320556640625, 0.50274658203125, 0.533172607421875, 0.5635986328125, 0.594024658203125, 0.62445068359375, 0.654876708984375, 0.685302734375, 0.715728759765625, 0.74615478515625, 0.776580810546875, 0.8070068359375, 0.837432861328125, 0.86785888671875, 0.898284912109375, 0.9287109375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 5.0, 14.0, 11.0, 12.0, 25.0, 18.0, 15.0, 26.0, 21.0, 32.0, 26.0, 46.0, 43.0, 49.0, 58.0, 37.0, 42.0, 1065.0, 62.0, 34.0, 41.0, 46.0, 62.0, 35.0, 34.0, 26.0, 17.0, 27.0, 13.0, 9.0, 16.0, 12.0, 15.0, 3.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.8125, -23.122802734375, -22.43310546875, -21.743408203125, -21.0537109375, -20.364013671875, -19.67431640625, -18.984619140625, -18.294921875, -17.605224609375, -16.91552734375, -16.225830078125, -15.5361328125, -14.846435546875, -14.15673828125, -13.467041015625, -12.77734375, -12.087646484375, -11.39794921875, -10.708251953125, -10.0185546875, -9.328857421875, -8.63916015625, -7.949462890625, -7.259765625, -6.570068359375, -5.88037109375, -5.190673828125, -4.5009765625, -3.811279296875, -3.12158203125, -2.431884765625, -1.7421875, -1.052490234375, -0.36279296875, 0.326904296875, 1.0166015625, 1.706298828125, 2.39599609375, 3.085693359375, 3.775390625, 4.465087890625, 5.15478515625, 5.844482421875, 6.5341796875, 7.223876953125, 7.91357421875, 8.603271484375, 9.29296875, 9.982666015625, 10.67236328125, 11.362060546875, 12.0517578125, 12.741455078125, 13.43115234375, 14.120849609375, 14.810546875, 15.500244140625, 16.18994140625, 16.879638671875, 17.5693359375, 18.259033203125, 18.94873046875, 19.638427734375, 20.328125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 7.0, 19.0, 33.0, 39.0, 78.0, 128.0, 231.0, 340.0, 650.0, 936.0, 1457.0, 2365.0, 3728.0, 5734.0, 8697.0, 13410.0, 20449.0, 30954.0, 45955.0, 67120.0, 96906.0, 135646.0, 183338.0, 235026.0, 286786.0, 426930.0, 3356878.0, 325351.0, 270109.0, 218447.0, 166912.0, 121681.0, 86492.0, 59883.0, 40593.0, 27483.0, 17830.0, 11685.0, 7662.0, 4882.0, 3176.0, 2070.0, 1245.0, 804.0, 477.0, 330.0, 195.0, 112.0, 74.0, 40.0, 20.0, 17.0, 13.0, 7.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.74853515625, -0.7253875732421875, -0.702239990234375, -0.6790924072265625, -0.65594482421875, -0.6327972412109375, -0.609649658203125, -0.5865020751953125, -0.5633544921875, -0.5402069091796875, -0.517059326171875, -0.4939117431640625, -0.47076416015625, -0.4476165771484375, -0.424468994140625, -0.4013214111328125, -0.378173828125, -0.3550262451171875, -0.331878662109375, -0.3087310791015625, -0.28558349609375, -0.2624359130859375, -0.239288330078125, -0.2161407470703125, -0.1929931640625, -0.1698455810546875, -0.146697998046875, -0.1235504150390625, -0.10040283203125, -0.0772552490234375, -0.054107666015625, -0.0309600830078125, -0.0078125, 0.0153350830078125, 0.038482666015625, 0.0616302490234375, 0.08477783203125, 0.1079254150390625, 0.131072998046875, 0.1542205810546875, 0.1773681640625, 0.2005157470703125, 0.223663330078125, 0.2468109130859375, 0.26995849609375, 0.2931060791015625, 0.316253662109375, 0.3394012451171875, 0.362548828125, 0.3856964111328125, 0.408843994140625, 0.4319915771484375, 0.45513916015625, 0.4782867431640625, 0.501434326171875, 0.5245819091796875, 0.5477294921875, 0.5708770751953125, 0.594024658203125, 0.6171722412109375, 0.64031982421875, 0.6634674072265625, 0.686614990234375, 0.7097625732421875, 0.73291015625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 5.0, 10.0, 11.0, 5.0, 10.0, 20.0, 19.0, 19.0, 29.0, 22.0, 38.0, 29.0, 28.0, 35.0, 48.0, 41.0, 37.0, 32.0, 674.0, 428.0, 32.0, 41.0, 34.0, 44.0, 30.0, 21.0, 34.0, 21.0, 30.0, 14.0, 20.0, 26.0, 16.0, 21.0, 16.0, 10.0, 17.0, 10.0, 7.0, 8.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.9609375, -12.5675048828125, -12.174072265625, -11.7806396484375, -11.38720703125, -10.9937744140625, -10.600341796875, -10.2069091796875, -9.8134765625, -9.4200439453125, -9.026611328125, -8.6331787109375, -8.23974609375, -7.8463134765625, -7.452880859375, -7.0594482421875, -6.666015625, -6.2725830078125, -5.879150390625, -5.4857177734375, -5.09228515625, -4.6988525390625, -4.305419921875, -3.9119873046875, -3.5185546875, -3.1251220703125, -2.731689453125, -2.3382568359375, -1.94482421875, -1.5513916015625, -1.157958984375, -0.7645263671875, -0.37109375, 0.0223388671875, 0.415771484375, 0.8092041015625, 1.20263671875, 1.5960693359375, 1.989501953125, 2.3829345703125, 2.7763671875, 3.1697998046875, 3.563232421875, 3.9566650390625, 4.35009765625, 4.7435302734375, 5.136962890625, 5.5303955078125, 5.923828125, 6.3172607421875, 6.710693359375, 7.1041259765625, 7.49755859375, 7.8909912109375, 8.284423828125, 8.6778564453125, 9.0712890625, 9.4647216796875, 9.858154296875, 10.2515869140625, 10.64501953125, 11.0384521484375, 11.431884765625, 11.8253173828125, 12.21875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 7.0, 12.0, 15.0, 17.0, 40.0, 48.0, 68.0, 89.0, 156.0, 211.0, 350.0, 525.0, 732.0, 1131.0, 1729.0, 2702.0, 4143.0, 6706.0, 10656.0, 17457.0, 28159.0, 44590.0, 70957.0, 117416.0, 5560456.0, 185104.0, 88118.0, 56082.0, 35309.0, 21781.0, 13537.0, 8393.0, 5285.0, 3313.0, 2091.0, 1346.0, 917.0, 585.0, 358.0, 287.0, 177.0, 124.0, 83.0, 50.0, 45.0, 26.0, 25.0, 14.0, 10.0, 3.0, 4.0, 2.0, 2.0], "bins": [-2.267578125, -2.2041168212890625, -2.140655517578125, -2.0771942138671875, -2.01373291015625, -1.9502716064453125, -1.886810302734375, -1.8233489990234375, -1.7598876953125, -1.6964263916015625, -1.632965087890625, -1.5695037841796875, -1.50604248046875, -1.4425811767578125, -1.379119873046875, -1.3156585693359375, -1.252197265625, -1.1887359619140625, -1.125274658203125, -1.0618133544921875, -0.99835205078125, -0.9348907470703125, -0.871429443359375, -0.8079681396484375, -0.7445068359375, -0.6810455322265625, -0.617584228515625, -0.5541229248046875, -0.49066162109375, -0.4272003173828125, -0.363739013671875, -0.3002777099609375, -0.23681640625, -0.1733551025390625, -0.109893798828125, -0.0464324951171875, 0.01702880859375, 0.0804901123046875, 0.143951416015625, 0.2074127197265625, 0.2708740234375, 0.3343353271484375, 0.397796630859375, 0.4612579345703125, 0.52471923828125, 0.5881805419921875, 0.651641845703125, 0.7151031494140625, 0.778564453125, 0.8420257568359375, 0.905487060546875, 0.9689483642578125, 1.03240966796875, 1.0958709716796875, 1.159332275390625, 1.2227935791015625, 1.2862548828125, 1.3497161865234375, 1.413177490234375, 1.4766387939453125, 1.54010009765625, 1.6035614013671875, 1.667022705078125, 1.7304840087890625, 1.7939453125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 8.0, 6.0, 4.0, 13.0, 10.0, 12.0, 17.0, 15.0, 22.0, 18.0, 19.0, 32.0, 41.0, 33.0, 25.0, 34.0, 47.0, 36.0, 43.0, 78.0, 1031.0, 50.0, 38.0, 27.0, 36.0, 33.0, 34.0, 39.0, 36.0, 22.0, 32.0, 23.0, 17.0, 15.0, 12.0, 15.0, 7.0, 9.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.11181640625, -8.8017578125, -8.49169921875, -8.181640625, -7.87158203125, -7.5615234375, -7.25146484375, -6.94140625, -6.63134765625, -6.3212890625, -6.01123046875, -5.701171875, -5.39111328125, -5.0810546875, -4.77099609375, -4.4609375, -4.15087890625, -3.8408203125, -3.53076171875, -3.220703125, -2.91064453125, -2.6005859375, -2.29052734375, -1.98046875, -1.67041015625, -1.3603515625, -1.05029296875, -0.740234375, -0.43017578125, -0.1201171875, 0.18994140625, 0.5, 0.81005859375, 1.1201171875, 1.43017578125, 1.740234375, 2.05029296875, 2.3603515625, 2.67041015625, 2.98046875, 3.29052734375, 3.6005859375, 3.91064453125, 4.220703125, 4.53076171875, 4.8408203125, 5.15087890625, 5.4609375, 5.77099609375, 6.0810546875, 6.39111328125, 6.701171875, 7.01123046875, 7.3212890625, 7.63134765625, 7.94140625, 8.25146484375, 8.5615234375, 8.87158203125, 9.181640625, 9.49169921875, 9.8017578125, 10.11181640625, 10.421875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 9.0, 19.0, 26.0, 55.0, 90.0, 151.0, 212.0, 185.0, 93.0, 60.0, 31.0, 16.0, 15.0, 9.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.20254135131836, -12.558789253234863, -11.91503620147705, -11.271284103393555, -10.627531051635742, -9.983778953552246, -9.34002685546875, -8.696273803710938, -8.052521705627441, -7.408769130706787, -6.765016555786133, -6.121264457702637, -5.477511882781982, -4.833759307861328, -4.190007209777832, -3.5462546348571777, -2.9025020599365234, -2.258749485015869, -1.614997148513794, -0.9712446928024292, -0.32749223709106445, 0.31626033782958984, 0.960012674331665, 1.6037650108337402, 2.2475175857543945, 2.891270160675049, 3.535022497177124, 4.178774833679199, 4.8225274085998535, 5.466279983520508, 6.110032081604004, 6.753784656524658, 7.3975372314453125, 8.041289329528809, 8.685042381286621, 9.328794479370117, 9.97254753112793, 10.616299629211426, 11.260051727294922, 11.903804779052734, 12.54755687713623, 13.191308975219727, 13.835062026977539, 14.478814125061035, 15.122566223144531, 15.766319274902344, 16.410072326660156, 17.053823471069336, 17.69757652282715, 18.34132957458496, 18.98508071899414, 19.628833770751953, 20.272586822509766, 20.916339874267578, 21.560091018676758, 22.20384407043457, 22.84759521484375, 23.491348266601562, 24.135099411010742, 24.778852462768555, 25.422605514526367, 26.066356658935547, 26.71010971069336, 27.353862762451172, 27.997615814208984]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 4.0, 3.0, 4.0, 11.0, 10.0, 14.0, 16.0, 29.0, 18.0, 23.0, 20.0, 31.0, 34.0, 31.0, 35.0, 43.0, 49.0, 49.0, 43.0, 40.0, 58.0, 44.0, 43.0, 33.0, 48.0, 42.0, 32.0, 30.0, 23.0, 27.0, 21.0, 19.0, 15.0, 16.0, 9.0, 4.0, 6.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.096481323242188, -17.58935546875, -17.08222770690918, -16.575101852416992, -16.067975997924805, -15.5608491897583, -15.053722381591797, -14.54659652709961, -14.039470672607422, -13.532343864440918, -13.02521800994873, -12.518091201782227, -12.010965347290039, -11.503838539123535, -10.996711730957031, -10.489585876464844, -9.98245906829834, -9.475332260131836, -8.968206405639648, -8.461079597473145, -7.953953742980957, -7.446826934814453, -6.939700603485107, -6.432574272155762, -5.925447940826416, -5.41832160949707, -4.911195278167725, -4.404068946838379, -3.896942377090454, -3.3898160457611084, -2.8826894760131836, -2.375563144683838, -1.8684368133544922, -1.3613104820251465, -0.8541840314865112, -0.347057580947876, 0.16006875038146973, 0.6671950817108154, 1.1743216514587402, 1.681447982788086, 2.1885743141174316, 2.6957006454467773, 3.202826976776123, 3.709953546524048, 4.217080116271973, 4.72420597076416, 5.231332778930664, 5.73845911026001, 6.2455854415893555, 6.752711772918701, 7.259838104248047, 7.766964912414551, 8.274090766906738, 8.781217575073242, 9.28834342956543, 9.795470237731934, 10.302597045898438, 10.809723854064941, 11.316849708557129, 11.823976516723633, 12.33110237121582, 12.838229179382324, 13.345355987548828, 13.852481842041016, 14.359607696533203]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 6.0, 4.0, 4.0, 7.0, 18.0, 20.0, 24.0, 42.0, 59.0, 72.0, 99.0, 165.0, 201.0, 282.0, 425.0, 580.0, 877.0, 1172.0, 1877.0, 3025.0, 5195.0, 9301.0, 18981.0, 48758.0, 317071.0, 3698238.0, 51591.0, 18082.0, 8103.0, 4137.0, 2266.0, 1363.0, 815.0, 520.0, 296.0, 191.0, 135.0, 94.0, 62.0, 42.0, 35.0, 19.0, 9.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.40771484375, -0.3960838317871094, -0.38445281982421875, -0.3728218078613281, -0.3611907958984375, -0.3495597839355469, -0.33792877197265625, -0.3262977600097656, -0.314666748046875, -0.3030357360839844, -0.29140472412109375, -0.2797737121582031, -0.2681427001953125, -0.2565116882324219, -0.24488067626953125, -0.23324966430664062, -0.22161865234375, -0.20998764038085938, -0.19835662841796875, -0.18672561645507812, -0.1750946044921875, -0.16346359252929688, -0.15183258056640625, -0.14020156860351562, -0.128570556640625, -0.11693954467773438, -0.10530853271484375, -0.09367752075195312, -0.0820465087890625, -0.07041549682617188, -0.05878448486328125, -0.047153472900390625, -0.0355224609375, -0.023891448974609375, -0.01226043701171875, -0.000629425048828125, 0.0110015869140625, 0.022632598876953125, 0.03426361083984375, 0.045894622802734375, 0.057525634765625, 0.06915664672851562, 0.08078765869140625, 0.09241867065429688, 0.1040496826171875, 0.11568069458007812, 0.12731170654296875, 0.13894271850585938, 0.15057373046875, 0.16220474243164062, 0.17383575439453125, 0.18546676635742188, 0.1970977783203125, 0.20872879028320312, 0.22035980224609375, 0.23199081420898438, 0.243621826171875, 0.2552528381347656, 0.26688385009765625, 0.2785148620605469, 0.2901458740234375, 0.3017768859863281, 0.31340789794921875, 0.3250389099121094, 0.336669921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 6.0, 7.0, 5.0, 6.0, 16.0, 9.0, 12.0, 16.0, 28.0, 774.0, 19.0, 14.0, 14.0, 5.0, 8.0, 6.0, 11.0, 8.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1368408203125, -0.1331472396850586, -0.1294536590576172, -0.12576007843017578, -0.12206649780273438, -0.11837291717529297, -0.11467933654785156, -0.11098575592041016, -0.10729217529296875, -0.10359859466552734, -0.09990501403808594, -0.09621143341064453, -0.09251785278320312, -0.08882427215576172, -0.08513069152832031, -0.0814371109008789, -0.0777435302734375, -0.0740499496459961, -0.07035636901855469, -0.06666278839111328, -0.06296920776367188, -0.05927562713623047, -0.05558204650878906, -0.051888465881347656, -0.04819488525390625, -0.044501304626464844, -0.04080772399902344, -0.03711414337158203, -0.033420562744140625, -0.02972698211669922, -0.026033401489257812, -0.022339820861816406, -0.018646240234375, -0.014952659606933594, -0.011259078979492188, -0.007565498352050781, -0.003871917724609375, -0.00017833709716796875, 0.0035152435302734375, 0.007208824157714844, 0.01090240478515625, 0.014595985412597656, 0.018289566040039062, 0.02198314666748047, 0.025676727294921875, 0.02937030792236328, 0.03306388854980469, 0.036757469177246094, 0.0404510498046875, 0.044144630432128906, 0.04783821105957031, 0.05153179168701172, 0.055225372314453125, 0.05891895294189453, 0.06261253356933594, 0.06630611419677734, 0.06999969482421875, 0.07369327545166016, 0.07738685607910156, 0.08108043670654297, 0.08477401733398438, 0.08846759796142578, 0.09216117858886719, 0.0958547592163086, 0.09954833984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 1.0, 1.0, 11.0, 11.0, 10.0, 21.0, 36.0, 48.0, 86.0, 121.0, 188.0, 313.0, 513.0, 1064.0, 2338.0, 5603.0, 15333.0, 50430.0, 226399.0, 2730020.0, 976448.0, 132523.0, 33695.0, 11067.0, 4323.0, 1792.0, 876.0, 448.0, 219.0, 120.0, 80.0, 43.0, 28.0, 28.0, 15.0, 11.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.414794921875, -0.40383148193359375, -0.3928680419921875, -0.38190460205078125, -0.370941162109375, -0.35997772216796875, -0.3490142822265625, -0.33805084228515625, -0.32708740234375, -0.31612396240234375, -0.3051605224609375, -0.29419708251953125, -0.283233642578125, -0.27227020263671875, -0.2613067626953125, -0.25034332275390625, -0.2393798828125, -0.22841644287109375, -0.2174530029296875, -0.20648956298828125, -0.195526123046875, -0.18456268310546875, -0.1735992431640625, -0.16263580322265625, -0.15167236328125, -0.14070892333984375, -0.1297454833984375, -0.11878204345703125, -0.107818603515625, -0.09685516357421875, -0.0858917236328125, -0.07492828369140625, -0.06396484375, -0.05300140380859375, -0.0420379638671875, -0.03107452392578125, -0.020111083984375, -0.00914764404296875, 0.0018157958984375, 0.01277923583984375, 0.02374267578125, 0.03470611572265625, 0.0456695556640625, 0.05663299560546875, 0.067596435546875, 0.07855987548828125, 0.0895233154296875, 0.10048675537109375, 0.1114501953125, 0.12241363525390625, 0.1333770751953125, 0.14434051513671875, 0.155303955078125, 0.16626739501953125, 0.1772308349609375, 0.18819427490234375, 0.19915771484375, 0.21012115478515625, 0.2210845947265625, 0.23204803466796875, 0.243011474609375, 0.25397491455078125, 0.2649383544921875, 0.27590179443359375, 0.286865234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 4.0, 11.0, 6.0, 17.0, 18.0, 30.0, 39.0, 58.0, 78.0, 82.0, 136.0, 202.0, 296.0, 520.0, 1164.0, 451.0, 271.0, 184.0, 130.0, 113.0, 67.0, 48.0, 46.0, 23.0, 24.0, 20.0, 3.0, 7.0, 6.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21875, -0.2133350372314453, -0.20792007446289062, -0.20250511169433594, -0.19709014892578125, -0.19167518615722656, -0.18626022338867188, -0.1808452606201172, -0.1754302978515625, -0.1700153350830078, -0.16460037231445312, -0.15918540954589844, -0.15377044677734375, -0.14835548400878906, -0.14294052124023438, -0.1375255584716797, -0.132110595703125, -0.1266956329345703, -0.12128067016601562, -0.11586570739746094, -0.11045074462890625, -0.10503578186035156, -0.09962081909179688, -0.09420585632324219, -0.0887908935546875, -0.08337593078613281, -0.07796096801757812, -0.07254600524902344, -0.06713104248046875, -0.06171607971191406, -0.056301116943359375, -0.05088615417480469, -0.04547119140625, -0.04005622863769531, -0.034641265869140625, -0.029226303100585938, -0.02381134033203125, -0.018396377563476562, -0.012981414794921875, -0.0075664520263671875, -0.0021514892578125, 0.0032634735107421875, 0.008678436279296875, 0.014093399047851562, 0.01950836181640625, 0.024923324584960938, 0.030338287353515625, 0.03575325012207031, 0.041168212890625, 0.04658317565917969, 0.051998138427734375, 0.05741310119628906, 0.06282806396484375, 0.06824302673339844, 0.07365798950195312, 0.07907295227050781, 0.0844879150390625, 0.08990287780761719, 0.09531784057617188, 0.10073280334472656, 0.10614776611328125, 0.11156272888183594, 0.11697769165039062, 0.12239265441894531, 0.1278076171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 17.0, 24.0, 52.0, 96.0, 184.0, 270.0, 157.0, 90.0, 59.0, 20.0, 10.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4969843029975891, -0.4568801522254944, -0.41677597165107727, -0.37667182087898254, -0.33656764030456543, -0.2964634895324707, -0.256359338760376, -0.21625515818595886, -0.17615100741386414, -0.13604684174060822, -0.09594268351793289, -0.05583852529525757, -0.015734359622001648, 0.024369806051254272, 0.064473956823349, 0.10457813739776611, 0.14468228816986084, 0.18478645384311676, 0.22489061951637268, 0.2649947702884674, 0.3050989508628845, 0.34520310163497925, 0.385307252407074, 0.4254114329814911, 0.4655155837535858, 0.5056197643280029, 0.5457239151000977, 0.5858280658721924, 0.6259322166442871, 0.6660363674163818, 0.7061405181884766, 0.7462447285652161, 0.7863489389419556, 0.8264530897140503, 0.866557240486145, 0.9066613912582397, 0.9467656016349792, 0.986869752407074, 1.0269739627838135, 1.0670781135559082, 1.107182264328003, 1.1472864151000977, 1.1873905658721924, 1.227494716644287, 1.2675988674163818, 1.3077030181884766, 1.3478071689605713, 1.3879114389419556, 1.4280154705047607, 1.4681196212768555, 1.5082237720489502, 1.548327922821045, 1.5884320735931396, 1.6285362243652344, 1.668640375137329, 1.7087446451187134, 1.748848795890808, 1.7889529466629028, 1.8290570974349976, 1.8691612482070923, 1.909265398979187, 1.9493696689605713, 1.989473819732666, 2.0295779705047607, 2.0696821212768555]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 10.0, 9.0, 14.0, 11.0, 17.0, 19.0, 15.0, 21.0, 34.0, 41.0, 31.0, 37.0, 52.0, 44.0, 69.0, 41.0, 56.0, 39.0, 43.0, 53.0, 53.0, 39.0, 45.0, 43.0, 31.0, 21.0, 27.0, 31.0, 14.0, 14.0, 9.0, 3.0, 6.0, 6.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8590982556343079, -0.8344303965568542, -0.8097624778747559, -0.7850946187973022, -0.7604267001152039, -0.7357588410377502, -0.7110909223556519, -0.6864230632781982, -0.6617552042007446, -0.637087345123291, -0.6124194264411926, -0.587751567363739, -0.5630836486816406, -0.538415789604187, -0.5137479305267334, -0.489080011844635, -0.4644120931625366, -0.4397442042827606, -0.4150763154029846, -0.390408456325531, -0.3657405376434326, -0.341072678565979, -0.316404789686203, -0.291736900806427, -0.267069011926651, -0.242401123046875, -0.217733234167099, -0.1930653601884842, -0.1683974713087082, -0.1437295824289322, -0.11906170845031738, -0.09439381957054138, -0.06972599029541016, -0.045058105140924454, -0.02039021998643875, 0.004277661442756653, 0.028945550322532654, 0.053613439202308655, 0.07828131318092346, 0.10294920206069946, 0.12761709094047546, 0.15228497982025146, 0.17695286870002747, 0.20162074267864227, 0.22628863155841827, 0.25095653533935547, 0.2756243944168091, 0.3002922832965851, 0.3249601721763611, 0.3496280610561371, 0.3742959499359131, 0.3989638090133667, 0.4236317276954651, 0.4482995867729187, 0.4729674756526947, 0.4976353645324707, 0.5223032236099243, 0.5469710826873779, 0.5716390013694763, 0.5963068604469299, 0.6209747791290283, 0.6456426382064819, 0.6703104972839355, 0.6949784159660339, 0.7196463346481323]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 7.0, 12.0, 24.0, 20.0, 32.0, 51.0, 56.0, 84.0, 126.0, 155.0, 198.0, 274.0, 401.0, 576.0, 840.0, 1211.0, 1929.0, 2994.0, 4859.0, 8539.0, 16043.0, 42378.0, 723566.0, 187425.0, 26672.0, 11907.0, 6726.0, 4022.0, 2489.0, 1511.0, 1056.0, 698.0, 487.0, 326.0, 244.0, 165.0, 121.0, 98.0, 64.0, 46.0, 38.0, 22.0, 15.0, 17.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.262939453125, -0.2541160583496094, -0.24529266357421875, -0.23646926879882812, -0.2276458740234375, -0.21882247924804688, -0.20999908447265625, -0.20117568969726562, -0.192352294921875, -0.18352890014648438, -0.17470550537109375, -0.16588211059570312, -0.1570587158203125, -0.14823532104492188, -0.13941192626953125, -0.13058853149414062, -0.12176513671875, -0.11294174194335938, -0.10411834716796875, -0.09529495239257812, -0.0864715576171875, -0.07764816284179688, -0.06882476806640625, -0.060001373291015625, -0.051177978515625, -0.042354583740234375, -0.03353118896484375, -0.024707794189453125, -0.0158843994140625, -0.007061004638671875, 0.00176239013671875, 0.010585784912109375, 0.0194091796875, 0.028232574462890625, 0.03705596923828125, 0.045879364013671875, 0.0547027587890625, 0.06352615356445312, 0.07234954833984375, 0.08117294311523438, 0.089996337890625, 0.09881973266601562, 0.10764312744140625, 0.11646652221679688, 0.1252899169921875, 0.13411331176757812, 0.14293670654296875, 0.15176010131835938, 0.16058349609375, 0.16940689086914062, 0.17823028564453125, 0.18705368041992188, 0.1958770751953125, 0.20470046997070312, 0.21352386474609375, 0.22234725952148438, 0.231170654296875, 0.23999404907226562, 0.24881744384765625, 0.2576408386230469, 0.2664642333984375, 0.2752876281738281, 0.28411102294921875, 0.2929344177246094, 0.3017578125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 7.0, 5.0, 5.0, 8.0, 8.0, 7.0, 9.0, 18.0, 32.0, 97.0, 299.0, 296.0, 110.0, 23.0, 16.0, 9.0, 5.0, 6.0, 5.0, 8.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12436866760253906, -0.12068557739257812, -0.11700248718261719, -0.11331939697265625, -0.10963630676269531, -0.10595321655273438, -0.10227012634277344, -0.0985870361328125, -0.09490394592285156, -0.09122085571289062, -0.08753776550292969, -0.08385467529296875, -0.08017158508300781, -0.07648849487304688, -0.07280540466308594, -0.069122314453125, -0.06543922424316406, -0.061756134033203125, -0.05807304382324219, -0.05438995361328125, -0.05070686340332031, -0.047023773193359375, -0.04334068298339844, -0.0396575927734375, -0.03597450256347656, -0.032291412353515625, -0.028608322143554688, -0.02492523193359375, -0.021242141723632812, -0.017559051513671875, -0.013875961303710938, -0.01019287109375, -0.0065097808837890625, -0.002826690673828125, 0.0008563995361328125, 0.00453948974609375, 0.008222579956054688, 0.011905670166015625, 0.015588760375976562, 0.0192718505859375, 0.022954940795898438, 0.026638031005859375, 0.030321121215820312, 0.03400421142578125, 0.03768730163574219, 0.041370391845703125, 0.04505348205566406, 0.048736572265625, 0.05241966247558594, 0.056102752685546875, 0.05978584289550781, 0.06346893310546875, 0.06715202331542969, 0.07083511352539062, 0.07451820373535156, 0.0782012939453125, 0.08188438415527344, 0.08556747436523438, 0.08925056457519531, 0.09293365478515625, 0.09661674499511719, 0.10029983520507812, 0.10398292541503906, 0.107666015625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 9.0, 14.0, 26.0, 38.0, 67.0, 154.0, 332.0, 868.0, 2377.0, 6781.0, 22696.0, 88537.0, 402214.0, 402715.0, 88736.0, 22192.0, 6831.0, 2404.0, 854.0, 350.0, 164.0, 80.0, 52.0, 26.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.55810546875, -0.5426025390625, -0.527099609375, -0.5115966796875, -0.49609375, -0.4805908203125, -0.465087890625, -0.4495849609375, -0.43408203125, -0.4185791015625, -0.403076171875, -0.3875732421875, -0.3720703125, -0.3565673828125, -0.341064453125, -0.3255615234375, -0.31005859375, -0.2945556640625, -0.279052734375, -0.2635498046875, -0.248046875, -0.2325439453125, -0.217041015625, -0.2015380859375, -0.18603515625, -0.1705322265625, -0.155029296875, -0.1395263671875, -0.1240234375, -0.1085205078125, -0.093017578125, -0.0775146484375, -0.06201171875, -0.0465087890625, -0.031005859375, -0.0155029296875, 0.0, 0.0155029296875, 0.031005859375, 0.0465087890625, 0.06201171875, 0.0775146484375, 0.093017578125, 0.1085205078125, 0.1240234375, 0.1395263671875, 0.155029296875, 0.1705322265625, 0.18603515625, 0.2015380859375, 0.217041015625, 0.2325439453125, 0.248046875, 0.2635498046875, 0.279052734375, 0.2945556640625, 0.31005859375, 0.3255615234375, 0.341064453125, 0.3565673828125, 0.3720703125, 0.3875732421875, 0.403076171875, 0.4185791015625, 0.43408203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 13.0, 12.0, 9.0, 7.0, 24.0, 19.0, 31.0, 23.0, 21.0, 30.0, 36.0, 40.0, 33.0, 44.0, 35.0, 31.0, 32.0, 45.0, 40.0, 33.0, 39.0, 30.0, 38.0, 46.0, 31.0, 30.0, 28.0, 25.0, 34.0, 22.0, 19.0, 13.0, 14.0, 10.0, 10.0, 12.0, 2.0, 6.0, 7.0, 5.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.419921875, -0.4068756103515625, -0.393829345703125, -0.3807830810546875, -0.36773681640625, -0.3546905517578125, -0.341644287109375, -0.3285980224609375, -0.3155517578125, -0.3025054931640625, -0.289459228515625, -0.2764129638671875, -0.26336669921875, -0.2503204345703125, -0.237274169921875, -0.2242279052734375, -0.211181640625, -0.1981353759765625, -0.185089111328125, -0.1720428466796875, -0.15899658203125, -0.1459503173828125, -0.132904052734375, -0.1198577880859375, -0.1068115234375, -0.0937652587890625, -0.080718994140625, -0.0676727294921875, -0.05462646484375, -0.0415802001953125, -0.028533935546875, -0.0154876708984375, -0.00244140625, 0.0106048583984375, 0.023651123046875, 0.0366973876953125, 0.04974365234375, 0.0627899169921875, 0.075836181640625, 0.0888824462890625, 0.1019287109375, 0.1149749755859375, 0.128021240234375, 0.1410675048828125, 0.15411376953125, 0.1671600341796875, 0.180206298828125, 0.1932525634765625, 0.206298828125, 0.2193450927734375, 0.232391357421875, 0.2454376220703125, 0.25848388671875, 0.2715301513671875, 0.284576416015625, 0.2976226806640625, 0.3106689453125, 0.3237152099609375, 0.336761474609375, 0.3498077392578125, 0.36285400390625, 0.3759002685546875, 0.388946533203125, 0.4019927978515625, 0.4150390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 2.0, 4.0, 11.0, 5.0, 21.0, 29.0, 48.0, 117.0, 214.0, 634.0, 2497.0, 57799.0, 979611.0, 5885.0, 1057.0, 329.0, 126.0, 61.0, 39.0, 26.0, 12.0, 10.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80224609375, -0.7780838012695312, -0.7539215087890625, -0.7297592163085938, -0.705596923828125, -0.6814346313476562, -0.6572723388671875, -0.6331100463867188, -0.60894775390625, -0.5847854614257812, -0.5606231689453125, -0.5364608764648438, -0.512298583984375, -0.48813629150390625, -0.4639739990234375, -0.43981170654296875, -0.4156494140625, -0.39148712158203125, -0.3673248291015625, -0.34316253662109375, -0.319000244140625, -0.29483795166015625, -0.2706756591796875, -0.24651336669921875, -0.22235107421875, -0.19818878173828125, -0.1740264892578125, -0.14986419677734375, -0.125701904296875, -0.10153961181640625, -0.0773773193359375, -0.05321502685546875, -0.029052734375, -0.00489044189453125, 0.0192718505859375, 0.04343414306640625, 0.067596435546875, 0.09175872802734375, 0.1159210205078125, 0.14008331298828125, 0.16424560546875, 0.18840789794921875, 0.2125701904296875, 0.23673248291015625, 0.260894775390625, 0.28505706787109375, 0.3092193603515625, 0.33338165283203125, 0.3575439453125, 0.38170623779296875, 0.4058685302734375, 0.43003082275390625, 0.454193115234375, 0.47835540771484375, 0.5025177001953125, 0.5266799926757812, 0.55084228515625, 0.5750045776367188, 0.5991668701171875, 0.6233291625976562, 0.647491455078125, 0.6716537475585938, 0.6958160400390625, 0.7199783325195312, 0.744140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 2.0, 14.0, 14.0, 33.0, 36.0, 39.0, 76.0, 122.0, 170.0, 152.0, 122.0, 74.0, 56.0, 20.0, 20.0, 10.0, 11.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.357929229736328e-05, -9.117275476455688e-05, -8.876621723175049e-05, -8.635967969894409e-05, -8.39531421661377e-05, -8.15466046333313e-05, -7.91400671005249e-05, -7.67335295677185e-05, -7.432699203491211e-05, -7.192045450210571e-05, -6.951391696929932e-05, -6.710737943649292e-05, -6.470084190368652e-05, -6.229430437088013e-05, -5.988776683807373e-05, -5.7481229305267334e-05, -5.507469177246094e-05, -5.266815423965454e-05, -5.0261616706848145e-05, -4.785507917404175e-05, -4.544854164123535e-05, -4.3042004108428955e-05, -4.063546657562256e-05, -3.822892904281616e-05, -3.5822391510009766e-05, -3.341585397720337e-05, -3.100931644439697e-05, -2.8602778911590576e-05, -2.619624137878418e-05, -2.3789703845977783e-05, -2.1383166313171387e-05, -1.897662878036499e-05, -1.6570091247558594e-05, -1.4163553714752197e-05, -1.17570161819458e-05, -9.350478649139404e-06, -6.943941116333008e-06, -4.537403583526611e-06, -2.130866050720215e-06, 2.7567148208618164e-07, 2.682209014892578e-06, 5.088746547698975e-06, 7.495284080505371e-06, 9.901821613311768e-06, 1.2308359146118164e-05, 1.471489667892456e-05, 1.7121434211730957e-05, 1.9527971744537354e-05, 2.193450927734375e-05, 2.4341046810150146e-05, 2.6747584342956543e-05, 2.915412187576294e-05, 3.1560659408569336e-05, 3.396719694137573e-05, 3.637373447418213e-05, 3.8780272006988525e-05, 4.118680953979492e-05, 4.359334707260132e-05, 4.5999884605407715e-05, 4.840642213821411e-05, 5.081295967102051e-05, 5.3219497203826904e-05, 5.56260347366333e-05, 5.80325722694397e-05, 6.0439109802246094e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 1.0, 7.0, 7.0, 8.0, 15.0, 17.0, 23.0, 42.0, 53.0, 67.0, 96.0, 161.0, 196.0, 303.0, 498.0, 808.0, 1543.0, 2925.0, 6619.0, 18858.0, 79650.0, 567033.0, 299858.0, 46422.0, 12859.0, 4988.0, 2262.0, 1225.0, 671.0, 478.0, 269.0, 196.0, 113.0, 84.0, 54.0, 40.0, 29.0, 21.0, 15.0, 12.0, 8.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13307952880859375, -0.1284637451171875, -0.12384796142578125, -0.119232177734375, -0.11461639404296875, -0.1100006103515625, -0.10538482666015625, -0.10076904296875, -0.09615325927734375, -0.0915374755859375, -0.08692169189453125, -0.082305908203125, -0.07769012451171875, -0.0730743408203125, -0.06845855712890625, -0.0638427734375, -0.05922698974609375, -0.0546112060546875, -0.04999542236328125, -0.045379638671875, -0.04076385498046875, -0.0361480712890625, -0.03153228759765625, -0.02691650390625, -0.02230072021484375, -0.0176849365234375, -0.01306915283203125, -0.008453369140625, -0.00383758544921875, 0.0007781982421875, 0.00539398193359375, 0.010009765625, 0.01462554931640625, 0.0192413330078125, 0.02385711669921875, 0.028472900390625, 0.03308868408203125, 0.0377044677734375, 0.04232025146484375, 0.04693603515625, 0.05155181884765625, 0.0561676025390625, 0.06078338623046875, 0.065399169921875, 0.07001495361328125, 0.0746307373046875, 0.07924652099609375, 0.0838623046875, 0.08847808837890625, 0.0930938720703125, 0.09770965576171875, 0.102325439453125, 0.10694122314453125, 0.1115570068359375, 0.11617279052734375, 0.12078857421875, 0.12540435791015625, 0.1300201416015625, 0.13463592529296875, 0.139251708984375, 0.14386749267578125, 0.1484832763671875, 0.15309906005859375, 0.15771484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 9.0, 10.0, 26.0, 45.0, 64.0, 96.0, 131.0, 143.0, 148.0, 95.0, 78.0, 41.0, 31.0, 21.0, 15.0, 12.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.31103515625, -0.3033618927001953, -0.2956886291503906, -0.28801536560058594, -0.28034210205078125, -0.27266883850097656, -0.2649955749511719, -0.2573223114013672, -0.2496490478515625, -0.2419757843017578, -0.23430252075195312, -0.22662925720214844, -0.21895599365234375, -0.21128273010253906, -0.20360946655273438, -0.1959362030029297, -0.188262939453125, -0.1805896759033203, -0.17291641235351562, -0.16524314880371094, -0.15756988525390625, -0.14989662170410156, -0.14222335815429688, -0.1345500946044922, -0.1268768310546875, -0.11920356750488281, -0.11153030395507812, -0.10385704040527344, -0.09618377685546875, -0.08851051330566406, -0.08083724975585938, -0.07316398620605469, -0.06549072265625, -0.05781745910644531, -0.050144195556640625, -0.04247093200683594, -0.03479766845703125, -0.027124404907226562, -0.019451141357421875, -0.011777877807617188, -0.0041046142578125, 0.0035686492919921875, 0.011241912841796875, 0.018915176391601562, 0.02658843994140625, 0.03426170349121094, 0.041934967041015625, 0.04960823059082031, 0.057281494140625, 0.06495475769042969, 0.07262802124023438, 0.08030128479003906, 0.08797454833984375, 0.09564781188964844, 0.10332107543945312, 0.11099433898925781, 0.1186676025390625, 0.1263408660888672, 0.13401412963867188, 0.14168739318847656, 0.14936065673828125, 0.15703392028808594, 0.16470718383789062, 0.1723804473876953, 0.1800537109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 19.0, 27.0, 50.0, 101.0, 137.0, 208.0, 193.0, 90.0, 57.0, 19.0, 24.0, 14.0, 7.0, 11.0, 4.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.763348340988159, -3.6514241695404053, -3.5394997596740723, -3.4275755882263184, -3.3156511783599854, -3.2037270069122314, -3.0918025970458984, -2.9798784255981445, -2.8679540157318115, -2.7560298442840576, -2.6441054344177246, -2.5321812629699707, -2.4202568531036377, -2.308332681655884, -2.196408271789551, -2.084484100341797, -1.9725598096847534, -1.86063551902771, -1.7487112283706665, -1.636786937713623, -1.5248626470565796, -1.4129383563995361, -1.3010141849517822, -1.1890897750854492, -1.0771656036376953, -0.9652413129806519, -0.8533170223236084, -0.7413927316665649, -0.6294684410095215, -0.5175442099571228, -0.40561991930007935, -0.2936956286430359, -0.18177127838134766, -0.0698469951748848, 0.042077288031578064, 0.15400156378746033, 0.2659258544445038, 0.37785011529922485, 0.4897744059562683, 0.6016986966133118, 0.7136229872703552, 0.8255472779273987, 0.9374715685844421, 1.0493957996368408, 1.1613200902938843, 1.2732443809509277, 1.3851686716079712, 1.4970929622650146, 1.609017252922058, 1.7209415435791016, 1.832865834236145, 1.9447901248931885, 2.0567142963409424, 2.1686387062072754, 2.2805628776550293, 2.3924872875213623, 2.504411458969116, 2.61633563041687, 2.728260040283203, 2.840184211730957, 2.95210862159729, 3.064032793045044, 3.175957202911377, 3.287881374359131, 3.399805784225464]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 0.0, 7.0, 3.0, 11.0, 7.0, 13.0, 24.0, 45.0, 62.0, 114.0, 179.0, 178.0, 124.0, 83.0, 43.0, 25.0, 24.0, 8.0, 10.0, 4.0, 4.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.913475036621094, -9.615315437316895, -9.317155838012695, -9.018996238708496, -8.720836639404297, -8.422677993774414, -8.124518394470215, -7.826358795166016, -7.528199195861816, -7.230039596557617, -6.931879997253418, -6.633720874786377, -6.335561275482178, -6.0374016761779785, -5.7392425537109375, -5.441082954406738, -5.142923355102539, -4.84476375579834, -4.546604156494141, -4.2484450340271, -3.9502854347229004, -3.652125835418701, -3.353966474533081, -3.055807113647461, -2.7576475143432617, -2.4594879150390625, -2.1613285541534424, -1.8631690740585327, -1.565009593963623, -1.2668501138687134, -0.9686906337738037, -0.6705312728881836, -0.3723716735839844, -0.07421219348907471, 0.22394728660583496, 0.5221067667007446, 0.8202662467956543, 1.118425726890564, 1.4165852069854736, 1.7147445678710938, 2.012904167175293, 2.311063766479492, 2.6092231273651123, 2.9073824882507324, 3.2055420875549316, 3.503701686859131, 3.801861047744751, 4.100020408630371, 4.39818000793457, 4.6963396072387695, 4.994499206542969, 5.29265832901001, 5.590817928314209, 5.888977527618408, 6.187136650085449, 6.485296249389648, 6.783455848693848, 7.081615447998047, 7.379775047302246, 7.677934169769287, 7.976093769073486, 8.274252891540527, 8.572412490844727, 8.870572090148926, 9.168731689453125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 6.0, 10.0, 12.0, 9.0, 20.0, 19.0, 39.0, 42.0, 76.0, 103.0, 132.0, 210.0, 280.0, 441.0, 742.0, 1229.0, 2229.0, 4224.0, 9569.0, 35314.0, 3759570.0, 339212.0, 24359.0, 7736.0, 3539.0, 1876.0, 1119.0, 744.0, 430.0, 284.0, 200.0, 149.0, 96.0, 77.0, 39.0, 36.0, 33.0, 16.0, 11.0, 9.0, 10.0, 8.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.001953125, -0.97052001953125, -0.9390869140625, -0.90765380859375, -0.876220703125, -0.84478759765625, -0.8133544921875, -0.78192138671875, -0.75048828125, -0.71905517578125, -0.6876220703125, -0.65618896484375, -0.624755859375, -0.59332275390625, -0.5618896484375, -0.53045654296875, -0.4990234375, -0.46759033203125, -0.4361572265625, -0.40472412109375, -0.373291015625, -0.34185791015625, -0.3104248046875, -0.27899169921875, -0.24755859375, -0.21612548828125, -0.1846923828125, -0.15325927734375, -0.121826171875, -0.09039306640625, -0.0589599609375, -0.02752685546875, 0.00390625, 0.03533935546875, 0.0667724609375, 0.09820556640625, 0.129638671875, 0.16107177734375, 0.1925048828125, 0.22393798828125, 0.25537109375, 0.28680419921875, 0.3182373046875, 0.34967041015625, 0.381103515625, 0.41253662109375, 0.4439697265625, 0.47540283203125, 0.5068359375, 0.53826904296875, 0.5697021484375, 0.60113525390625, 0.632568359375, 0.66400146484375, 0.6954345703125, 0.72686767578125, 0.75830078125, 0.78973388671875, 0.8211669921875, 0.85260009765625, 0.884033203125, 0.91546630859375, 0.9468994140625, 0.97833251953125, 1.009765625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 6.0, 6.0, 7.0, 14.0, 11.0, 23.0, 60.0, 107.0, 168.0, 223.0, 140.0, 82.0, 37.0, 22.0, 16.0, 11.0, 11.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.11290168762207031, -0.10940933227539062, -0.10591697692871094, -0.10242462158203125, -0.09893226623535156, -0.09543991088867188, -0.09194755554199219, -0.0884552001953125, -0.08496284484863281, -0.08147048950195312, -0.07797813415527344, -0.07448577880859375, -0.07099342346191406, -0.06750106811523438, -0.06400871276855469, -0.060516357421875, -0.05702400207519531, -0.053531646728515625, -0.05003929138183594, -0.04654693603515625, -0.04305458068847656, -0.039562225341796875, -0.03606986999511719, -0.0325775146484375, -0.029085159301757812, -0.025592803955078125, -0.022100448608398438, -0.01860809326171875, -0.015115737915039062, -0.011623382568359375, -0.008131027221679688, -0.004638671875, -0.0011463165283203125, 0.002346038818359375, 0.0058383941650390625, 0.00933074951171875, 0.012823104858398438, 0.016315460205078125, 0.019807815551757812, 0.0233001708984375, 0.026792526245117188, 0.030284881591796875, 0.03377723693847656, 0.03726959228515625, 0.04076194763183594, 0.044254302978515625, 0.04774665832519531, 0.051239013671875, 0.05473136901855469, 0.058223724365234375, 0.06171607971191406, 0.06520843505859375, 0.06870079040527344, 0.07219314575195312, 0.07568550109863281, 0.0791778564453125, 0.08267021179199219, 0.08616256713867188, 0.08965492248535156, 0.09314727783203125, 0.09663963317871094, 0.10013198852539062, 0.10362434387207031, 0.10711669921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 9.0, 9.0, 18.0, 26.0, 34.0, 52.0, 74.0, 129.0, 188.0, 291.0, 463.0, 815.0, 1534.0, 2846.0, 6206.0, 15650.0, 58367.0, 2844432.0, 1186350.0, 50364.0, 14381.0, 5702.0, 2646.0, 1487.0, 822.0, 504.0, 294.0, 187.0, 125.0, 78.0, 58.0, 45.0, 23.0, 16.0, 12.0, 14.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.82470703125, -0.8004226684570312, -0.7761383056640625, -0.7518539428710938, -0.727569580078125, -0.7032852172851562, -0.6790008544921875, -0.6547164916992188, -0.63043212890625, -0.6061477661132812, -0.5818634033203125, -0.5575790405273438, -0.533294677734375, -0.5090103149414062, -0.4847259521484375, -0.46044158935546875, -0.4361572265625, -0.41187286376953125, -0.3875885009765625, -0.36330413818359375, -0.339019775390625, -0.31473541259765625, -0.2904510498046875, -0.26616668701171875, -0.24188232421875, -0.21759796142578125, -0.1933135986328125, -0.16902923583984375, -0.144744873046875, -0.12046051025390625, -0.0961761474609375, -0.07189178466796875, -0.047607421875, -0.02332305908203125, 0.0009613037109375, 0.02524566650390625, 0.049530029296875, 0.07381439208984375, 0.0980987548828125, 0.12238311767578125, 0.14666748046875, 0.17095184326171875, 0.1952362060546875, 0.21952056884765625, 0.243804931640625, 0.26808929443359375, 0.2923736572265625, 0.31665802001953125, 0.3409423828125, 0.36522674560546875, 0.3895111083984375, 0.41379547119140625, 0.438079833984375, 0.46236419677734375, 0.4866485595703125, 0.5109329223632812, 0.53521728515625, 0.5595016479492188, 0.5837860107421875, 0.6080703735351562, 0.632354736328125, 0.6566390991210938, 0.6809234619140625, 0.7052078247070312, 0.7294921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 4.0, 7.0, 2.0, 4.0, 8.0, 11.0, 15.0, 28.0, 26.0, 47.0, 100.0, 226.0, 1727.0, 1419.0, 224.0, 81.0, 39.0, 21.0, 25.0, 17.0, 9.0, 9.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2247314453125, -0.21791839599609375, -0.2111053466796875, -0.20429229736328125, -0.197479248046875, -0.19066619873046875, -0.1838531494140625, -0.17704010009765625, -0.17022705078125, -0.16341400146484375, -0.1566009521484375, -0.14978790283203125, -0.142974853515625, -0.13616180419921875, -0.1293487548828125, -0.12253570556640625, -0.11572265625, -0.10890960693359375, -0.1020965576171875, -0.09528350830078125, -0.088470458984375, -0.08165740966796875, -0.0748443603515625, -0.06803131103515625, -0.06121826171875, -0.05440521240234375, -0.0475921630859375, -0.04077911376953125, -0.033966064453125, -0.02715301513671875, -0.0203399658203125, -0.01352691650390625, -0.0067138671875, 9.918212890625e-05, 0.0069122314453125, 0.01372528076171875, 0.020538330078125, 0.02735137939453125, 0.0341644287109375, 0.04097747802734375, 0.04779052734375, 0.05460357666015625, 0.0614166259765625, 0.06822967529296875, 0.075042724609375, 0.08185577392578125, 0.0886688232421875, 0.09548187255859375, 0.102294921875, 0.10910797119140625, 0.1159210205078125, 0.12273406982421875, 0.129547119140625, 0.13636016845703125, 0.1431732177734375, 0.14998626708984375, 0.15679931640625, 0.16361236572265625, 0.1704254150390625, 0.17723846435546875, 0.184051513671875, 0.19086456298828125, 0.1976776123046875, 0.20449066162109375, 0.2113037109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 9.0, 5.0, 15.0, 26.0, 63.0, 163.0, 313.0, 233.0, 92.0, 34.0, 22.0, 11.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.194875955581665, -1.1681782007217407, -1.1414804458618164, -1.1147825717926025, -1.0880848169326782, -1.061387062072754, -1.0346893072128296, -1.0079915523529053, -0.9812937378883362, -0.9545959830284119, -0.9278981685638428, -0.9012004137039185, -0.8745025992393494, -0.847804844379425, -0.821107029914856, -0.7944092750549316, -0.7677115201950073, -0.741013765335083, -0.7143159508705139, -0.6876181960105896, -0.6609203815460205, -0.6342226266860962, -0.6075248718261719, -0.5808270573616028, -0.5541292428970337, -0.5274314880371094, -0.5007336735725403, -0.47403591871261597, -0.44733813405036926, -0.42064034938812256, -0.39394256472587585, -0.36724478006362915, -0.34054702520370483, -0.31384924054145813, -0.2871514558792114, -0.2604537010192871, -0.2337559163570404, -0.2070581316947937, -0.180360347032547, -0.1536625772714615, -0.12696479260921478, -0.10026701539754868, -0.07356923818588257, -0.046871453523635864, -0.020173676311969757, 0.00652410089969635, 0.033221885561943054, 0.059919655323028564, 0.08661743998527527, 0.11331521719694138, 0.14001299440860748, 0.1667107790708542, 0.1934085488319397, 0.2201063334941864, 0.2468041181564331, 0.2735018730163574, 0.3001996874809265, 0.3268974721431732, 0.3535952568054199, 0.38029301166534424, 0.40699079632759094, 0.43368858098983765, 0.46038636565208435, 0.48708415031433105, 0.5137819051742554]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 6.0, 8.0, 6.0, 12.0, 23.0, 44.0, 80.0, 120.0, 150.0, 141.0, 140.0, 115.0, 55.0, 29.0, 20.0, 12.0, 8.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0649104118347168, -1.027033805847168, -0.9891572594642639, -0.9512807130813599, -0.913404107093811, -0.8755275011062622, -0.8376509547233582, -0.7997744083404541, -0.7618978023529053, -0.7240211963653564, -0.6861446499824524, -0.6482681035995483, -0.6103914976119995, -0.5725148916244507, -0.5346383452415466, -0.4967617690563202, -0.45888519287109375, -0.4210086166858673, -0.38313204050064087, -0.34525546431541443, -0.307378888130188, -0.26950231194496155, -0.2316257357597351, -0.19374915957450867, -0.15587258338928223, -0.11799600720405579, -0.08011943101882935, -0.042242854833602905, -0.004366278648376465, 0.033510297536849976, 0.07138687372207642, 0.10926344990730286, 0.1471400260925293, 0.18501660227775574, 0.22289317846298218, 0.2607697546482086, 0.29864633083343506, 0.3365229070186615, 0.37439948320388794, 0.4122760593891144, 0.4501526355743408, 0.48802921175956726, 0.5259057879447937, 0.5637823343276978, 0.6016589403152466, 0.6395355463027954, 0.6774120926856995, 0.7152886390686035, 0.7531652450561523, 0.7910418510437012, 0.8289183974266052, 0.8667949438095093, 0.9046715497970581, 0.9425481557846069, 0.980424702167511, 1.018301248550415, 1.0561778545379639, 1.0940544605255127, 1.1319310665130615, 1.1698075532913208, 1.2076841592788696, 1.2455607652664185, 1.2834372520446777, 1.3213138580322266, 1.3591904640197754]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 7.0, 12.0, 14.0, 8.0, 25.0, 44.0, 79.0, 85.0, 142.0, 277.0, 587.0, 1016.0, 2220.0, 4606.0, 12156.0, 48109.0, 735843.0, 204833.0, 24183.0, 7614.0, 3374.0, 1592.0, 744.0, 368.0, 242.0, 147.0, 77.0, 41.0, 29.0, 22.0, 24.0, 9.0, 9.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6298828125, -0.608734130859375, -0.58758544921875, -0.566436767578125, -0.5452880859375, -0.524139404296875, -0.50299072265625, -0.481842041015625, -0.460693359375, -0.439544677734375, -0.41839599609375, -0.397247314453125, -0.3760986328125, -0.354949951171875, -0.33380126953125, -0.312652587890625, -0.29150390625, -0.270355224609375, -0.24920654296875, -0.228057861328125, -0.2069091796875, -0.185760498046875, -0.16461181640625, -0.143463134765625, -0.122314453125, -0.101165771484375, -0.08001708984375, -0.058868408203125, -0.0377197265625, -0.016571044921875, 0.00457763671875, 0.025726318359375, 0.046875, 0.068023681640625, 0.08917236328125, 0.110321044921875, 0.1314697265625, 0.152618408203125, 0.17376708984375, 0.194915771484375, 0.216064453125, 0.237213134765625, 0.25836181640625, 0.279510498046875, 0.3006591796875, 0.321807861328125, 0.34295654296875, 0.364105224609375, 0.38525390625, 0.406402587890625, 0.42755126953125, 0.448699951171875, 0.4698486328125, 0.490997314453125, 0.51214599609375, 0.533294677734375, 0.554443359375, 0.575592041015625, 0.59674072265625, 0.617889404296875, 0.6390380859375, 0.660186767578125, 0.68133544921875, 0.702484130859375, 0.7236328125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 5.0, 9.0, 6.0, 9.0, 6.0, 19.0, 27.0, 48.0, 100.0, 130.0, 219.0, 142.0, 106.0, 51.0, 31.0, 19.0, 12.0, 12.0, 7.0, 3.0, 5.0, 3.0, 2.0, 5.0, 0.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09527587890625, -0.0926656723022461, -0.09005546569824219, -0.08744525909423828, -0.08483505249023438, -0.08222484588623047, -0.07961463928222656, -0.07700443267822266, -0.07439422607421875, -0.07178401947021484, -0.06917381286621094, -0.06656360626220703, -0.06395339965820312, -0.06134319305419922, -0.05873298645019531, -0.056122779846191406, -0.0535125732421875, -0.050902366638183594, -0.04829216003417969, -0.04568195343017578, -0.043071746826171875, -0.04046154022216797, -0.03785133361816406, -0.035241127014160156, -0.03263092041015625, -0.030020713806152344, -0.027410507202148438, -0.02480030059814453, -0.022190093994140625, -0.01957988739013672, -0.016969680786132812, -0.014359474182128906, -0.011749267578125, -0.009139060974121094, -0.0065288543701171875, -0.003918647766113281, -0.001308441162109375, 0.0013017654418945312, 0.0039119720458984375, 0.006522178649902344, 0.00913238525390625, 0.011742591857910156, 0.014352798461914062, 0.01696300506591797, 0.019573211669921875, 0.02218341827392578, 0.024793624877929688, 0.027403831481933594, 0.0300140380859375, 0.032624244689941406, 0.03523445129394531, 0.03784465789794922, 0.040454864501953125, 0.04306507110595703, 0.04567527770996094, 0.048285484313964844, 0.05089569091796875, 0.053505897521972656, 0.05611610412597656, 0.05872631072998047, 0.061336517333984375, 0.06394672393798828, 0.06655693054199219, 0.0691671371459961, 0.07177734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 12.0, 5.0, 13.0, 22.0, 18.0, 42.0, 46.0, 84.0, 127.0, 182.0, 306.0, 479.0, 746.0, 1244.0, 2118.0, 3645.0, 6481.0, 11636.0, 21487.0, 41540.0, 84787.0, 186589.0, 305140.0, 199318.0, 90080.0, 43207.0, 22046.0, 11838.0, 6489.0, 3541.0, 2030.0, 1280.0, 776.0, 411.0, 278.0, 190.0, 116.0, 63.0, 42.0, 36.0, 24.0, 11.0, 11.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.234375, -0.2273883819580078, -0.22040176391601562, -0.21341514587402344, -0.20642852783203125, -0.19944190979003906, -0.19245529174804688, -0.1854686737060547, -0.1784820556640625, -0.1714954376220703, -0.16450881958007812, -0.15752220153808594, -0.15053558349609375, -0.14354896545410156, -0.13656234741210938, -0.1295757293701172, -0.122589111328125, -0.11560249328613281, -0.10861587524414062, -0.10162925720214844, -0.09464263916015625, -0.08765602111816406, -0.08066940307617188, -0.07368278503417969, -0.0666961669921875, -0.05970954895019531, -0.052722930908203125, -0.04573631286621094, -0.03874969482421875, -0.03176307678222656, -0.024776458740234375, -0.017789840698242188, -0.01080322265625, -0.0038166046142578125, 0.003170013427734375, 0.010156631469726562, 0.01714324951171875, 0.024129867553710938, 0.031116485595703125, 0.03810310363769531, 0.0450897216796875, 0.05207633972167969, 0.059062957763671875, 0.06604957580566406, 0.07303619384765625, 0.08002281188964844, 0.08700942993164062, 0.09399604797363281, 0.100982666015625, 0.10796928405761719, 0.11495590209960938, 0.12194252014160156, 0.12892913818359375, 0.13591575622558594, 0.14290237426757812, 0.1498889923095703, 0.1568756103515625, 0.1638622283935547, 0.17084884643554688, 0.17783546447753906, 0.18482208251953125, 0.19180870056152344, 0.19879531860351562, 0.2057819366455078, 0.2127685546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 6.0, 7.0, 5.0, 14.0, 10.0, 17.0, 21.0, 20.0, 23.0, 18.0, 28.0, 31.0, 33.0, 36.0, 36.0, 34.0, 35.0, 38.0, 43.0, 47.0, 34.0, 40.0, 41.0, 33.0, 43.0, 32.0, 33.0, 23.0, 22.0, 25.0, 25.0, 22.0, 25.0, 14.0, 16.0, 19.0, 14.0, 2.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2587890625, -0.2504730224609375, -0.242156982421875, -0.2338409423828125, -0.22552490234375, -0.2172088623046875, -0.208892822265625, -0.2005767822265625, -0.1922607421875, -0.1839447021484375, -0.175628662109375, -0.1673126220703125, -0.15899658203125, -0.1506805419921875, -0.142364501953125, -0.1340484619140625, -0.125732421875, -0.1174163818359375, -0.109100341796875, -0.1007843017578125, -0.09246826171875, -0.0841522216796875, -0.075836181640625, -0.0675201416015625, -0.0592041015625, -0.0508880615234375, -0.042572021484375, -0.0342559814453125, -0.02593994140625, -0.0176239013671875, -0.009307861328125, -0.0009918212890625, 0.00732421875, 0.0156402587890625, 0.023956298828125, 0.0322723388671875, 0.04058837890625, 0.0489044189453125, 0.057220458984375, 0.0655364990234375, 0.0738525390625, 0.0821685791015625, 0.090484619140625, 0.0988006591796875, 0.10711669921875, 0.1154327392578125, 0.123748779296875, 0.1320648193359375, 0.140380859375, 0.1486968994140625, 0.157012939453125, 0.1653289794921875, 0.17364501953125, 0.1819610595703125, 0.190277099609375, 0.1985931396484375, 0.2069091796875, 0.2152252197265625, 0.223541259765625, 0.2318572998046875, 0.24017333984375, 0.2484893798828125, 0.256805419921875, 0.2651214599609375, 0.2734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 10.0, 13.0, 17.0, 20.0, 44.0, 70.0, 154.0, 352.0, 1122.0, 6205.0, 947436.0, 88891.0, 2891.0, 746.0, 268.0, 120.0, 57.0, 33.0, 22.0, 25.0, 12.0, 14.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.03515625, -0.99346923828125, -0.9517822265625, -0.91009521484375, -0.868408203125, -0.82672119140625, -0.7850341796875, -0.74334716796875, -0.70166015625, -0.65997314453125, -0.6182861328125, -0.57659912109375, -0.534912109375, -0.49322509765625, -0.4515380859375, -0.40985107421875, -0.3681640625, -0.32647705078125, -0.2847900390625, -0.24310302734375, -0.201416015625, -0.15972900390625, -0.1180419921875, -0.07635498046875, -0.03466796875, 0.00701904296875, 0.0487060546875, 0.09039306640625, 0.132080078125, 0.17376708984375, 0.2154541015625, 0.25714111328125, 0.298828125, 0.34051513671875, 0.3822021484375, 0.42388916015625, 0.465576171875, 0.50726318359375, 0.5489501953125, 0.59063720703125, 0.63232421875, 0.67401123046875, 0.7156982421875, 0.75738525390625, 0.799072265625, 0.84075927734375, 0.8824462890625, 0.92413330078125, 0.9658203125, 1.00750732421875, 1.0491943359375, 1.09088134765625, 1.132568359375, 1.17425537109375, 1.2159423828125, 1.25762939453125, 1.29931640625, 1.34100341796875, 1.3826904296875, 1.42437744140625, 1.466064453125, 1.50775146484375, 1.5494384765625, 1.59112548828125, 1.6328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 9.0, 5.0, 14.0, 8.0, 14.0, 23.0, 26.0, 28.0, 47.0, 52.0, 61.0, 88.0, 112.0, 120.0, 99.0, 71.0, 52.0, 31.0, 40.0, 21.0, 14.0, 15.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.283687591552734e-05, -7.062684744596481e-05, -6.841681897640228e-05, -6.620679050683975e-05, -6.399676203727722e-05, -6.178673356771469e-05, -5.957670509815216e-05, -5.736667662858963e-05, -5.51566481590271e-05, -5.294661968946457e-05, -5.073659121990204e-05, -4.852656275033951e-05, -4.631653428077698e-05, -4.410650581121445e-05, -4.1896477341651917e-05, -3.9686448872089386e-05, -3.7476420402526855e-05, -3.5266391932964325e-05, -3.3056363463401794e-05, -3.0846334993839264e-05, -2.8636306524276733e-05, -2.6426278054714203e-05, -2.4216249585151672e-05, -2.2006221115589142e-05, -1.979619264602661e-05, -1.758616417646408e-05, -1.537613570690155e-05, -1.316610723733902e-05, -1.095607876777649e-05, -8.746050298213959e-06, -6.536021828651428e-06, -4.325993359088898e-06, -2.115964889526367e-06, 9.406358003616333e-08, 2.304092049598694e-06, 4.514120519161224e-06, 6.724148988723755e-06, 8.934177458286285e-06, 1.1144205927848816e-05, 1.3354234397411346e-05, 1.5564262866973877e-05, 1.7774291336536407e-05, 1.9984319806098938e-05, 2.219434827566147e-05, 2.4404376745224e-05, 2.661440521478653e-05, 2.882443368434906e-05, 3.103446215391159e-05, 3.324449062347412e-05, 3.545451909303665e-05, 3.766454756259918e-05, 3.987457603216171e-05, 4.208460450172424e-05, 4.4294632971286774e-05, 4.6504661440849304e-05, 4.8714689910411835e-05, 5.0924718379974365e-05, 5.3134746849536896e-05, 5.5344775319099426e-05, 5.755480378866196e-05, 5.976483225822449e-05, 6.197486072778702e-05, 6.418488919734955e-05, 6.639491766691208e-05, 6.860494613647461e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 8.0, 6.0, 12.0, 8.0, 19.0, 19.0, 29.0, 33.0, 49.0, 66.0, 96.0, 124.0, 166.0, 228.0, 302.0, 487.0, 708.0, 1057.0, 1632.0, 2937.0, 5596.0, 13041.0, 38851.0, 233916.0, 618655.0, 88993.0, 22689.0, 8695.0, 4176.0, 2201.0, 1252.0, 842.0, 512.0, 326.0, 216.0, 170.0, 135.0, 75.0, 65.0, 36.0, 32.0, 23.0, 20.0, 13.0, 12.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 4.0], "bins": [-0.301513671875, -0.2931995391845703, -0.2848854064941406, -0.27657127380371094, -0.26825714111328125, -0.25994300842285156, -0.2516288757324219, -0.2433147430419922, -0.2350006103515625, -0.2266864776611328, -0.21837234497070312, -0.21005821228027344, -0.20174407958984375, -0.19342994689941406, -0.18511581420898438, -0.1768016815185547, -0.168487548828125, -0.1601734161376953, -0.15185928344726562, -0.14354515075683594, -0.13523101806640625, -0.12691688537597656, -0.11860275268554688, -0.11028861999511719, -0.1019744873046875, -0.09366035461425781, -0.08534622192382812, -0.07703208923339844, -0.06871795654296875, -0.06040382385253906, -0.052089691162109375, -0.04377555847167969, -0.03546142578125, -0.027147293090820312, -0.018833160400390625, -0.010519027709960938, -0.00220489501953125, 0.0061092376708984375, 0.014423370361328125, 0.022737503051757812, 0.0310516357421875, 0.03936576843261719, 0.047679901123046875, 0.05599403381347656, 0.06430816650390625, 0.07262229919433594, 0.08093643188476562, 0.08925056457519531, 0.097564697265625, 0.10587882995605469, 0.11419296264648438, 0.12250709533691406, 0.13082122802734375, 0.13913536071777344, 0.14744949340820312, 0.1557636260986328, 0.1640777587890625, 0.1723918914794922, 0.18070602416992188, 0.18902015686035156, 0.19733428955078125, 0.20564842224121094, 0.21396255493164062, 0.2222766876220703, 0.2305908203125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 11.0, 4.0, 4.0, 18.0, 16.0, 19.0, 43.0, 67.0, 108.0, 150.0, 177.0, 134.0, 76.0, 51.0, 29.0, 26.0, 17.0, 15.0, 10.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.41796875, -0.4064292907714844, -0.39488983154296875, -0.3833503723144531, -0.3718109130859375, -0.3602714538574219, -0.34873199462890625, -0.3371925354003906, -0.325653076171875, -0.3141136169433594, -0.30257415771484375, -0.2910346984863281, -0.2794952392578125, -0.2679557800292969, -0.25641632080078125, -0.24487686157226562, -0.23333740234375, -0.22179794311523438, -0.21025848388671875, -0.19871902465820312, -0.1871795654296875, -0.17564010620117188, -0.16410064697265625, -0.15256118774414062, -0.141021728515625, -0.12948226928710938, -0.11794281005859375, -0.10640335083007812, -0.0948638916015625, -0.08332443237304688, -0.07178497314453125, -0.060245513916015625, -0.0487060546875, -0.037166595458984375, -0.02562713623046875, -0.014087677001953125, -0.0025482177734375, 0.008991241455078125, 0.02053070068359375, 0.032070159912109375, 0.043609619140625, 0.055149078369140625, 0.06668853759765625, 0.07822799682617188, 0.0897674560546875, 0.10130691528320312, 0.11284637451171875, 0.12438583374023438, 0.13592529296875, 0.14746475219726562, 0.15900421142578125, 0.17054367065429688, 0.1820831298828125, 0.19362258911132812, 0.20516204833984375, 0.21670150756835938, 0.228240966796875, 0.23978042602539062, 0.25131988525390625, 0.2628593444824219, 0.2743988037109375, 0.2859382629394531, 0.29747772216796875, 0.3090171813964844, 0.320556640625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 7.0, 9.0, 34.0, 79.0, 300.0, 372.0, 125.0, 39.0, 18.0, 14.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1503190994262695, -3.9789814949035645, -3.8076441287994385, -3.6363065242767334, -3.4649691581726074, -3.2936315536499023, -3.1222939491271973, -2.950956344604492, -2.779618978500366, -2.608281373977661, -2.436944007873535, -2.26560640335083, -2.094268798828125, -1.922931432723999, -1.751593828201294, -1.5802563428878784, -1.408918857574463, -1.2375813722610474, -1.0662438869476318, -0.8949062824249268, -0.7235687971115112, -0.5522313117980957, -0.3808937072753906, -0.2095562219619751, -0.03821873664855957, 0.13311877846717834, 0.30445629358291626, 0.47579383850097656, 0.6471313238143921, 0.8184688091278076, 0.9898064136505127, 1.1611438989639282, 1.3324813842773438, 1.5038188695907593, 1.6751563549041748, 1.8464939594268799, 2.017831325531006, 2.189168930053711, 2.360506534576416, 2.531844139099121, 2.703181505203247, 2.874519109725952, 3.045856475830078, 3.217194080352783, 3.3885316848754883, 3.5598690509796143, 3.7312066555023193, 3.9025440216064453, 4.07388162612915, 4.2452192306518555, 4.4165568351745605, 4.587894439697266, 4.7592315673828125, 4.930569171905518, 5.101906776428223, 5.273244380950928, 5.444581985473633, 5.615919589996338, 5.787257194519043, 5.95859432220459, 6.129931926727295, 6.30126953125, 6.472607135772705, 6.64394474029541, 6.815281867980957]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 3.0, 2.0, 4.0, 8.0, 7.0, 14.0, 22.0, 43.0, 59.0, 77.0, 107.0, 95.0, 118.0, 119.0, 81.0, 55.0, 55.0, 33.0, 20.0, 11.0, 11.0, 12.0, 11.0, 2.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-4.70256233215332, -4.5700154304504395, -4.437468528747559, -4.304921627044678, -4.172374725341797, -4.039827823638916, -3.907280683517456, -3.774733781814575, -3.6421868801116943, -3.5096399784088135, -3.3770930767059326, -3.2445461750030518, -3.111999034881592, -2.979452133178711, -2.84690523147583, -2.714358329772949, -2.5818114280700684, -2.4492645263671875, -2.3167176246643066, -2.184170722961426, -2.051623821258545, -1.9190768003463745, -1.786529779434204, -1.6539828777313232, -1.5214359760284424, -1.3888890743255615, -1.2563421726226807, -1.1237951517105103, -0.9912482500076294, -0.8587013483047485, -0.7261543869972229, -0.5936074256896973, -0.4610610008239746, -0.32851406931877136, -0.19596713781356812, -0.06342020630836487, 0.06912672519683838, 0.20167362689971924, 0.3342205882072449, 0.4667675495147705, 0.5993144512176514, 0.7318613529205322, 0.8644083142280579, 0.9969552755355835, 1.1295021772384644, 1.2620490789413452, 1.3945960998535156, 1.5271430015563965, 1.6596899032592773, 1.7922368049621582, 1.924783706665039, 2.05733060836792, 2.189877510070801, 2.3224244117736816, 2.4549715518951416, 2.5875184535980225, 2.7200653553009033, 2.852612257003784, 2.985159158706665, 3.117706060409546, 3.250253200531006, 3.3828001022338867, 3.5153470039367676, 3.6478939056396484, 3.7804408073425293]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 7.0, 5.0, 10.0, 13.0, 28.0, 30.0, 68.0, 85.0, 119.0, 135.0, 225.0, 358.0, 469.0, 644.0, 947.0, 1437.0, 2735.0, 5537.0, 13793.0, 53109.0, 3315675.0, 736355.0, 38761.0, 11406.0, 5052.0, 2608.0, 1460.0, 938.0, 607.0, 418.0, 297.0, 208.0, 165.0, 136.0, 97.0, 70.0, 64.0, 36.0, 39.0, 37.0, 29.0, 18.0, 10.0, 15.0, 7.0, 7.0, 6.0, 7.0, 1.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70751953125, -0.6779403686523438, -0.6483612060546875, -0.6187820434570312, -0.589202880859375, -0.5596237182617188, -0.5300445556640625, -0.5004653930664062, -0.47088623046875, -0.44130706787109375, -0.4117279052734375, -0.38214874267578125, -0.352569580078125, -0.32299041748046875, -0.2934112548828125, -0.26383209228515625, -0.2342529296875, -0.20467376708984375, -0.1750946044921875, -0.14551544189453125, -0.115936279296875, -0.08635711669921875, -0.0567779541015625, -0.02719879150390625, 0.00238037109375, 0.03195953369140625, 0.0615386962890625, 0.09111785888671875, 0.120697021484375, 0.15027618408203125, 0.1798553466796875, 0.20943450927734375, 0.239013671875, 0.26859283447265625, 0.2981719970703125, 0.32775115966796875, 0.357330322265625, 0.38690948486328125, 0.4164886474609375, 0.44606781005859375, 0.47564697265625, 0.5052261352539062, 0.5348052978515625, 0.5643844604492188, 0.593963623046875, 0.6235427856445312, 0.6531219482421875, 0.6827011108398438, 0.7122802734375, 0.7418594360351562, 0.7714385986328125, 0.8010177612304688, 0.830596923828125, 0.8601760864257812, 0.8897552490234375, 0.9193344116210938, 0.94891357421875, 0.9784927368164062, 1.0080718994140625, 1.0376510620117188, 1.067230224609375, 1.0968093872070312, 1.1263885498046875, 1.1559677124023438, 1.185546875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 2.0, 7.0, 6.0, 4.0, 5.0, 6.0, 8.0, 5.0, 17.0, 18.0, 33.0, 53.0, 63.0, 98.0, 114.0, 149.0, 109.0, 87.0, 61.0, 37.0, 30.0, 25.0, 17.0, 11.0, 7.0, 6.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0555419921875, -0.053272247314453125, -0.05100250244140625, -0.048732757568359375, -0.0464630126953125, -0.044193267822265625, -0.04192352294921875, -0.039653778076171875, -0.037384033203125, -0.035114288330078125, -0.03284454345703125, -0.030574798583984375, -0.0283050537109375, -0.026035308837890625, -0.02376556396484375, -0.021495819091796875, -0.01922607421875, -0.016956329345703125, -0.01468658447265625, -0.012416839599609375, -0.0101470947265625, -0.007877349853515625, -0.00560760498046875, -0.003337860107421875, -0.001068115234375, 0.001201629638671875, 0.00347137451171875, 0.005741119384765625, 0.0080108642578125, 0.010280609130859375, 0.01255035400390625, 0.014820098876953125, 0.01708984375, 0.019359588623046875, 0.02162933349609375, 0.023899078369140625, 0.0261688232421875, 0.028438568115234375, 0.03070831298828125, 0.032978057861328125, 0.035247802734375, 0.037517547607421875, 0.03978729248046875, 0.042057037353515625, 0.0443267822265625, 0.046596527099609375, 0.04886627197265625, 0.051136016845703125, 0.05340576171875, 0.055675506591796875, 0.05794525146484375, 0.060214996337890625, 0.0624847412109375, 0.06475448608398438, 0.06702423095703125, 0.06929397583007812, 0.071563720703125, 0.07383346557617188, 0.07610321044921875, 0.07837295532226562, 0.0806427001953125, 0.08291244506835938, 0.08518218994140625, 0.08745193481445312, 0.0897216796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 12.0, 3.0, 9.0, 15.0, 22.0, 29.0, 32.0, 63.0, 123.0, 359.0, 1359.0, 13209.0, 3653517.0, 516148.0, 7797.0, 1016.0, 286.0, 101.0, 56.0, 29.0, 24.0, 19.0, 6.0, 12.0, 6.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.869140625, -1.806640625, -1.744140625, -1.681640625, -1.619140625, -1.556640625, -1.494140625, -1.431640625, -1.369140625, -1.306640625, -1.244140625, -1.181640625, -1.119140625, -1.056640625, -0.994140625, -0.931640625, -0.869140625, -0.806640625, -0.744140625, -0.681640625, -0.619140625, -0.556640625, -0.494140625, -0.431640625, -0.369140625, -0.306640625, -0.244140625, -0.181640625, -0.119140625, -0.056640625, 0.005859375, 0.068359375, 0.130859375, 0.193359375, 0.255859375, 0.318359375, 0.380859375, 0.443359375, 0.505859375, 0.568359375, 0.630859375, 0.693359375, 0.755859375, 0.818359375, 0.880859375, 0.943359375, 1.005859375, 1.068359375, 1.130859375, 1.193359375, 1.255859375, 1.318359375, 1.380859375, 1.443359375, 1.505859375, 1.568359375, 1.630859375, 1.693359375, 1.755859375, 1.818359375, 1.880859375, 1.943359375, 2.005859375, 2.068359375, 2.130859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 3.0, 11.0, 4.0, 8.0, 14.0, 13.0, 14.0, 33.0, 42.0, 68.0, 95.0, 207.0, 390.0, 1360.0, 1022.0, 332.0, 163.0, 100.0, 64.0, 29.0, 27.0, 16.0, 19.0, 12.0, 7.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15673828125, -0.15224647521972656, -0.14775466918945312, -0.1432628631591797, -0.13877105712890625, -0.1342792510986328, -0.12978744506835938, -0.12529563903808594, -0.1208038330078125, -0.11631202697753906, -0.11182022094726562, -0.10732841491699219, -0.10283660888671875, -0.09834480285644531, -0.09385299682617188, -0.08936119079589844, -0.084869384765625, -0.08037757873535156, -0.07588577270507812, -0.07139396667480469, -0.06690216064453125, -0.06241035461425781, -0.057918548583984375, -0.05342674255371094, -0.0489349365234375, -0.04444313049316406, -0.039951324462890625, -0.03545951843261719, -0.03096771240234375, -0.026475906372070312, -0.021984100341796875, -0.017492294311523438, -0.01300048828125, -0.008508682250976562, -0.004016876220703125, 0.0004749298095703125, 0.00496673583984375, 0.009458541870117188, 0.013950347900390625, 0.018442153930664062, 0.0229339599609375, 0.027425765991210938, 0.031917572021484375, 0.03640937805175781, 0.04090118408203125, 0.04539299011230469, 0.049884796142578125, 0.05437660217285156, 0.058868408203125, 0.06336021423339844, 0.06785202026367188, 0.07234382629394531, 0.07683563232421875, 0.08132743835449219, 0.08581924438476562, 0.09031105041503906, 0.0948028564453125, 0.09929466247558594, 0.10378646850585938, 0.10827827453613281, 0.11277008056640625, 0.11726188659667969, 0.12175369262695312, 0.12624549865722656, 0.1307373046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 10.0, 13.0, 38.0, 125.0, 331.0, 328.0, 103.0, 40.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7489442825317383, -1.7062439918518066, -1.6635435819625854, -1.6208432912826538, -1.5781428813934326, -1.535442590713501, -1.4927421808242798, -1.4500418901443481, -1.407341480255127, -1.3646411895751953, -1.3219407796859741, -1.2792404890060425, -1.2365400791168213, -1.1938397884368896, -1.1511393785476685, -1.1084390878677368, -1.0657386779785156, -1.023038387298584, -0.9803379774093628, -0.9376376271247864, -0.89493727684021, -0.8522369265556335, -0.8095365762710571, -0.7668362855911255, -0.7241359949111938, -0.6814356446266174, -0.638735294342041, -0.5960349440574646, -0.5533345937728882, -0.5106342434883118, -0.46793392300605774, -0.4252335727214813, -0.38253313302993774, -0.33983278274536133, -0.2971324324607849, -0.2544320821762085, -0.21173174679279327, -0.16903139650821686, -0.12633106112480164, -0.08363071084022522, -0.040930360555648804, 0.0017699860036373138, 0.04447033256292343, 0.08717067539691925, 0.12987102568149567, 0.17257137596607208, 0.2152717113494873, 0.2579720616340637, 0.30067241191864014, 0.34337276220321655, 0.38607311248779297, 0.4287734627723694, 0.4714738130569458, 0.5141741633415222, 0.5568745136260986, 0.5995748043060303, 0.6422752141952515, 0.6849755644798279, 0.7276759147644043, 0.7703762650489807, 0.8130766153335571, 0.8557769656181335, 0.89847731590271, 0.9411776065826416, 0.983877956867218]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 8.0, 18.0, 15.0, 15.0, 33.0, 40.0, 46.0, 63.0, 56.0, 74.0, 71.0, 64.0, 77.0, 69.0, 54.0, 57.0, 41.0, 47.0, 30.0, 26.0, 19.0, 14.0, 16.0, 5.0, 7.0, 5.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5972145199775696, -0.5785411596298218, -0.5598677396774292, -0.5411943793296814, -0.5225209593772888, -0.503847599029541, -0.4851742088794708, -0.46650081872940063, -0.44782742857933044, -0.42915403842926025, -0.41048064827919006, -0.3918072581291199, -0.37313389778137207, -0.3544604778289795, -0.3357871174812317, -0.3171137273311615, -0.2984403371810913, -0.2797669470310211, -0.2610935568809509, -0.24242018163204193, -0.22374679148197174, -0.20507340133190155, -0.18640002608299255, -0.16772663593292236, -0.14905324578285217, -0.13037985563278198, -0.11170647293329239, -0.0930330902338028, -0.0743597000837326, -0.055686309933662415, -0.03701292723417282, -0.018339544534683228, 0.0003337860107421875, 0.01900717243552208, 0.03768055886030197, 0.05635394528508186, 0.07502733170986176, 0.09370072185993195, 0.11237410455942154, 0.13104748725891113, 0.14972087740898132, 0.1683942675590515, 0.1870676577091217, 0.2057410329580307, 0.2244144231081009, 0.24308781325817108, 0.2617611885070801, 0.28043457865715027, 0.29910796880722046, 0.31778135895729065, 0.33645474910736084, 0.35512813925743103, 0.3738015294075012, 0.392474889755249, 0.4111482799053192, 0.4298216700553894, 0.4484950602054596, 0.4671684503555298, 0.4858418405056, 0.5045152306556702, 0.523188591003418, 0.5418620109558105, 0.5605353713035583, 0.5792087316513062, 0.5978821516036987]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 12.0, 13.0, 15.0, 37.0, 34.0, 58.0, 91.0, 165.0, 275.0, 484.0, 1003.0, 2183.0, 5892.0, 21191.0, 136429.0, 713222.0, 136210.0, 20994.0, 5736.0, 2245.0, 961.0, 527.0, 256.0, 185.0, 98.0, 83.0, 42.0, 32.0, 23.0, 13.0, 15.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60546875, -0.5873947143554688, -0.5693206787109375, -0.5512466430664062, -0.533172607421875, -0.5150985717773438, -0.4970245361328125, -0.47895050048828125, -0.46087646484375, -0.44280242919921875, -0.4247283935546875, -0.40665435791015625, -0.388580322265625, -0.37050628662109375, -0.3524322509765625, -0.33435821533203125, -0.3162841796875, -0.29821014404296875, -0.2801361083984375, -0.26206207275390625, -0.243988037109375, -0.22591400146484375, -0.2078399658203125, -0.18976593017578125, -0.17169189453125, -0.15361785888671875, -0.1355438232421875, -0.11746978759765625, -0.099395751953125, -0.08132171630859375, -0.0632476806640625, -0.04517364501953125, -0.027099609375, -0.00902557373046875, 0.0090484619140625, 0.02712249755859375, 0.045196533203125, 0.06327056884765625, 0.0813446044921875, 0.09941864013671875, 0.11749267578125, 0.13556671142578125, 0.1536407470703125, 0.17171478271484375, 0.189788818359375, 0.20786285400390625, 0.2259368896484375, 0.24401092529296875, 0.2620849609375, 0.28015899658203125, 0.2982330322265625, 0.31630706787109375, 0.334381103515625, 0.35245513916015625, 0.3705291748046875, 0.38860321044921875, 0.40667724609375, 0.42475128173828125, 0.4428253173828125, 0.46089935302734375, 0.478973388671875, 0.49704742431640625, 0.5151214599609375, 0.5331954956054688, 0.55126953125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 6.0, 16.0, 15.0, 21.0, 37.0, 62.0, 83.0, 78.0, 122.0, 132.0, 110.0, 95.0, 76.0, 46.0, 34.0, 16.0, 10.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059478759765625, -0.05713033676147461, -0.05478191375732422, -0.05243349075317383, -0.05008506774902344, -0.04773664474487305, -0.045388221740722656, -0.043039798736572266, -0.040691375732421875, -0.038342952728271484, -0.035994529724121094, -0.0336461067199707, -0.03129768371582031, -0.028949260711669922, -0.02660083770751953, -0.02425241470336914, -0.02190399169921875, -0.01955556869506836, -0.01720714569091797, -0.014858722686767578, -0.012510299682617188, -0.010161876678466797, -0.007813453674316406, -0.005465030670166016, -0.003116607666015625, -0.0007681846618652344, 0.0015802383422851562, 0.003928661346435547, 0.0062770843505859375, 0.008625507354736328, 0.010973930358886719, 0.01332235336303711, 0.0156707763671875, 0.01801919937133789, 0.02036762237548828, 0.022716045379638672, 0.025064468383789062, 0.027412891387939453, 0.029761314392089844, 0.032109737396240234, 0.034458160400390625, 0.036806583404541016, 0.039155006408691406, 0.0415034294128418, 0.04385185241699219, 0.04620027542114258, 0.04854869842529297, 0.05089712142944336, 0.05324554443359375, 0.05559396743774414, 0.05794239044189453, 0.06029081344604492, 0.06263923645019531, 0.0649876594543457, 0.0673360824584961, 0.06968450546264648, 0.07203292846679688, 0.07438135147094727, 0.07672977447509766, 0.07907819747924805, 0.08142662048339844, 0.08377504348754883, 0.08612346649169922, 0.08847188949584961, 0.0908203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 8.0, 15.0, 11.0, 23.0, 18.0, 21.0, 37.0, 35.0, 43.0, 70.0, 78.0, 113.0, 178.0, 350.0, 511.0, 1184.0, 2664.0, 6529.0, 16301.0, 43628.0, 147900.0, 463386.0, 256640.0, 68274.0, 23617.0, 9378.0, 3899.0, 1708.0, 781.0, 383.0, 211.0, 144.0, 86.0, 74.0, 61.0, 40.0, 38.0, 30.0, 16.0, 18.0, 12.0, 10.0, 6.0, 5.0, 3.0, 6.0, 5.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.402099609375, -0.390167236328125, -0.37823486328125, -0.366302490234375, -0.3543701171875, -0.342437744140625, -0.33050537109375, -0.318572998046875, -0.306640625, -0.294708251953125, -0.28277587890625, -0.270843505859375, -0.2589111328125, -0.246978759765625, -0.23504638671875, -0.223114013671875, -0.211181640625, -0.199249267578125, -0.18731689453125, -0.175384521484375, -0.1634521484375, -0.151519775390625, -0.13958740234375, -0.127655029296875, -0.11572265625, -0.103790283203125, -0.09185791015625, -0.079925537109375, -0.0679931640625, -0.056060791015625, -0.04412841796875, -0.032196044921875, -0.020263671875, -0.008331298828125, 0.00360107421875, 0.015533447265625, 0.0274658203125, 0.039398193359375, 0.05133056640625, 0.063262939453125, 0.0751953125, 0.087127685546875, 0.09906005859375, 0.110992431640625, 0.1229248046875, 0.134857177734375, 0.14678955078125, 0.158721923828125, 0.170654296875, 0.182586669921875, 0.19451904296875, 0.206451416015625, 0.2183837890625, 0.230316162109375, 0.24224853515625, 0.254180908203125, 0.26611328125, 0.278045654296875, 0.28997802734375, 0.301910400390625, 0.3138427734375, 0.325775146484375, 0.33770751953125, 0.349639892578125, 0.361572265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 14.0, 9.0, 8.0, 5.0, 11.0, 17.0, 14.0, 18.0, 12.0, 28.0, 14.0, 22.0, 25.0, 31.0, 32.0, 28.0, 47.0, 44.0, 43.0, 36.0, 39.0, 29.0, 40.0, 45.0, 38.0, 35.0, 47.0, 30.0, 22.0, 19.0, 19.0, 22.0, 17.0, 21.0, 17.0, 9.0, 9.0, 12.0, 12.0, 4.0, 11.0, 6.0, 5.0, 2.0, 8.0, 8.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2286376953125, -0.22144699096679688, -0.21425628662109375, -0.20706558227539062, -0.1998748779296875, -0.19268417358398438, -0.18549346923828125, -0.17830276489257812, -0.171112060546875, -0.16392135620117188, -0.15673065185546875, -0.14953994750976562, -0.1423492431640625, -0.13515853881835938, -0.12796783447265625, -0.12077713012695312, -0.11358642578125, -0.10639572143554688, -0.09920501708984375, -0.09201431274414062, -0.0848236083984375, -0.07763290405273438, -0.07044219970703125, -0.06325149536132812, -0.056060791015625, -0.048870086669921875, -0.04167938232421875, -0.034488677978515625, -0.0272979736328125, -0.020107269287109375, -0.01291656494140625, -0.005725860595703125, 0.00146484375, 0.008655548095703125, 0.01584625244140625, 0.023036956787109375, 0.0302276611328125, 0.037418365478515625, 0.04460906982421875, 0.051799774169921875, 0.058990478515625, 0.06618118286132812, 0.07337188720703125, 0.08056259155273438, 0.0877532958984375, 0.09494400024414062, 0.10213470458984375, 0.10932540893554688, 0.11651611328125, 0.12370681762695312, 0.13089752197265625, 0.13808822631835938, 0.1452789306640625, 0.15246963500976562, 0.15966033935546875, 0.16685104370117188, 0.174041748046875, 0.18123245239257812, 0.18842315673828125, 0.19561386108398438, 0.2028045654296875, 0.20999526977539062, 0.21718597412109375, 0.22437667846679688, 0.2315673828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 10.0, 9.0, 17.0, 27.0, 35.0, 55.0, 62.0, 100.0, 170.0, 246.0, 484.0, 1130.0, 3232.0, 14349.0, 145023.0, 772684.0, 95220.0, 10972.0, 2696.0, 958.0, 432.0, 230.0, 108.0, 91.0, 46.0, 36.0, 31.0, 26.0, 18.0, 9.0, 11.0, 7.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.38232421875, -0.3705329895019531, -0.35874176025390625, -0.3469505310058594, -0.3351593017578125, -0.3233680725097656, -0.31157684326171875, -0.2997856140136719, -0.287994384765625, -0.2762031555175781, -0.26441192626953125, -0.2526206970214844, -0.2408294677734375, -0.22903823852539062, -0.21724700927734375, -0.20545578002929688, -0.19366455078125, -0.18187332153320312, -0.17008209228515625, -0.15829086303710938, -0.1464996337890625, -0.13470840454101562, -0.12291717529296875, -0.11112594604492188, -0.099334716796875, -0.08754348754882812, -0.07575225830078125, -0.06396102905273438, -0.0521697998046875, -0.040378570556640625, -0.02858734130859375, -0.016796112060546875, -0.0050048828125, 0.006786346435546875, 0.01857757568359375, 0.030368804931640625, 0.0421600341796875, 0.053951263427734375, 0.06574249267578125, 0.07753372192382812, 0.089324951171875, 0.10111618041992188, 0.11290740966796875, 0.12469863891601562, 0.1364898681640625, 0.14828109741210938, 0.16007232666015625, 0.17186355590820312, 0.18365478515625, 0.19544601440429688, 0.20723724365234375, 0.21902847290039062, 0.2308197021484375, 0.24261093139648438, 0.25440216064453125, 0.2661933898925781, 0.277984619140625, 0.2897758483886719, 0.30156707763671875, 0.3133583068847656, 0.3251495361328125, 0.3369407653808594, 0.34873199462890625, 0.3605232238769531, 0.372314453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 8.0, 8.0, 11.0, 14.0, 11.0, 21.0, 28.0, 27.0, 55.0, 61.0, 57.0, 74.0, 74.0, 70.0, 63.0, 72.0, 65.0, 57.0, 47.0, 42.0, 22.0, 19.0, 15.0, 14.0, 9.0, 11.0, 6.0, 5.0, 2.0, 7.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439188003540039e-05, -3.313738852739334e-05, -3.188289701938629e-05, -3.062840551137924e-05, -2.9373914003372192e-05, -2.8119422495365143e-05, -2.6864930987358093e-05, -2.5610439479351044e-05, -2.4355947971343994e-05, -2.3101456463336945e-05, -2.1846964955329895e-05, -2.0592473447322845e-05, -1.9337981939315796e-05, -1.8083490431308746e-05, -1.6828998923301697e-05, -1.5574507415294647e-05, -1.4320015907287598e-05, -1.3065524399280548e-05, -1.1811032891273499e-05, -1.0556541383266449e-05, -9.3020498752594e-06, -8.04755836725235e-06, -6.7930668592453e-06, -5.538575351238251e-06, -4.284083843231201e-06, -3.0295923352241516e-06, -1.775100827217102e-06, -5.206093192100525e-07, 7.338821887969971e-07, 1.9883736968040466e-06, 3.242865204811096e-06, 4.497356712818146e-06, 5.751848220825195e-06, 7.006339728832245e-06, 8.260831236839294e-06, 9.515322744846344e-06, 1.0769814252853394e-05, 1.2024305760860443e-05, 1.3278797268867493e-05, 1.4533288776874542e-05, 1.5787780284881592e-05, 1.704227179288864e-05, 1.829676330089569e-05, 1.955125480890274e-05, 2.080574631690979e-05, 2.206023782491684e-05, 2.331472933292389e-05, 2.456922084093094e-05, 2.5823712348937988e-05, 2.7078203856945038e-05, 2.8332695364952087e-05, 2.9587186872959137e-05, 3.0841678380966187e-05, 3.2096169888973236e-05, 3.3350661396980286e-05, 3.4605152904987335e-05, 3.5859644412994385e-05, 3.7114135921001434e-05, 3.8368627429008484e-05, 3.9623118937015533e-05, 4.087761044502258e-05, 4.213210195302963e-05, 4.338659346103668e-05, 4.464108496904373e-05, 4.589557647705078e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 7.0, 7.0, 8.0, 28.0, 43.0, 67.0, 119.0, 222.0, 509.0, 1239.0, 4009.0, 15468.0, 117547.0, 753098.0, 132370.0, 17030.0, 4278.0, 1395.0, 574.0, 214.0, 126.0, 68.0, 36.0, 25.0, 16.0, 14.0, 11.0, 4.0, 3.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.365234375, -0.3528633117675781, -0.34049224853515625, -0.3281211853027344, -0.3157501220703125, -0.3033790588378906, -0.29100799560546875, -0.2786369323730469, -0.266265869140625, -0.2538948059082031, -0.24152374267578125, -0.22915267944335938, -0.2167816162109375, -0.20441055297851562, -0.19203948974609375, -0.17966842651367188, -0.16729736328125, -0.15492630004882812, -0.14255523681640625, -0.13018417358398438, -0.1178131103515625, -0.10544204711914062, -0.09307098388671875, -0.08069992065429688, -0.068328857421875, -0.055957794189453125, -0.04358673095703125, -0.031215667724609375, -0.0188446044921875, -0.006473541259765625, 0.00589752197265625, 0.018268585205078125, 0.0306396484375, 0.043010711669921875, 0.05538177490234375, 0.06775283813476562, 0.0801239013671875, 0.09249496459960938, 0.10486602783203125, 0.11723709106445312, 0.129608154296875, 0.14197921752929688, 0.15435028076171875, 0.16672134399414062, 0.1790924072265625, 0.19146347045898438, 0.20383453369140625, 0.21620559692382812, 0.22857666015625, 0.24094772338867188, 0.25331878662109375, 0.2656898498535156, 0.2780609130859375, 0.2904319763183594, 0.30280303955078125, 0.3151741027832031, 0.327545166015625, 0.3399162292480469, 0.35228729248046875, 0.3646583557128906, 0.3770294189453125, 0.3894004821777344, 0.40177154541015625, 0.4141426086425781, 0.426513671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 5.0, 7.0, 6.0, 10.0, 12.0, 30.0, 32.0, 39.0, 57.0, 64.0, 114.0, 102.0, 107.0, 110.0, 73.0, 48.0, 35.0, 40.0, 24.0, 25.0, 9.0, 9.0, 8.0, 5.0, 2.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1630859375, -0.15728187561035156, -0.15147781372070312, -0.1456737518310547, -0.13986968994140625, -0.1340656280517578, -0.12826156616210938, -0.12245750427246094, -0.1166534423828125, -0.11084938049316406, -0.10504531860351562, -0.09924125671386719, -0.09343719482421875, -0.08763313293457031, -0.08182907104492188, -0.07602500915527344, -0.070220947265625, -0.06441688537597656, -0.058612823486328125, -0.05280876159667969, -0.04700469970703125, -0.04120063781738281, -0.035396575927734375, -0.029592514038085938, -0.0237884521484375, -0.017984390258789062, -0.012180328369140625, -0.0063762664794921875, -0.00057220458984375, 0.0052318572998046875, 0.011035919189453125, 0.016839981079101562, 0.02264404296875, 0.028448104858398438, 0.034252166748046875, 0.04005622863769531, 0.04586029052734375, 0.05166435241699219, 0.057468414306640625, 0.06327247619628906, 0.0690765380859375, 0.07488059997558594, 0.08068466186523438, 0.08648872375488281, 0.09229278564453125, 0.09809684753417969, 0.10390090942382812, 0.10970497131347656, 0.115509033203125, 0.12131309509277344, 0.12711715698242188, 0.1329212188720703, 0.13872528076171875, 0.1445293426513672, 0.15033340454101562, 0.15613746643066406, 0.1619415283203125, 0.16774559020996094, 0.17354965209960938, 0.1793537139892578, 0.18515777587890625, 0.1909618377685547, 0.19676589965820312, 0.20256996154785156, 0.2083740234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 5.0, 10.0, 25.0, 72.0, 201.0, 372.0, 188.0, 72.0, 32.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2419800758361816, -2.0755553245544434, -1.9091308116912842, -1.742706060409546, -1.5762814283370972, -1.4098567962646484, -1.2434320449829102, -1.0770074129104614, -0.9105827808380127, -0.744158148765564, -0.5777334570884705, -0.41130879521369934, -0.24488413333892822, -0.07845950126647949, 0.08796519041061401, 0.2543898820877075, 0.42081451416015625, 0.587239146232605, 0.7536638379096985, 0.920088529586792, 1.0865131616592407, 1.2529377937316895, 1.4193625450134277, 1.5857871770858765, 1.7522118091583252, 1.918636441230774, 2.0850610733032227, 2.251485824584961, 2.417910575866699, 2.5843350887298584, 2.7507598400115967, 2.917184352874756, 3.0836095809936523, 3.2500343322753906, 3.41645884513855, 3.582883596420288, 3.7493081092834473, 3.9157328605651855, 4.082157611846924, 4.248582363128662, 4.415006637573242, 4.5814313888549805, 4.747856140136719, 4.914280414581299, 5.080705165863037, 5.247129917144775, 5.413554668426514, 5.579979419708252, 5.74640417098999, 5.9128289222717285, 6.079253673553467, 6.245677947998047, 6.412102699279785, 6.578527450561523, 6.744952201843262, 6.911376953125, 7.077801704406738, 7.244226455688477, 7.410651206970215, 7.577075481414795, 7.743500232696533, 7.9099249839782715, 8.076349258422852, 8.24277400970459, 8.409198760986328]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 7.0, 12.0, 7.0, 15.0, 12.0, 22.0, 31.0, 30.0, 38.0, 39.0, 41.0, 54.0, 59.0, 57.0, 65.0, 58.0, 67.0, 69.0, 46.0, 46.0, 40.0, 34.0, 39.0, 32.0, 10.0, 22.0, 7.0, 15.0, 6.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0954370498657227, -2.0118963718414307, -1.9283556938171387, -1.8448150157928467, -1.7612743377685547, -1.6777336597442627, -1.5941928625106812, -1.5106521844863892, -1.4271115064620972, -1.3435708284378052, -1.2600301504135132, -1.1764893531799316, -1.0929486751556396, -1.0094079971313477, -0.9258673191070557, -0.8423266410827637, -0.7587859630584717, -0.6752452850341797, -0.5917046070098877, -0.5081638693809509, -0.42462319135665894, -0.34108251333236694, -0.2575417757034302, -0.17400109767913818, -0.09046041965484619, -0.006919726729393005, 0.07662096619606018, 0.16016167402267456, 0.24370235204696655, 0.32724303007125854, 0.4107837677001953, 0.4943244457244873, 0.5778648853302002, 0.6614055633544922, 0.7449462413787842, 0.828486979007721, 0.9120276570320129, 0.9955683350563049, 1.0791090726852417, 1.1626497507095337, 1.2461904287338257, 1.3297311067581177, 1.4132717847824097, 1.4968125820159912, 1.5803532600402832, 1.6638939380645752, 1.7474346160888672, 1.8309752941131592, 1.9145159721374512, 1.9980566501617432, 2.081597328186035, 2.165138006210327, 2.248678684234619, 2.332219362258911, 2.415760040283203, 2.499300956726074, 2.582841396331787, 2.666382074356079, 2.749922752380371, 2.833463430404663, 2.917004108428955, 3.000544786453247, 3.084085464477539, 3.16762638092041, 3.251167058944702]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 5.0, 13.0, 24.0, 43.0, 62.0, 154.0, 301.0, 840.0, 3186.0, 34689.0, 4122045.0, 28603.0, 2912.0, 755.0, 311.0, 131.0, 78.0, 43.0, 23.0, 16.0, 12.0, 8.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.42218017578125, -2.3306884765625, -2.23919677734375, -2.147705078125, -2.05621337890625, -1.9647216796875, -1.87322998046875, -1.78173828125, -1.69024658203125, -1.5987548828125, -1.50726318359375, -1.415771484375, -1.32427978515625, -1.2327880859375, -1.14129638671875, -1.0498046875, -0.95831298828125, -0.8668212890625, -0.77532958984375, -0.683837890625, -0.59234619140625, -0.5008544921875, -0.40936279296875, -0.31787109375, -0.22637939453125, -0.1348876953125, -0.04339599609375, 0.048095703125, 0.13958740234375, 0.2310791015625, 0.32257080078125, 0.4140625, 0.50555419921875, 0.5970458984375, 0.68853759765625, 0.780029296875, 0.87152099609375, 0.9630126953125, 1.05450439453125, 1.14599609375, 1.23748779296875, 1.3289794921875, 1.42047119140625, 1.511962890625, 1.60345458984375, 1.6949462890625, 1.78643798828125, 1.8779296875, 1.96942138671875, 2.0609130859375, 2.15240478515625, 2.243896484375, 2.33538818359375, 2.4268798828125, 2.51837158203125, 2.60986328125, 2.70135498046875, 2.7928466796875, 2.88433837890625, 2.975830078125, 3.06732177734375, 3.1588134765625, 3.25030517578125, 3.341796875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 3.0, 2.0, 6.0, 10.0, 14.0, 20.0, 14.0, 39.0, 51.0, 76.0, 100.0, 105.0, 120.0, 99.0, 95.0, 61.0, 55.0, 47.0, 25.0, 22.0, 7.0, 11.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0943603515625, -0.0910482406616211, -0.08773612976074219, -0.08442401885986328, -0.08111190795898438, -0.07779979705810547, -0.07448768615722656, -0.07117557525634766, -0.06786346435546875, -0.06455135345458984, -0.06123924255371094, -0.05792713165283203, -0.054615020751953125, -0.05130290985107422, -0.04799079895019531, -0.044678688049316406, -0.0413665771484375, -0.038054466247558594, -0.03474235534667969, -0.03143024444580078, -0.028118133544921875, -0.02480602264404297, -0.021493911743164062, -0.018181800842285156, -0.01486968994140625, -0.011557579040527344, -0.008245468139648438, -0.004933357238769531, -0.001621246337890625, 0.0016908645629882812, 0.0050029754638671875, 0.008315086364746094, 0.011627197265625, 0.014939308166503906, 0.018251419067382812, 0.02156352996826172, 0.024875640869140625, 0.02818775177001953, 0.03149986267089844, 0.034811973571777344, 0.03812408447265625, 0.041436195373535156, 0.04474830627441406, 0.04806041717529297, 0.051372528076171875, 0.05468463897705078, 0.05799674987792969, 0.061308860778808594, 0.0646209716796875, 0.0679330825805664, 0.07124519348144531, 0.07455730438232422, 0.07786941528320312, 0.08118152618408203, 0.08449363708496094, 0.08780574798583984, 0.09111785888671875, 0.09442996978759766, 0.09774208068847656, 0.10105419158935547, 0.10436630249023438, 0.10767841339111328, 0.11099052429199219, 0.1143026351928711, 0.11761474609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 11.0, 12.0, 12.0, 25.0, 13.0, 26.0, 36.0, 51.0, 41.0, 60.0, 61.0, 74.0, 111.0, 162.0, 311.0, 1042.0, 8540.0, 724552.0, 3445179.0, 11940.0, 1128.0, 323.0, 132.0, 101.0, 79.0, 62.0, 42.0, 32.0, 31.0, 18.0, 19.0, 18.0, 15.0, 6.0, 10.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.38714599609375, -1.3270263671875, -1.26690673828125, -1.206787109375, -1.14666748046875, -1.0865478515625, -1.02642822265625, -0.96630859375, -0.90618896484375, -0.8460693359375, -0.78594970703125, -0.725830078125, -0.66571044921875, -0.6055908203125, -0.54547119140625, -0.4853515625, -0.42523193359375, -0.3651123046875, -0.30499267578125, -0.244873046875, -0.18475341796875, -0.1246337890625, -0.06451416015625, -0.00439453125, 0.05572509765625, 0.1158447265625, 0.17596435546875, 0.236083984375, 0.29620361328125, 0.3563232421875, 0.41644287109375, 0.4765625, 0.53668212890625, 0.5968017578125, 0.65692138671875, 0.717041015625, 0.77716064453125, 0.8372802734375, 0.89739990234375, 0.95751953125, 1.01763916015625, 1.0777587890625, 1.13787841796875, 1.197998046875, 1.25811767578125, 1.3182373046875, 1.37835693359375, 1.4384765625, 1.49859619140625, 1.5587158203125, 1.61883544921875, 1.678955078125, 1.73907470703125, 1.7991943359375, 1.85931396484375, 1.91943359375, 1.97955322265625, 2.0396728515625, 2.09979248046875, 2.159912109375, 2.22003173828125, 2.2801513671875, 2.34027099609375, 2.400390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 9.0, 12.0, 25.0, 21.0, 55.0, 71.0, 185.0, 445.0, 2087.0, 751.0, 206.0, 97.0, 50.0, 29.0, 20.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.37094688415527344, -0.3622550964355469, -0.3535633087158203, -0.34487152099609375, -0.3361797332763672, -0.3274879455566406, -0.31879615783691406, -0.3101043701171875, -0.30141258239746094, -0.2927207946777344, -0.2840290069580078, -0.27533721923828125, -0.2666454315185547, -0.2579536437988281, -0.24926185607910156, -0.240570068359375, -0.23187828063964844, -0.22318649291992188, -0.2144947052001953, -0.20580291748046875, -0.1971111297607422, -0.18841934204101562, -0.17972755432128906, -0.1710357666015625, -0.16234397888183594, -0.15365219116210938, -0.1449604034423828, -0.13626861572265625, -0.1275768280029297, -0.11888504028320312, -0.11019325256347656, -0.10150146484375, -0.09280967712402344, -0.08411788940429688, -0.07542610168457031, -0.06673431396484375, -0.05804252624511719, -0.049350738525390625, -0.04065895080566406, -0.0319671630859375, -0.023275375366210938, -0.014583587646484375, -0.0058917999267578125, 0.00279998779296875, 0.011491775512695312, 0.020183563232421875, 0.028875350952148438, 0.037567138671875, 0.04625892639160156, 0.054950714111328125, 0.06364250183105469, 0.07233428955078125, 0.08102607727050781, 0.08971786499023438, 0.09840965270996094, 0.1071014404296875, 0.11579322814941406, 0.12448501586914062, 0.1331768035888672, 0.14186859130859375, 0.1505603790283203, 0.15925216674804688, 0.16794395446777344, 0.1766357421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 10.0, 10.0, 27.0, 45.0, 89.0, 202.0, 257.0, 191.0, 85.0, 44.0, 17.0, 12.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3537534475326538, -1.2986661195755005, -1.2435786724090576, -1.1884913444519043, -1.133404016494751, -1.0783166885375977, -1.0232293605804443, -0.9681419134140015, -0.9130545854568481, -0.8579672574996948, -0.8028798699378967, -0.7477924823760986, -0.6927051544189453, -0.637617826461792, -0.5825304388999939, -0.5274430513381958, -0.4723557233810425, -0.4172683656215668, -0.36218100786209106, -0.30709365010261536, -0.25200629234313965, -0.19691893458366394, -0.14183157682418823, -0.08674421906471252, -0.031656861305236816, 0.02343049645423889, 0.0785178542137146, 0.1336052119731903, 0.18869256973266602, 0.24377992749214172, 0.29886728525161743, 0.35395464301109314, 0.4090421199798584, 0.4641294777393341, 0.5192168354988098, 0.5743042230606079, 0.6293915510177612, 0.6844788789749146, 0.7395662665367126, 0.7946536540985107, 0.8497409820556641, 0.9048283100128174, 0.9599156975746155, 1.0150030851364136, 1.070090413093567, 1.1251777410507202, 1.180265188217163, 1.2353525161743164, 1.2904398441314697, 1.345527172088623, 1.4006145000457764, 1.4557019472122192, 1.5107892751693726, 1.5658766031265259, 1.6209640502929688, 1.676051378250122, 1.7311387062072754, 1.7862260341644287, 1.841313362121582, 1.896400809288025, 1.9514881372451782, 2.006575584411621, 2.0616629123687744, 2.1167502403259277, 2.171837568283081]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 15.0, 28.0, 29.0, 41.0, 46.0, 73.0, 78.0, 78.0, 90.0, 74.0, 79.0, 72.0, 69.0, 59.0, 45.0, 27.0, 23.0, 23.0, 22.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1259791851043701, -1.0930366516113281, -1.0600941181182861, -1.0271515846252441, -0.9942091107368469, -0.9612666368484497, -0.9283241033554077, -0.8953815698623657, -0.8624390363693237, -0.8294965028762817, -0.7965540289878845, -0.7636114954948425, -0.7306689620018005, -0.6977264881134033, -0.6647839546203613, -0.6318414211273193, -0.5988989472389221, -0.5659564137458801, -0.5330139398574829, -0.5000714063644409, -0.4671288728713989, -0.4341863691806793, -0.4012438654899597, -0.3683013319969177, -0.3353588283061981, -0.3024163246154785, -0.2694737911224365, -0.23653128743171692, -0.20358876883983612, -0.17064625024795532, -0.13770374655723572, -0.10476122796535492, -0.0718187689781189, -0.0388762541115284, -0.005933739244937897, 0.027008771896362305, 0.0599512904882431, 0.0928938090801239, 0.1258363127708435, 0.1587788313627243, 0.1917213499546051, 0.2246638685464859, 0.2576063871383667, 0.2905488908290863, 0.3234913945198059, 0.3564339280128479, 0.3893764317035675, 0.4223189353942871, 0.4552614688873291, 0.4882039725780487, 0.5211464762687683, 0.5540890097618103, 0.5870315432548523, 0.6199740171432495, 0.6529165506362915, 0.6858590841293335, 0.7188016176223755, 0.7517441511154175, 0.7846866250038147, 0.8176291584968567, 0.8505716919898987, 0.8835141658782959, 0.9164566993713379, 0.9493992328643799, 0.9823417067527771]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 5.0, 12.0, 17.0, 17.0, 31.0, 46.0, 72.0, 99.0, 165.0, 366.0, 636.0, 1169.0, 2429.0, 5722.0, 17868.0, 93473.0, 625760.0, 250032.0, 34666.0, 8911.0, 3410.0, 1693.0, 845.0, 469.0, 219.0, 148.0, 87.0, 62.0, 35.0, 26.0, 16.0, 14.0, 6.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67822265625, -0.6568450927734375, -0.635467529296875, -0.6140899658203125, -0.59271240234375, -0.5713348388671875, -0.549957275390625, -0.5285797119140625, -0.5072021484375, -0.4858245849609375, -0.464447021484375, -0.4430694580078125, -0.42169189453125, -0.4003143310546875, -0.378936767578125, -0.3575592041015625, -0.336181640625, -0.3148040771484375, -0.293426513671875, -0.2720489501953125, -0.25067138671875, -0.2292938232421875, -0.207916259765625, -0.1865386962890625, -0.1651611328125, -0.1437835693359375, -0.122406005859375, -0.1010284423828125, -0.07965087890625, -0.0582733154296875, -0.036895751953125, -0.0155181884765625, 0.005859375, 0.0272369384765625, 0.048614501953125, 0.0699920654296875, 0.09136962890625, 0.1127471923828125, 0.134124755859375, 0.1555023193359375, 0.1768798828125, 0.1982574462890625, 0.219635009765625, 0.2410125732421875, 0.26239013671875, 0.2837677001953125, 0.305145263671875, 0.3265228271484375, 0.347900390625, 0.3692779541015625, 0.390655517578125, 0.4120330810546875, 0.43341064453125, 0.4547882080078125, 0.476165771484375, 0.4975433349609375, 0.5189208984375, 0.5402984619140625, 0.561676025390625, 0.5830535888671875, 0.60443115234375, 0.6258087158203125, 0.647186279296875, 0.6685638427734375, 0.68994140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 4.0, 3.0, 6.0, 3.0, 7.0, 14.0, 33.0, 37.0, 47.0, 69.0, 78.0, 104.0, 117.0, 105.0, 109.0, 79.0, 64.0, 27.0, 26.0, 21.0, 16.0, 9.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.090576171875, -0.08719062805175781, -0.08380508422851562, -0.08041954040527344, -0.07703399658203125, -0.07364845275878906, -0.07026290893554688, -0.06687736511230469, -0.0634918212890625, -0.06010627746582031, -0.056720733642578125, -0.05333518981933594, -0.04994964599609375, -0.04656410217285156, -0.043178558349609375, -0.03979301452636719, -0.036407470703125, -0.03302192687988281, -0.029636383056640625, -0.026250839233398438, -0.02286529541015625, -0.019479751586914062, -0.016094207763671875, -0.012708663940429688, -0.0093231201171875, -0.0059375762939453125, -0.002552032470703125, 0.0008335113525390625, 0.00421905517578125, 0.0076045989990234375, 0.010990142822265625, 0.014375686645507812, 0.01776123046875, 0.021146774291992188, 0.024532318115234375, 0.027917861938476562, 0.03130340576171875, 0.03468894958496094, 0.038074493408203125, 0.04146003723144531, 0.0448455810546875, 0.04823112487792969, 0.051616668701171875, 0.05500221252441406, 0.05838775634765625, 0.06177330017089844, 0.06515884399414062, 0.06854438781738281, 0.071929931640625, 0.07531547546386719, 0.07870101928710938, 0.08208656311035156, 0.08547210693359375, 0.08885765075683594, 0.09224319458007812, 0.09562873840332031, 0.0990142822265625, 0.10239982604980469, 0.10578536987304688, 0.10917091369628906, 0.11255645751953125, 0.11594200134277344, 0.11932754516601562, 0.12271308898925781, 0.1260986328125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 15.0, 10.0, 24.0, 34.0, 35.0, 47.0, 67.0, 92.0, 118.0, 165.0, 204.0, 345.0, 521.0, 855.0, 1624.0, 3301.0, 7059.0, 16339.0, 39904.0, 112504.0, 350768.0, 337833.0, 108178.0, 38264.0, 15774.0, 7020.0, 3256.0, 1659.0, 897.0, 488.0, 325.0, 202.0, 136.0, 96.0, 87.0, 73.0, 51.0, 44.0, 22.0, 30.0, 17.0, 23.0, 8.0, 7.0, 4.0, 2.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3544921875, -0.3426666259765625, -0.330841064453125, -0.3190155029296875, -0.30718994140625, -0.2953643798828125, -0.283538818359375, -0.2717132568359375, -0.2598876953125, -0.2480621337890625, -0.236236572265625, -0.2244110107421875, -0.21258544921875, -0.2007598876953125, -0.188934326171875, -0.1771087646484375, -0.165283203125, -0.1534576416015625, -0.141632080078125, -0.1298065185546875, -0.11798095703125, -0.1061553955078125, -0.094329833984375, -0.0825042724609375, -0.0706787109375, -0.0588531494140625, -0.047027587890625, -0.0352020263671875, -0.02337646484375, -0.0115509033203125, 0.000274658203125, 0.0121002197265625, 0.02392578125, 0.0357513427734375, 0.047576904296875, 0.0594024658203125, 0.07122802734375, 0.0830535888671875, 0.094879150390625, 0.1067047119140625, 0.1185302734375, 0.1303558349609375, 0.142181396484375, 0.1540069580078125, 0.16583251953125, 0.1776580810546875, 0.189483642578125, 0.2013092041015625, 0.213134765625, 0.2249603271484375, 0.236785888671875, 0.2486114501953125, 0.26043701171875, 0.2722625732421875, 0.284088134765625, 0.2959136962890625, 0.3077392578125, 0.3195648193359375, 0.331390380859375, 0.3432159423828125, 0.35504150390625, 0.3668670654296875, 0.378692626953125, 0.3905181884765625, 0.40234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 10.0, 2.0, 9.0, 5.0, 14.0, 15.0, 10.0, 17.0, 16.0, 28.0, 24.0, 24.0, 31.0, 22.0, 30.0, 30.0, 42.0, 39.0, 33.0, 38.0, 49.0, 24.0, 38.0, 49.0, 39.0, 28.0, 38.0, 46.0, 28.0, 36.0, 25.0, 23.0, 17.0, 21.0, 17.0, 16.0, 9.0, 16.0, 8.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.2936210632324219, -0.28353118896484375, -0.2734413146972656, -0.2633514404296875, -0.2532615661621094, -0.24317169189453125, -0.23308181762695312, -0.222991943359375, -0.21290206909179688, -0.20281219482421875, -0.19272232055664062, -0.1826324462890625, -0.17254257202148438, -0.16245269775390625, -0.15236282348632812, -0.14227294921875, -0.13218307495117188, -0.12209320068359375, -0.11200332641601562, -0.1019134521484375, -0.09182357788085938, -0.08173370361328125, -0.07164382934570312, -0.061553955078125, -0.051464080810546875, -0.04137420654296875, -0.031284332275390625, -0.0211944580078125, -0.011104583740234375, -0.00101470947265625, 0.009075164794921875, 0.0191650390625, 0.029254913330078125, 0.03934478759765625, 0.049434661865234375, 0.0595245361328125, 0.06961441040039062, 0.07970428466796875, 0.08979415893554688, 0.099884033203125, 0.10997390747070312, 0.12006378173828125, 0.13015365600585938, 0.1402435302734375, 0.15033340454101562, 0.16042327880859375, 0.17051315307617188, 0.18060302734375, 0.19069290161132812, 0.20078277587890625, 0.21087265014648438, 0.2209625244140625, 0.23105239868164062, 0.24114227294921875, 0.2512321472167969, 0.261322021484375, 0.2714118957519531, 0.28150177001953125, 0.2915916442871094, 0.3016815185546875, 0.3117713928222656, 0.32186126708984375, 0.3319511413574219, 0.342041015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 5.0, 13.0, 22.0, 33.0, 64.0, 116.0, 255.0, 675.0, 2110.0, 11396.0, 257863.0, 745688.0, 25195.0, 3502.0, 905.0, 346.0, 149.0, 80.0, 41.0, 21.0, 27.0, 6.0, 10.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.734375, -0.7151336669921875, -0.695892333984375, -0.6766510009765625, -0.65740966796875, -0.6381683349609375, -0.618927001953125, -0.5996856689453125, -0.5804443359375, -0.5612030029296875, -0.541961669921875, -0.5227203369140625, -0.50347900390625, -0.4842376708984375, -0.464996337890625, -0.4457550048828125, -0.426513671875, -0.4072723388671875, -0.388031005859375, -0.3687896728515625, -0.34954833984375, -0.3303070068359375, -0.311065673828125, -0.2918243408203125, -0.2725830078125, -0.2533416748046875, -0.234100341796875, -0.2148590087890625, -0.19561767578125, -0.1763763427734375, -0.157135009765625, -0.1378936767578125, -0.11865234375, -0.0994110107421875, -0.080169677734375, -0.0609283447265625, -0.04168701171875, -0.0224456787109375, -0.003204345703125, 0.0160369873046875, 0.0352783203125, 0.0545196533203125, 0.073760986328125, 0.0930023193359375, 0.11224365234375, 0.1314849853515625, 0.150726318359375, 0.1699676513671875, 0.189208984375, 0.2084503173828125, 0.227691650390625, 0.2469329833984375, 0.26617431640625, 0.2854156494140625, 0.304656982421875, 0.3238983154296875, 0.3431396484375, 0.3623809814453125, 0.381622314453125, 0.4008636474609375, 0.42010498046875, 0.4393463134765625, 0.458587646484375, 0.4778289794921875, 0.4970703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 10.0, 19.0, 23.0, 26.0, 36.0, 51.0, 45.0, 67.0, 68.0, 102.0, 89.0, 70.0, 73.0, 68.0, 64.0, 49.0, 22.0, 23.0, 22.0, 16.0, 7.0, 12.0, 4.0, 6.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.9664249420166016e-05, -5.8108940720558167e-05, -5.655363202095032e-05, -5.499832332134247e-05, -5.344301462173462e-05, -5.188770592212677e-05, -5.033239722251892e-05, -4.877708852291107e-05, -4.722177982330322e-05, -4.5666471123695374e-05, -4.4111162424087524e-05, -4.2555853724479675e-05, -4.1000545024871826e-05, -3.944523632526398e-05, -3.788992762565613e-05, -3.633461892604828e-05, -3.477931022644043e-05, -3.322400152683258e-05, -3.166869282722473e-05, -3.0113384127616882e-05, -2.8558075428009033e-05, -2.7002766728401184e-05, -2.5447458028793335e-05, -2.3892149329185486e-05, -2.2336840629577637e-05, -2.0781531929969788e-05, -1.922622323036194e-05, -1.767091453075409e-05, -1.611560583114624e-05, -1.4560297131538391e-05, -1.3004988431930542e-05, -1.1449679732322693e-05, -9.894371032714844e-06, -8.339062333106995e-06, -6.7837536334991455e-06, -5.228444933891296e-06, -3.6731362342834473e-06, -2.117827534675598e-06, -5.62518835067749e-07, 9.927898645401e-07, 2.5480985641479492e-06, 4.103407263755798e-06, 5.6587159633636475e-06, 7.214024662971497e-06, 8.769333362579346e-06, 1.0324642062187195e-05, 1.1879950761795044e-05, 1.3435259461402893e-05, 1.4990568161010742e-05, 1.654587686061859e-05, 1.810118556022644e-05, 1.965649425983429e-05, 2.121180295944214e-05, 2.2767111659049988e-05, 2.4322420358657837e-05, 2.5877729058265686e-05, 2.7433037757873535e-05, 2.8988346457481384e-05, 3.0543655157089233e-05, 3.209896385669708e-05, 3.365427255630493e-05, 3.520958125591278e-05, 3.676488995552063e-05, 3.832019865512848e-05, 3.987550735473633e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 10.0, 15.0, 10.0, 20.0, 43.0, 66.0, 69.0, 118.0, 161.0, 287.0, 471.0, 859.0, 1707.0, 3683.0, 9472.0, 32239.0, 169200.0, 567447.0, 206455.0, 37342.0, 10441.0, 4132.0, 1910.0, 1025.0, 534.0, 306.0, 193.0, 108.0, 67.0, 36.0, 32.0, 28.0, 15.0, 12.0, 15.0, 5.0, 4.0, 2.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.2851524353027344, -0.27611541748046875, -0.2670783996582031, -0.2580413818359375, -0.24900436401367188, -0.23996734619140625, -0.23093032836914062, -0.221893310546875, -0.21285629272460938, -0.20381927490234375, -0.19478225708007812, -0.1857452392578125, -0.17670822143554688, -0.16767120361328125, -0.15863418579101562, -0.14959716796875, -0.14056015014648438, -0.13152313232421875, -0.12248611450195312, -0.1134490966796875, -0.10441207885742188, -0.09537506103515625, -0.08633804321289062, -0.077301025390625, -0.06826400756835938, -0.05922698974609375, -0.050189971923828125, -0.0411529541015625, -0.032115936279296875, -0.02307891845703125, -0.014041900634765625, -0.0050048828125, 0.004032135009765625, 0.01306915283203125, 0.022106170654296875, 0.0311431884765625, 0.040180206298828125, 0.04921722412109375, 0.058254241943359375, 0.067291259765625, 0.07632827758789062, 0.08536529541015625, 0.09440231323242188, 0.1034393310546875, 0.11247634887695312, 0.12151336669921875, 0.13055038452148438, 0.13958740234375, 0.14862442016601562, 0.15766143798828125, 0.16669845581054688, 0.1757354736328125, 0.18477249145507812, 0.19380950927734375, 0.20284652709960938, 0.211883544921875, 0.22092056274414062, 0.22995758056640625, 0.23899459838867188, 0.2480316162109375, 0.2570686340332031, 0.26610565185546875, 0.2751426696777344, 0.2841796875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 13.0, 14.0, 20.0, 33.0, 37.0, 55.0, 61.0, 81.0, 92.0, 103.0, 93.0, 92.0, 56.0, 70.0, 57.0, 30.0, 23.0, 18.0, 14.0, 10.0, 0.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22776031494140625, -0.2213897705078125, -0.21501922607421875, -0.208648681640625, -0.20227813720703125, -0.1959075927734375, -0.18953704833984375, -0.18316650390625, -0.17679595947265625, -0.1704254150390625, -0.16405487060546875, -0.157684326171875, -0.15131378173828125, -0.1449432373046875, -0.13857269287109375, -0.1322021484375, -0.12583160400390625, -0.1194610595703125, -0.11309051513671875, -0.106719970703125, -0.10034942626953125, -0.0939788818359375, -0.08760833740234375, -0.08123779296875, -0.07486724853515625, -0.0684967041015625, -0.06212615966796875, -0.055755615234375, -0.04938507080078125, -0.0430145263671875, -0.03664398193359375, -0.0302734375, -0.02390289306640625, -0.0175323486328125, -0.01116180419921875, -0.004791259765625, 0.00157928466796875, 0.0079498291015625, 0.01432037353515625, 0.02069091796875, 0.02706146240234375, 0.0334320068359375, 0.03980255126953125, 0.046173095703125, 0.05254364013671875, 0.0589141845703125, 0.06528472900390625, 0.0716552734375, 0.07802581787109375, 0.0843963623046875, 0.09076690673828125, 0.097137451171875, 0.10350799560546875, 0.1098785400390625, 0.11624908447265625, 0.12261962890625, 0.12899017333984375, 0.1353607177734375, 0.14173126220703125, 0.148101806640625, 0.15447235107421875, 0.1608428955078125, 0.16721343994140625, 0.173583984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 7.0, 32.0, 125.0, 360.0, 324.0, 105.0, 27.0, 15.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.488159656524658, -2.258094072341919, -2.0280284881591797, -1.7979629039764404, -1.5678973197937012, -1.337831735610962, -1.1077661514282227, -0.8777005672454834, -0.6476349830627441, -0.4175693988800049, -0.18750381469726562, 0.04256176948547363, 0.2726273536682129, 0.5026929378509521, 0.7327585220336914, 0.9628241062164307, 1.19288969039917, 1.4229552745819092, 1.6530208587646484, 1.8830864429473877, 2.113152027130127, 2.343217611312866, 2.5732831954956055, 2.8033487796783447, 3.033414363861084, 3.2634799480438232, 3.4935455322265625, 3.7236111164093018, 3.953676700592041, 4.183742523193359, 4.4138078689575195, 4.64387321472168, 4.873939514160156, 5.104004859924316, 5.334070682525635, 5.564136505126953, 5.794201850891113, 6.024267196655273, 6.254333019256592, 6.48439884185791, 6.71446418762207, 6.9445295333862305, 7.174595355987549, 7.404661178588867, 7.634726524353027, 7.8647918701171875, 8.094858169555664, 8.324923515319824, 8.554988861083984, 8.785054206848145, 9.015119552612305, 9.245185852050781, 9.475251197814941, 9.705316543579102, 9.935382843017578, 10.165448188781738, 10.395513534545898, 10.625578880310059, 10.855644226074219, 11.085710525512695, 11.315775871276855, 11.545841217041016, 11.775907516479492, 12.005972862243652, 12.236038208007812]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 12.0, 12.0, 13.0, 18.0, 31.0, 31.0, 41.0, 29.0, 49.0, 43.0, 46.0, 60.0, 48.0, 55.0, 52.0, 47.0, 61.0, 55.0, 37.0, 41.0, 31.0, 26.0, 24.0, 22.0, 18.0, 22.0, 17.0, 10.0, 10.0, 10.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.617994785308838, -2.533951997756958, -2.4499094486236572, -2.3658666610717773, -2.2818241119384766, -2.1977813243865967, -2.113738536834717, -2.029695987701416, -1.9456533193588257, -1.8616106510162354, -1.777567982673645, -1.6935253143310547, -1.6094825267791748, -1.525439977645874, -1.4413971900939941, -1.3573545217514038, -1.2733118534088135, -1.1892691850662231, -1.1052265167236328, -1.021183729171753, -0.9371411204338074, -0.853098452091217, -0.7690557241439819, -0.6850130558013916, -0.6009703874588013, -0.5169277191162109, -0.4328850209712982, -0.3488423228263855, -0.26479965448379517, -0.18075698614120483, -0.09671425819396973, -0.012671589851379395, 0.07137084007263184, 0.15541352331638336, 0.2394562065601349, 0.3234989047050476, 0.40754157304763794, 0.49158424139022827, 0.5756269693374634, 0.6596696376800537, 0.743712306022644, 0.8277549743652344, 0.9117976427078247, 0.9958403706550598, 1.079883098602295, 1.1639256477355957, 1.2479684352874756, 1.332011103630066, 1.4160537719726562, 1.5000964403152466, 1.584139108657837, 1.6681818962097168, 1.7522244453430176, 1.8362672328948975, 1.9203099012374878, 2.004352569580078, 2.088395118713379, 2.172437906265259, 2.2564804553985596, 2.3405232429504395, 2.4245657920837402, 2.50860857963562, 2.5926513671875, 2.676693916320801, 2.7607367038726807]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 6.0, 10.0, 13.0, 29.0, 39.0, 64.0, 80.0, 177.0, 320.0, 485.0, 1058.0, 2339.0, 6319.0, 21350.0, 123462.0, 3774766.0, 219644.0, 29859.0, 8180.0, 2956.0, 1331.0, 696.0, 396.0, 237.0, 146.0, 92.0, 71.0, 52.0, 27.0, 13.0, 11.0, 8.0, 12.0, 7.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67724609375, -0.6458969116210938, -0.6145477294921875, -0.5831985473632812, -0.551849365234375, -0.5205001831054688, -0.4891510009765625, -0.45780181884765625, -0.42645263671875, -0.39510345458984375, -0.3637542724609375, -0.33240509033203125, -0.301055908203125, -0.26970672607421875, -0.2383575439453125, -0.20700836181640625, -0.1756591796875, -0.14430999755859375, -0.1129608154296875, -0.08161163330078125, -0.050262451171875, -0.01891326904296875, 0.0124359130859375, 0.04378509521484375, 0.07513427734375, 0.10648345947265625, 0.1378326416015625, 0.16918182373046875, 0.200531005859375, 0.23188018798828125, 0.2632293701171875, 0.29457855224609375, 0.325927734375, 0.35727691650390625, 0.3886260986328125, 0.41997528076171875, 0.451324462890625, 0.48267364501953125, 0.5140228271484375, 0.5453720092773438, 0.57672119140625, 0.6080703735351562, 0.6394195556640625, 0.6707687377929688, 0.702117919921875, 0.7334671020507812, 0.7648162841796875, 0.7961654663085938, 0.8275146484375, 0.8588638305664062, 0.8902130126953125, 0.9215621948242188, 0.952911376953125, 0.9842605590820312, 1.0156097412109375, 1.0469589233398438, 1.07830810546875, 1.1096572875976562, 1.1410064697265625, 1.1723556518554688, 1.203704833984375, 1.2350540161132812, 1.2664031982421875, 1.2977523803710938, 1.3291015625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 6.0, 6.0, 8.0, 9.0, 16.0, 15.0, 27.0, 30.0, 41.0, 43.0, 74.0, 66.0, 70.0, 64.0, 74.0, 67.0, 73.0, 68.0, 52.0, 42.0, 25.0, 29.0, 19.0, 15.0, 16.0, 6.0, 6.0, 7.0, 10.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07427978515625, -0.07119560241699219, -0.06811141967773438, -0.06502723693847656, -0.06194305419921875, -0.05885887145996094, -0.055774688720703125, -0.05269050598144531, -0.0496063232421875, -0.04652214050292969, -0.043437957763671875, -0.04035377502441406, -0.03726959228515625, -0.03418540954589844, -0.031101226806640625, -0.028017044067382812, -0.024932861328125, -0.021848678588867188, -0.018764495849609375, -0.015680313110351562, -0.01259613037109375, -0.009511947631835938, -0.006427764892578125, -0.0033435821533203125, -0.0002593994140625, 0.0028247833251953125, 0.005908966064453125, 0.008993148803710938, 0.01207733154296875, 0.015161514282226562, 0.018245697021484375, 0.021329879760742188, 0.0244140625, 0.027498245239257812, 0.030582427978515625, 0.03366661071777344, 0.03675079345703125, 0.03983497619628906, 0.042919158935546875, 0.04600334167480469, 0.0490875244140625, 0.05217170715332031, 0.055255889892578125, 0.05834007263183594, 0.06142425537109375, 0.06450843811035156, 0.06759262084960938, 0.07067680358886719, 0.073760986328125, 0.07684516906738281, 0.07992935180664062, 0.08301353454589844, 0.08609771728515625, 0.08918190002441406, 0.09226608276367188, 0.09535026550292969, 0.0984344482421875, 0.10151863098144531, 0.10460281372070312, 0.10768699645996094, 0.11077117919921875, 0.11385536193847656, 0.11693954467773438, 0.12002372741699219, 0.12310791015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 3.0, 4.0, 5.0, 13.0, 19.0, 26.0, 46.0, 62.0, 101.0, 181.0, 277.0, 472.0, 916.0, 1604.0, 3281.0, 6496.0, 14737.0, 41521.0, 200077.0, 3391635.0, 432626.0, 62075.0, 20130.0, 8557.0, 4130.0, 2304.0, 1230.0, 701.0, 406.0, 244.0, 139.0, 86.0, 64.0, 39.0, 23.0, 13.0, 15.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5107421875, -0.4915771484375, -0.472412109375, -0.4532470703125, -0.43408203125, -0.4149169921875, -0.395751953125, -0.3765869140625, -0.357421875, -0.3382568359375, -0.319091796875, -0.2999267578125, -0.28076171875, -0.2615966796875, -0.242431640625, -0.2232666015625, -0.2041015625, -0.1849365234375, -0.165771484375, -0.1466064453125, -0.12744140625, -0.1082763671875, -0.089111328125, -0.0699462890625, -0.05078125, -0.0316162109375, -0.012451171875, 0.0067138671875, 0.02587890625, 0.0450439453125, 0.064208984375, 0.0833740234375, 0.1025390625, 0.1217041015625, 0.140869140625, 0.1600341796875, 0.17919921875, 0.1983642578125, 0.217529296875, 0.2366943359375, 0.255859375, 0.2750244140625, 0.294189453125, 0.3133544921875, 0.33251953125, 0.3516845703125, 0.370849609375, 0.3900146484375, 0.4091796875, 0.4283447265625, 0.447509765625, 0.4666748046875, 0.48583984375, 0.5050048828125, 0.524169921875, 0.5433349609375, 0.5625, 0.5816650390625, 0.600830078125, 0.6199951171875, 0.63916015625, 0.6583251953125, 0.677490234375, 0.6966552734375, 0.7158203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 8.0, 14.0, 10.0, 17.0, 21.0, 16.0, 31.0, 49.0, 62.0, 103.0, 147.0, 275.0, 733.0, 1375.0, 512.0, 242.0, 126.0, 71.0, 56.0, 53.0, 23.0, 25.0, 15.0, 8.0, 12.0, 13.0, 5.0, 7.0, 1.0, 5.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.1746826171875, -0.1697368621826172, -0.16479110717773438, -0.15984535217285156, -0.15489959716796875, -0.14995384216308594, -0.14500808715820312, -0.1400623321533203, -0.1351165771484375, -0.1301708221435547, -0.12522506713867188, -0.12027931213378906, -0.11533355712890625, -0.11038780212402344, -0.10544204711914062, -0.10049629211425781, -0.095550537109375, -0.09060478210449219, -0.08565902709960938, -0.08071327209472656, -0.07576751708984375, -0.07082176208496094, -0.06587600708007812, -0.06093025207519531, -0.0559844970703125, -0.05103874206542969, -0.046092987060546875, -0.04114723205566406, -0.03620147705078125, -0.03125572204589844, -0.026309967041015625, -0.021364212036132812, -0.01641845703125, -0.011472702026367188, -0.006526947021484375, -0.0015811920166015625, 0.00336456298828125, 0.008310317993164062, 0.013256072998046875, 0.018201828002929688, 0.0231475830078125, 0.028093338012695312, 0.033039093017578125, 0.03798484802246094, 0.04293060302734375, 0.04787635803222656, 0.052822113037109375, 0.05776786804199219, 0.062713623046875, 0.06765937805175781, 0.07260513305664062, 0.07755088806152344, 0.08249664306640625, 0.08744239807128906, 0.09238815307617188, 0.09733390808105469, 0.1022796630859375, 0.10722541809082031, 0.11217117309570312, 0.11711692810058594, 0.12206268310546875, 0.12700843811035156, 0.13195419311523438, 0.1368999481201172, 0.141845703125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 12.0, 16.0, 31.0, 63.0, 107.0, 181.0, 190.0, 138.0, 102.0, 58.0, 37.0, 19.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6106644868850708, -1.5675655603408813, -1.5244665145874023, -1.481367588043213, -1.4382685422897339, -1.3951696157455444, -1.3520705699920654, -1.308971643447876, -1.265872597694397, -1.2227736711502075, -1.1796746253967285, -1.136575698852539, -1.09347665309906, -1.0503777265548706, -1.0072786808013916, -0.9641797542572021, -0.9210807681083679, -0.8779817819595337, -0.8348827958106995, -0.7917838096618652, -0.748684823513031, -0.7055858373641968, -0.6624869108200073, -0.6193878650665283, -0.5762889385223389, -0.5331899523735046, -0.4900909662246704, -0.4469919800758362, -0.40389299392700195, -0.3607940077781677, -0.3176950514316559, -0.27459606528282166, -0.23149704933166504, -0.1883980631828308, -0.14529907703399658, -0.10220010578632355, -0.05910111963748932, -0.01600213348865509, 0.027096837759017944, 0.07019582390785217, 0.1132948100566864, 0.15639379620552063, 0.19949278235435486, 0.2425917536020279, 0.2856907248497009, 0.32878971099853516, 0.3718886971473694, 0.4149876832962036, 0.45808666944503784, 0.5011856555938721, 0.5442846417427063, 0.5873836278915405, 0.6304826140403748, 0.673581600189209, 0.7166805267333984, 0.7597795724868774, 0.8028784990310669, 0.8459774851799011, 0.8890764713287354, 0.9321754574775696, 0.9752744436264038, 1.0183733701705933, 1.0614724159240723, 1.1045713424682617, 1.1476703882217407]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 1.0, 3.0, 4.0, 4.0, 5.0, 11.0, 4.0, 18.0, 25.0, 17.0, 21.0, 31.0, 41.0, 35.0, 53.0, 52.0, 55.0, 47.0, 51.0, 77.0, 49.0, 55.0, 46.0, 55.0, 46.0, 46.0, 27.0, 31.0, 21.0, 18.0, 16.0, 13.0, 11.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.971295952796936, -0.9458733797073364, -0.9204508662223816, -0.895028293132782, -0.8696057796478271, -0.8441832065582275, -0.8187606930732727, -0.7933381199836731, -0.7679156064987183, -0.7424930334091187, -0.7170705199241638, -0.6916479468345642, -0.6662254333496094, -0.6408028602600098, -0.6153803467750549, -0.5899577736854553, -0.5645352602005005, -0.5391126871109009, -0.513690173625946, -0.4882676303386688, -0.4628450870513916, -0.437422513961792, -0.41200000047683716, -0.38657742738723755, -0.36115485429763794, -0.3357323110103607, -0.3103097677230835, -0.2848872244358063, -0.25946468114852905, -0.23404212296009064, -0.20861957967281342, -0.1831970363855362, -0.15777450799942017, -0.13235196471214294, -0.10692942142486572, -0.0815068706870079, -0.05608432739973068, -0.030661776661872864, -0.005239233374595642, 0.02018330991268158, 0.0456058531999588, 0.07102839648723602, 0.09645093977451324, 0.12187349051237106, 0.14729604125022888, 0.1727185845375061, 0.19814112782478333, 0.22356367111206055, 0.24898621439933777, 0.274408757686615, 0.2998313009738922, 0.32525384426116943, 0.35067638754844666, 0.3760989308357239, 0.4015215039253235, 0.4269440174102783, 0.45236659049987793, 0.47778913378715515, 0.5032116770744324, 0.528634250164032, 0.5540567636489868, 0.5794793367385864, 0.6049018502235413, 0.6303244233131409, 0.6557469367980957]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 14.0, 17.0, 22.0, 51.0, 80.0, 134.0, 245.0, 449.0, 790.0, 1552.0, 3027.0, 6902.0, 18000.0, 58377.0, 258825.0, 503134.0, 139245.0, 35492.0, 12270.0, 4920.0, 2359.0, 1141.0, 647.0, 349.0, 209.0, 124.0, 65.0, 37.0, 21.0, 15.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382568359375, -0.3685569763183594, -0.35454559326171875, -0.3405342102050781, -0.3265228271484375, -0.3125114440917969, -0.29850006103515625, -0.2844886779785156, -0.270477294921875, -0.2564659118652344, -0.24245452880859375, -0.22844314575195312, -0.2144317626953125, -0.20042037963867188, -0.18640899658203125, -0.17239761352539062, -0.15838623046875, -0.14437484741210938, -0.13036346435546875, -0.11635208129882812, -0.1023406982421875, -0.08832931518554688, -0.07431793212890625, -0.060306549072265625, -0.046295166015625, -0.032283782958984375, -0.01827239990234375, -0.004261016845703125, 0.0097503662109375, 0.023761749267578125, 0.03777313232421875, 0.051784515380859375, 0.0657958984375, 0.07980728149414062, 0.09381866455078125, 0.10783004760742188, 0.1218414306640625, 0.13585281372070312, 0.14986419677734375, 0.16387557983398438, 0.177886962890625, 0.19189834594726562, 0.20590972900390625, 0.21992111206054688, 0.2339324951171875, 0.24794387817382812, 0.26195526123046875, 0.2759666442871094, 0.28997802734375, 0.3039894104003906, 0.31800079345703125, 0.3320121765136719, 0.3460235595703125, 0.3600349426269531, 0.37404632568359375, 0.3880577087402344, 0.402069091796875, 0.4160804748535156, 0.43009185791015625, 0.4441032409667969, 0.4581146240234375, 0.4721260070800781, 0.48613739013671875, 0.5001487731933594, 0.51416015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 14.0, 18.0, 24.0, 23.0, 41.0, 46.0, 64.0, 64.0, 81.0, 83.0, 81.0, 81.0, 85.0, 60.0, 51.0, 27.0, 36.0, 19.0, 22.0, 13.0, 11.0, 6.0, 5.0, 5.0, 7.0, 0.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10345458984375, -0.10033321380615234, -0.09721183776855469, -0.09409046173095703, -0.09096908569335938, -0.08784770965576172, -0.08472633361816406, -0.0816049575805664, -0.07848358154296875, -0.0753622055053711, -0.07224082946777344, -0.06911945343017578, -0.06599807739257812, -0.06287670135498047, -0.05975532531738281, -0.056633949279785156, -0.0535125732421875, -0.050391197204589844, -0.04726982116699219, -0.04414844512939453, -0.041027069091796875, -0.03790569305419922, -0.03478431701660156, -0.031662940979003906, -0.02854156494140625, -0.025420188903808594, -0.022298812866210938, -0.01917743682861328, -0.016056060791015625, -0.012934684753417969, -0.009813308715820312, -0.006691932678222656, -0.003570556640625, -0.00044918060302734375, 0.0026721954345703125, 0.005793571472167969, 0.008914947509765625, 0.012036323547363281, 0.015157699584960938, 0.018279075622558594, 0.02140045166015625, 0.024521827697753906, 0.027643203735351562, 0.03076457977294922, 0.033885955810546875, 0.03700733184814453, 0.04012870788574219, 0.043250083923339844, 0.0463714599609375, 0.049492835998535156, 0.05261421203613281, 0.05573558807373047, 0.058856964111328125, 0.06197834014892578, 0.06509971618652344, 0.0682210922241211, 0.07134246826171875, 0.0744638442993164, 0.07758522033691406, 0.08070659637451172, 0.08382797241210938, 0.08694934844970703, 0.09007072448730469, 0.09319210052490234, 0.0963134765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 9.0, 9.0, 17.0, 24.0, 20.0, 44.0, 63.0, 95.0, 128.0, 210.0, 358.0, 737.0, 1557.0, 3600.0, 8660.0, 23330.0, 76279.0, 315173.0, 449556.0, 115309.0, 33109.0, 11634.0, 4425.0, 1973.0, 917.0, 503.0, 292.0, 175.0, 110.0, 72.0, 42.0, 30.0, 24.0, 20.0, 13.0, 10.0, 11.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427978515625, -0.4142417907714844, -0.40050506591796875, -0.3867683410644531, -0.3730316162109375, -0.3592948913574219, -0.34555816650390625, -0.3318214416503906, -0.318084716796875, -0.3043479919433594, -0.29061126708984375, -0.2768745422363281, -0.2631378173828125, -0.24940109252929688, -0.23566436767578125, -0.22192764282226562, -0.20819091796875, -0.19445419311523438, -0.18071746826171875, -0.16698074340820312, -0.1532440185546875, -0.13950729370117188, -0.12577056884765625, -0.11203384399414062, -0.098297119140625, -0.08456039428710938, -0.07082366943359375, -0.057086944580078125, -0.0433502197265625, -0.029613494873046875, -0.01587677001953125, -0.002140045166015625, 0.0115966796875, 0.025333404541015625, 0.03907012939453125, 0.052806854248046875, 0.0665435791015625, 0.08028030395507812, 0.09401702880859375, 0.10775375366210938, 0.121490478515625, 0.13522720336914062, 0.14896392822265625, 0.16270065307617188, 0.1764373779296875, 0.19017410278320312, 0.20391082763671875, 0.21764755249023438, 0.23138427734375, 0.24512100219726562, 0.25885772705078125, 0.2725944519042969, 0.2863311767578125, 0.3000679016113281, 0.31380462646484375, 0.3275413513183594, 0.341278076171875, 0.3550148010253906, 0.36875152587890625, 0.3824882507324219, 0.3962249755859375, 0.4099617004394531, 0.42369842529296875, 0.4374351501464844, 0.451171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 8.0, 9.0, 7.0, 7.0, 16.0, 11.0, 24.0, 22.0, 26.0, 37.0, 36.0, 38.0, 63.0, 48.0, 57.0, 48.0, 58.0, 64.0, 44.0, 45.0, 43.0, 43.0, 37.0, 37.0, 36.0, 28.0, 25.0, 12.0, 15.0, 11.0, 13.0, 10.0, 5.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40771484375, -0.394805908203125, -0.38189697265625, -0.368988037109375, -0.3560791015625, -0.343170166015625, -0.33026123046875, -0.317352294921875, -0.304443359375, -0.291534423828125, -0.27862548828125, -0.265716552734375, -0.2528076171875, -0.239898681640625, -0.22698974609375, -0.214080810546875, -0.201171875, -0.188262939453125, -0.17535400390625, -0.162445068359375, -0.1495361328125, -0.136627197265625, -0.12371826171875, -0.110809326171875, -0.097900390625, -0.084991455078125, -0.07208251953125, -0.059173583984375, -0.0462646484375, -0.033355712890625, -0.02044677734375, -0.007537841796875, 0.00537109375, 0.018280029296875, 0.03118896484375, 0.044097900390625, 0.0570068359375, 0.069915771484375, 0.08282470703125, 0.095733642578125, 0.108642578125, 0.121551513671875, 0.13446044921875, 0.147369384765625, 0.1602783203125, 0.173187255859375, 0.18609619140625, 0.199005126953125, 0.2119140625, 0.224822998046875, 0.23773193359375, 0.250640869140625, 0.2635498046875, 0.276458740234375, 0.28936767578125, 0.302276611328125, 0.315185546875, 0.328094482421875, 0.34100341796875, 0.353912353515625, 0.3668212890625, 0.379730224609375, 0.39263916015625, 0.405548095703125, 0.41845703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 4.0, 4.0, 14.0, 28.0, 26.0, 41.0, 67.0, 98.0, 148.0, 268.0, 484.0, 1047.0, 2314.0, 5769.0, 17366.0, 63315.0, 256705.0, 471336.0, 168020.0, 41487.0, 12022.0, 4289.0, 1845.0, 830.0, 431.0, 211.0, 119.0, 78.0, 58.0, 41.0, 23.0, 18.0, 12.0, 7.0, 5.0, 7.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138671875, -0.13377952575683594, -0.12888717651367188, -0.12399482727050781, -0.11910247802734375, -0.11421012878417969, -0.10931777954101562, -0.10442543029785156, -0.0995330810546875, -0.09464073181152344, -0.08974838256835938, -0.08485603332519531, -0.07996368408203125, -0.07507133483886719, -0.07017898559570312, -0.06528663635253906, -0.060394287109375, -0.05550193786621094, -0.050609588623046875, -0.04571723937988281, -0.04082489013671875, -0.03593254089355469, -0.031040191650390625, -0.026147842407226562, -0.0212554931640625, -0.016363143920898438, -0.011470794677734375, -0.0065784454345703125, -0.00168609619140625, 0.0032062530517578125, 0.008098602294921875, 0.012990951538085938, 0.01788330078125, 0.022775650024414062, 0.027667999267578125, 0.03256034851074219, 0.03745269775390625, 0.04234504699707031, 0.047237396240234375, 0.05212974548339844, 0.0570220947265625, 0.06191444396972656, 0.06680679321289062, 0.07169914245605469, 0.07659149169921875, 0.08148384094238281, 0.08637619018554688, 0.09126853942871094, 0.096160888671875, 0.10105323791503906, 0.10594558715820312, 0.11083793640136719, 0.11573028564453125, 0.12062263488769531, 0.12551498413085938, 0.13040733337402344, 0.1352996826171875, 0.14019203186035156, 0.14508438110351562, 0.1499767303466797, 0.15486907958984375, 0.1597614288330078, 0.16465377807617188, 0.16954612731933594, 0.1744384765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 8.0, 14.0, 13.0, 14.0, 18.0, 26.0, 48.0, 49.0, 82.0, 98.0, 98.0, 94.0, 102.0, 85.0, 50.0, 55.0, 29.0, 26.0, 24.0, 12.0, 11.0, 12.0, 5.0, 4.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.965066909790039e-05, -4.799105226993561e-05, -4.6331435441970825e-05, -4.467181861400604e-05, -4.301220178604126e-05, -4.135258495807648e-05, -3.9692968130111694e-05, -3.803335130214691e-05, -3.637373447418213e-05, -3.4714117646217346e-05, -3.3054500818252563e-05, -3.139488399028778e-05, -2.9735267162322998e-05, -2.8075650334358215e-05, -2.6416033506393433e-05, -2.475641667842865e-05, -2.3096799850463867e-05, -2.1437183022499084e-05, -1.9777566194534302e-05, -1.811794936656952e-05, -1.6458332538604736e-05, -1.4798715710639954e-05, -1.3139098882675171e-05, -1.1479482054710388e-05, -9.819865226745605e-06, -8.160248398780823e-06, -6.50063157081604e-06, -4.841014742851257e-06, -3.1813979148864746e-06, -1.521781086921692e-06, 1.3783574104309082e-07, 1.7974525690078735e-06, 3.4570693969726562e-06, 5.116686224937439e-06, 6.776303052902222e-06, 8.435919880867004e-06, 1.0095536708831787e-05, 1.175515353679657e-05, 1.3414770364761353e-05, 1.5074387192726135e-05, 1.6734004020690918e-05, 1.83936208486557e-05, 2.0053237676620483e-05, 2.1712854504585266e-05, 2.337247133255005e-05, 2.503208816051483e-05, 2.6691704988479614e-05, 2.8351321816444397e-05, 3.001093864440918e-05, 3.167055547237396e-05, 3.3330172300338745e-05, 3.498978912830353e-05, 3.664940595626831e-05, 3.830902278423309e-05, 3.9968639612197876e-05, 4.162825644016266e-05, 4.328787326812744e-05, 4.4947490096092224e-05, 4.660710692405701e-05, 4.826672375202179e-05, 4.992634057998657e-05, 5.1585957407951355e-05, 5.324557423591614e-05, 5.490519106388092e-05, 5.65648078918457e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 11.0, 7.0, 12.0, 9.0, 15.0, 22.0, 26.0, 52.0, 57.0, 80.0, 152.0, 236.0, 415.0, 732.0, 1346.0, 2728.0, 6042.0, 14420.0, 41372.0, 148334.0, 443749.0, 274233.0, 74155.0, 23382.0, 8828.0, 3932.0, 1887.0, 931.0, 505.0, 325.0, 193.0, 132.0, 78.0, 43.0, 43.0, 30.0, 17.0, 8.0, 9.0, 2.0, 1.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1812744140625, -0.176055908203125, -0.17083740234375, -0.165618896484375, -0.160400390625, -0.155181884765625, -0.14996337890625, -0.144744873046875, -0.1395263671875, -0.134307861328125, -0.12908935546875, -0.123870849609375, -0.11865234375, -0.113433837890625, -0.10821533203125, -0.102996826171875, -0.0977783203125, -0.092559814453125, -0.08734130859375, -0.082122802734375, -0.076904296875, -0.071685791015625, -0.06646728515625, -0.061248779296875, -0.0560302734375, -0.050811767578125, -0.04559326171875, -0.040374755859375, -0.03515625, -0.029937744140625, -0.02471923828125, -0.019500732421875, -0.0142822265625, -0.009063720703125, -0.00384521484375, 0.001373291015625, 0.006591796875, 0.011810302734375, 0.01702880859375, 0.022247314453125, 0.0274658203125, 0.032684326171875, 0.03790283203125, 0.043121337890625, 0.04833984375, 0.053558349609375, 0.05877685546875, 0.063995361328125, 0.0692138671875, 0.074432373046875, 0.07965087890625, 0.084869384765625, 0.090087890625, 0.095306396484375, 0.10052490234375, 0.105743408203125, 0.1109619140625, 0.116180419921875, 0.12139892578125, 0.126617431640625, 0.1318359375, 0.137054443359375, 0.14227294921875, 0.147491455078125, 0.1527099609375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 8.0, 7.0, 15.0, 16.0, 21.0, 17.0, 32.0, 31.0, 45.0, 71.0, 79.0, 68.0, 90.0, 91.0, 70.0, 73.0, 53.0, 55.0, 34.0, 26.0, 23.0, 25.0, 14.0, 11.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1541748046875, -0.14990615844726562, -0.14563751220703125, -0.14136886596679688, -0.1371002197265625, -0.13283157348632812, -0.12856292724609375, -0.12429428100585938, -0.120025634765625, -0.11575698852539062, -0.11148834228515625, -0.10721969604492188, -0.1029510498046875, -0.09868240356445312, -0.09441375732421875, -0.09014511108398438, -0.08587646484375, -0.08160781860351562, -0.07733917236328125, -0.07307052612304688, -0.0688018798828125, -0.06453323364257812, -0.06026458740234375, -0.055995941162109375, -0.051727294921875, -0.047458648681640625, -0.04319000244140625, -0.038921356201171875, -0.0346527099609375, -0.030384063720703125, -0.02611541748046875, -0.021846771240234375, -0.017578125, -0.013309478759765625, -0.00904083251953125, -0.004772186279296875, -0.0005035400390625, 0.003765106201171875, 0.00803375244140625, 0.012302398681640625, 0.016571044921875, 0.020839691162109375, 0.02510833740234375, 0.029376983642578125, 0.0336456298828125, 0.037914276123046875, 0.04218292236328125, 0.046451568603515625, 0.05072021484375, 0.054988861083984375, 0.05925750732421875, 0.06352615356445312, 0.0677947998046875, 0.07206344604492188, 0.07633209228515625, 0.08060073852539062, 0.084869384765625, 0.08913803100585938, 0.09340667724609375, 0.09767532348632812, 0.1019439697265625, 0.10621261596679688, 0.11048126220703125, 0.11474990844726562, 0.1190185546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 15.0, 17.0, 19.0, 27.0, 46.0, 66.0, 91.0, 121.0, 139.0, 119.0, 107.0, 70.0, 45.0, 39.0, 21.0, 13.0, 12.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6015870571136475, -1.5391391515731812, -1.4766911268234253, -1.414243221282959, -1.3517951965332031, -1.2893472909927368, -1.2268993854522705, -1.1644513607025146, -1.1020034551620483, -1.039555549621582, -0.9771075248718262, -0.9146596193313599, -0.8522116541862488, -0.7897636890411377, -0.7273157238960266, -0.6648677587509155, -0.6024197936058044, -0.5399718284606934, -0.47752389311790466, -0.4150759279727936, -0.3526279926300049, -0.2901800274848938, -0.22773206233978271, -0.16528412699699402, -0.10283616185188293, -0.040388207882642746, 0.022059746086597443, 0.08450770378112793, 0.14695565402507782, 0.2094036042690277, 0.2718515694141388, 0.3342995047569275, 0.3967474699020386, 0.45919543504714966, 0.5216434001922607, 0.584091305732727, 0.6465392708778381, 0.7089872360229492, 0.7714352011680603, 0.8338831663131714, 0.8963310718536377, 0.9587790369987488, 1.0212270021438599, 1.0836749076843262, 1.146122932434082, 1.2085708379745483, 1.2710187435150146, 1.3334667682647705, 1.3959147930145264, 1.4583626985549927, 1.5208107233047485, 1.5832586288452148, 1.6457066535949707, 1.708154559135437, 1.7706024646759033, 1.8330504894256592, 1.8954983949661255, 1.9579463005065918, 2.0203943252563477, 2.0828423500061035, 2.1452901363372803, 2.207738161087036, 2.270186185836792, 2.3326339721679688, 2.3950819969177246]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 9.0, 10.0, 11.0, 12.0, 18.0, 15.0, 26.0, 26.0, 26.0, 28.0, 41.0, 51.0, 35.0, 47.0, 46.0, 49.0, 47.0, 52.0, 49.0, 35.0, 46.0, 48.0, 34.0, 38.0, 39.0, 28.0, 17.0, 19.0, 17.0, 14.0, 12.0, 8.0, 7.0, 7.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6978859901428223, -1.6366530656814575, -1.5754202604293823, -1.5141873359680176, -1.4529544115066528, -1.391721487045288, -1.330488681793213, -1.2692557573318481, -1.2080228328704834, -1.1467899084091187, -1.0855571031570435, -1.0243241786956787, -0.963091254234314, -0.901858389377594, -0.840625524520874, -0.7793926000595093, -0.7181597948074341, -0.6569269299507141, -0.5956940054893494, -0.5344611406326294, -0.47322824597358704, -0.4119953513145447, -0.3507624864578247, -0.28952959179878235, -0.22829669713974, -0.16706380248069763, -0.10583092272281647, -0.0445980429649353, 0.016634851694107056, 0.07786774635314941, 0.13910061120986938, 0.20033350586891174, 0.2615664005279541, 0.32279929518699646, 0.3840321898460388, 0.4452650547027588, 0.5064979791641235, 0.5677308440208435, 0.6289637088775635, 0.6901966333389282, 0.7514294981956482, 0.8126623630523682, 0.8738952875137329, 0.9351281523704529, 0.9963610172271729, 1.0575939416885376, 1.1188268661499023, 1.1800596714019775, 1.2412925958633423, 1.302525520324707, 1.3637583255767822, 1.424991250038147, 1.4862241744995117, 1.547456979751587, 1.6086899042129517, 1.6699228286743164, 1.7311556339263916, 1.7923885583877563, 1.8536213636398315, 1.9148542881011963, 1.976087212562561, 2.037320137023926, 2.098552942276001, 2.159785747528076, 2.2210187911987305]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 7.0, 11.0, 11.0, 12.0, 10.0, 21.0, 31.0, 39.0, 55.0, 66.0, 123.0, 223.0, 367.0, 814.0, 2132.0, 7606.0, 46549.0, 3950359.0, 164681.0, 14809.0, 3733.0, 1368.0, 573.0, 290.0, 153.0, 81.0, 52.0, 38.0, 23.0, 11.0, 5.0, 9.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.47265625, -1.4355621337890625, -1.398468017578125, -1.3613739013671875, -1.32427978515625, -1.2871856689453125, -1.250091552734375, -1.2129974365234375, -1.1759033203125, -1.1388092041015625, -1.101715087890625, -1.0646209716796875, -1.02752685546875, -0.9904327392578125, -0.953338623046875, -0.9162445068359375, -0.879150390625, -0.8420562744140625, -0.804962158203125, -0.7678680419921875, -0.73077392578125, -0.6936798095703125, -0.656585693359375, -0.6194915771484375, -0.5823974609375, -0.5453033447265625, -0.508209228515625, -0.4711151123046875, -0.43402099609375, -0.3969268798828125, -0.359832763671875, -0.3227386474609375, -0.28564453125, -0.2485504150390625, -0.211456298828125, -0.1743621826171875, -0.13726806640625, -0.1001739501953125, -0.063079833984375, -0.0259857177734375, 0.0111083984375, 0.0482025146484375, 0.085296630859375, 0.1223907470703125, 0.15948486328125, 0.1965789794921875, 0.233673095703125, 0.2707672119140625, 0.307861328125, 0.3449554443359375, 0.382049560546875, 0.4191436767578125, 0.45623779296875, 0.4933319091796875, 0.530426025390625, 0.5675201416015625, 0.6046142578125, 0.6417083740234375, 0.678802490234375, 0.7158966064453125, 0.75299072265625, 0.7900848388671875, 0.827178955078125, 0.8642730712890625, 0.9013671875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 10.0, 5.0, 11.0, 19.0, 28.0, 38.0, 51.0, 46.0, 71.0, 84.0, 90.0, 85.0, 84.0, 66.0, 60.0, 55.0, 51.0, 33.0, 27.0, 33.0, 8.0, 3.0, 8.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10772705078125, -0.10431098937988281, -0.10089492797851562, -0.09747886657714844, -0.09406280517578125, -0.09064674377441406, -0.08723068237304688, -0.08381462097167969, -0.0803985595703125, -0.07698249816894531, -0.07356643676757812, -0.07015037536621094, -0.06673431396484375, -0.06331825256347656, -0.059902191162109375, -0.05648612976074219, -0.053070068359375, -0.04965400695800781, -0.046237945556640625, -0.04282188415527344, -0.03940582275390625, -0.03598976135253906, -0.032573699951171875, -0.029157638549804688, -0.0257415771484375, -0.022325515747070312, -0.018909454345703125, -0.015493392944335938, -0.01207733154296875, -0.008661270141601562, -0.005245208740234375, -0.0018291473388671875, 0.0015869140625, 0.0050029754638671875, 0.008419036865234375, 0.011835098266601562, 0.01525115966796875, 0.018667221069335938, 0.022083282470703125, 0.025499343872070312, 0.0289154052734375, 0.03233146667480469, 0.035747528076171875, 0.03916358947753906, 0.04257965087890625, 0.04599571228027344, 0.049411773681640625, 0.05282783508300781, 0.056243896484375, 0.05965995788574219, 0.06307601928710938, 0.06649208068847656, 0.06990814208984375, 0.07332420349121094, 0.07674026489257812, 0.08015632629394531, 0.0835723876953125, 0.08698844909667969, 0.09040451049804688, 0.09382057189941406, 0.09723663330078125, 0.10065269470214844, 0.10406875610351562, 0.10748481750488281, 0.11090087890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 8.0, 8.0, 9.0, 11.0, 8.0, 13.0, 14.0, 20.0, 25.0, 48.0, 49.0, 87.0, 138.0, 252.0, 444.0, 1035.0, 2759.0, 10218.0, 64897.0, 3828302.0, 258250.0, 20181.0, 4577.0, 1523.0, 600.0, 292.0, 162.0, 98.0, 74.0, 38.0, 33.0, 19.0, 22.0, 12.0, 14.0, 13.0, 6.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.0107421875, -0.9788665771484375, -0.946990966796875, -0.9151153564453125, -0.88323974609375, -0.8513641357421875, -0.819488525390625, -0.7876129150390625, -0.7557373046875, -0.7238616943359375, -0.691986083984375, -0.6601104736328125, -0.62823486328125, -0.5963592529296875, -0.564483642578125, -0.5326080322265625, -0.500732421875, -0.4688568115234375, -0.436981201171875, -0.4051055908203125, -0.37322998046875, -0.3413543701171875, -0.309478759765625, -0.2776031494140625, -0.2457275390625, -0.2138519287109375, -0.181976318359375, -0.1501007080078125, -0.11822509765625, -0.0863494873046875, -0.054473876953125, -0.0225982666015625, 0.00927734375, 0.0411529541015625, 0.073028564453125, 0.1049041748046875, 0.13677978515625, 0.1686553955078125, 0.200531005859375, 0.2324066162109375, 0.2642822265625, 0.2961578369140625, 0.328033447265625, 0.3599090576171875, 0.39178466796875, 0.4236602783203125, 0.455535888671875, 0.4874114990234375, 0.519287109375, 0.5511627197265625, 0.583038330078125, 0.6149139404296875, 0.64678955078125, 0.6786651611328125, 0.710540771484375, 0.7424163818359375, 0.7742919921875, 0.8061676025390625, 0.838043212890625, 0.8699188232421875, 0.90179443359375, 0.9336700439453125, 0.965545654296875, 0.9974212646484375, 1.029296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 9.0, 11.0, 9.0, 20.0, 26.0, 51.0, 60.0, 115.0, 207.0, 526.0, 1603.0, 767.0, 286.0, 119.0, 77.0, 50.0, 22.0, 17.0, 20.0, 12.0, 18.0, 10.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1904296875, -0.18563461303710938, -0.18083953857421875, -0.17604446411132812, -0.1712493896484375, -0.16645431518554688, -0.16165924072265625, -0.15686416625976562, -0.152069091796875, -0.14727401733398438, -0.14247894287109375, -0.13768386840820312, -0.1328887939453125, -0.12809371948242188, -0.12329864501953125, -0.11850357055664062, -0.11370849609375, -0.10891342163085938, -0.10411834716796875, -0.09932327270507812, -0.0945281982421875, -0.08973312377929688, -0.08493804931640625, -0.08014297485351562, -0.075347900390625, -0.07055282592773438, -0.06575775146484375, -0.060962677001953125, -0.0561676025390625, -0.051372528076171875, -0.04657745361328125, -0.041782379150390625, -0.0369873046875, -0.032192230224609375, -0.02739715576171875, -0.022602081298828125, -0.0178070068359375, -0.013011932373046875, -0.00821685791015625, -0.003421783447265625, 0.001373291015625, 0.006168365478515625, 0.01096343994140625, 0.015758514404296875, 0.0205535888671875, 0.025348663330078125, 0.03014373779296875, 0.034938812255859375, 0.03973388671875, 0.044528961181640625, 0.04932403564453125, 0.054119110107421875, 0.0589141845703125, 0.06370925903320312, 0.06850433349609375, 0.07329940795898438, 0.078094482421875, 0.08288955688476562, 0.08768463134765625, 0.09247970581054688, 0.0972747802734375, 0.10206985473632812, 0.10686492919921875, 0.11166000366210938, 0.116455078125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 17.0, 17.0, 37.0, 78.0, 137.0, 223.0, 195.0, 133.0, 73.0, 37.0, 22.0, 13.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5720391273498535, -1.528545618057251, -1.485052227973938, -1.4415587186813354, -1.398065209388733, -1.35457181930542, -1.3110783100128174, -1.2675848007202148, -1.2240912914276123, -1.1805977821350098, -1.1371043920516968, -1.0936108827590942, -1.0501173734664917, -1.0066239833831787, -0.9631304740905762, -0.9196369647979736, -0.8761435747146606, -0.8326501250267029, -0.7891566157341003, -0.7456631660461426, -0.70216965675354, -0.6586762070655823, -0.6151827573776245, -0.571689248085022, -0.5281957983970642, -0.48470231890678406, -0.4412088394165039, -0.39771538972854614, -0.354221910238266, -0.31072843074798584, -0.2672349810600281, -0.22374150156974792, -0.18024790287017822, -0.13675442337989807, -0.09326095879077911, -0.049767494201660156, -0.006274014711380005, 0.037219464778900146, 0.08071291446685791, 0.12420639395713806, 0.1676998734474182, 0.21119335293769836, 0.2546868324279785, 0.2981802821159363, 0.34167376160621643, 0.3851672410964966, 0.42866069078445435, 0.4721541702747345, 0.5156476497650146, 0.5591410994529724, 0.602634608745575, 0.6461280584335327, 0.6896215677261353, 0.733115017414093, 0.7766084671020508, 0.8201019763946533, 0.8635954260826111, 0.9070888757705688, 0.9505823850631714, 0.9940758347511292, 1.037569284439087, 1.0810627937316895, 1.124556303024292, 1.168049693107605, 1.2115432024002075]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 9.0, 7.0, 11.0, 15.0, 15.0, 13.0, 18.0, 28.0, 23.0, 30.0, 37.0, 30.0, 42.0, 54.0, 51.0, 46.0, 48.0, 50.0, 37.0, 50.0, 52.0, 40.0, 48.0, 49.0, 31.0, 25.0, 25.0, 21.0, 24.0, 16.0, 13.0, 15.0, 10.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5638051629066467, -0.5481237173080444, -0.5324422121047974, -0.5167607665061951, -0.5010793209075928, -0.4853978455066681, -0.4697163701057434, -0.4540349245071411, -0.43835344910621643, -0.42267197370529175, -0.40699052810668945, -0.39130905270576477, -0.3756275773048401, -0.3599461317062378, -0.3442646563053131, -0.3285831809043884, -0.31290173530578613, -0.29722025990486145, -0.28153881430625916, -0.2658573389053345, -0.2501758933067322, -0.2344944179058075, -0.2188129425048828, -0.20313148200511932, -0.18745002150535583, -0.17176856100559235, -0.15608710050582886, -0.14040562510490417, -0.12472416460514069, -0.1090427041053772, -0.09336123615503311, -0.07767976820468903, -0.06199830770492554, -0.04631684347987175, -0.030635379254817963, -0.014953915029764175, 0.0007275491952896118, 0.0164090096950531, 0.032090477645397186, 0.04777194559574127, 0.06345340609550476, 0.07913486659526825, 0.09481633454561234, 0.11049780249595642, 0.1261792629957199, 0.1418607234954834, 0.15754219889640808, 0.17322365939617157, 0.18890511989593506, 0.20458658039569855, 0.22026804089546204, 0.23594951629638672, 0.251630961894989, 0.2673124372959137, 0.2829939126968384, 0.2986753582954407, 0.31435683369636536, 0.33003830909729004, 0.34571975469589233, 0.361401230096817, 0.3770827054977417, 0.392764151096344, 0.4084456264972687, 0.42412710189819336, 0.43980854749679565]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 10.0, 22.0, 31.0, 39.0, 81.0, 151.0, 259.0, 440.0, 868.0, 1834.0, 4032.0, 10087.0, 28560.0, 101191.0, 420775.0, 358081.0, 82217.0, 23934.0, 8784.0, 3705.0, 1661.0, 854.0, 435.0, 217.0, 112.0, 74.0, 39.0, 23.0, 17.0, 11.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4326171875, -0.4186286926269531, -0.40464019775390625, -0.3906517028808594, -0.3766632080078125, -0.3626747131347656, -0.34868621826171875, -0.3346977233886719, -0.320709228515625, -0.3067207336425781, -0.29273223876953125, -0.2787437438964844, -0.2647552490234375, -0.2507667541503906, -0.23677825927734375, -0.22278976440429688, -0.20880126953125, -0.19481277465820312, -0.18082427978515625, -0.16683578491210938, -0.1528472900390625, -0.13885879516601562, -0.12487030029296875, -0.11088180541992188, -0.096893310546875, -0.08290481567382812, -0.06891632080078125, -0.054927825927734375, -0.0409393310546875, -0.026950836181640625, -0.01296234130859375, 0.001026153564453125, 0.0150146484375, 0.029003143310546875, 0.04299163818359375, 0.056980133056640625, 0.0709686279296875, 0.08495712280273438, 0.09894561767578125, 0.11293411254882812, 0.126922607421875, 0.14091110229492188, 0.15489959716796875, 0.16888809204101562, 0.1828765869140625, 0.19686508178710938, 0.21085357666015625, 0.22484207153320312, 0.23883056640625, 0.2528190612792969, 0.26680755615234375, 0.2807960510253906, 0.2947845458984375, 0.3087730407714844, 0.32276153564453125, 0.3367500305175781, 0.350738525390625, 0.3647270202636719, 0.37871551513671875, 0.3927040100097656, 0.4066925048828125, 0.4206809997558594, 0.43466949462890625, 0.4486579895019531, 0.462646484375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 11.0, 10.0, 15.0, 23.0, 21.0, 46.0, 34.0, 53.0, 74.0, 63.0, 92.0, 85.0, 78.0, 74.0, 68.0, 54.0, 43.0, 43.0, 33.0, 15.0, 14.0, 6.0, 5.0, 15.0, 0.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12408447265625, -0.12076854705810547, -0.11745262145996094, -0.1141366958618164, -0.11082077026367188, -0.10750484466552734, -0.10418891906738281, -0.10087299346923828, -0.09755706787109375, -0.09424114227294922, -0.09092521667480469, -0.08760929107666016, -0.08429336547851562, -0.0809774398803711, -0.07766151428222656, -0.07434558868408203, -0.0710296630859375, -0.06771373748779297, -0.06439781188964844, -0.061081886291503906, -0.057765960693359375, -0.054450035095214844, -0.05113410949707031, -0.04781818389892578, -0.04450225830078125, -0.04118633270263672, -0.03787040710449219, -0.034554481506347656, -0.031238555908203125, -0.027922630310058594, -0.024606704711914062, -0.02129077911376953, -0.017974853515625, -0.014658927917480469, -0.011343002319335938, -0.008027076721191406, -0.004711151123046875, -0.0013952255249023438, 0.0019207000732421875, 0.005236625671386719, 0.00855255126953125, 0.011868476867675781, 0.015184402465820312, 0.018500328063964844, 0.021816253662109375, 0.025132179260253906, 0.028448104858398438, 0.03176403045654297, 0.0350799560546875, 0.03839588165283203, 0.04171180725097656, 0.045027732849121094, 0.048343658447265625, 0.051659584045410156, 0.05497550964355469, 0.05829143524169922, 0.06160736083984375, 0.06492328643798828, 0.06823921203613281, 0.07155513763427734, 0.07487106323242188, 0.0781869888305664, 0.08150291442871094, 0.08481884002685547, 0.088134765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 20.0, 32.0, 31.0, 50.0, 88.0, 126.0, 245.0, 461.0, 1064.0, 3003.0, 9941.0, 40349.0, 233632.0, 599148.0, 125132.0, 25102.0, 6318.0, 2060.0, 814.0, 379.0, 215.0, 107.0, 84.0, 46.0, 32.0, 17.0, 17.0, 9.0, 7.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5185546875, -0.5020065307617188, -0.4854583740234375, -0.46891021728515625, -0.452362060546875, -0.43581390380859375, -0.4192657470703125, -0.40271759033203125, -0.38616943359375, -0.36962127685546875, -0.3530731201171875, -0.33652496337890625, -0.319976806640625, -0.30342864990234375, -0.2868804931640625, -0.27033233642578125, -0.2537841796875, -0.23723602294921875, -0.2206878662109375, -0.20413970947265625, -0.187591552734375, -0.17104339599609375, -0.1544952392578125, -0.13794708251953125, -0.12139892578125, -0.10485076904296875, -0.0883026123046875, -0.07175445556640625, -0.055206298828125, -0.03865814208984375, -0.0221099853515625, -0.00556182861328125, 0.010986328125, 0.02753448486328125, 0.0440826416015625, 0.06063079833984375, 0.077178955078125, 0.09372711181640625, 0.1102752685546875, 0.12682342529296875, 0.14337158203125, 0.15991973876953125, 0.1764678955078125, 0.19301605224609375, 0.209564208984375, 0.22611236572265625, 0.2426605224609375, 0.25920867919921875, 0.2757568359375, 0.29230499267578125, 0.3088531494140625, 0.32540130615234375, 0.341949462890625, 0.35849761962890625, 0.3750457763671875, 0.39159393310546875, 0.40814208984375, 0.42469024658203125, 0.4412384033203125, 0.45778656005859375, 0.474334716796875, 0.49088287353515625, 0.5074310302734375, 0.5239791870117188, 0.54052734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 9.0, 7.0, 6.0, 10.0, 16.0, 20.0, 22.0, 19.0, 21.0, 37.0, 33.0, 35.0, 42.0, 35.0, 40.0, 38.0, 46.0, 40.0, 40.0, 42.0, 43.0, 36.0, 30.0, 40.0, 36.0, 29.0, 33.0, 24.0, 20.0, 20.0, 13.0, 19.0, 9.0, 15.0, 10.0, 9.0, 10.0, 5.0, 8.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.302734375, -0.2935600280761719, -0.28438568115234375, -0.2752113342285156, -0.2660369873046875, -0.2568626403808594, -0.24768829345703125, -0.23851394653320312, -0.229339599609375, -0.22016525268554688, -0.21099090576171875, -0.20181655883789062, -0.1926422119140625, -0.18346786499023438, -0.17429351806640625, -0.16511917114257812, -0.15594482421875, -0.14677047729492188, -0.13759613037109375, -0.12842178344726562, -0.1192474365234375, -0.11007308959960938, -0.10089874267578125, -0.09172439575195312, -0.082550048828125, -0.07337570190429688, -0.06420135498046875, -0.055027008056640625, -0.0458526611328125, -0.036678314208984375, -0.02750396728515625, -0.018329620361328125, -0.0091552734375, 1.9073486328125e-05, 0.00919342041015625, 0.018367767333984375, 0.0275421142578125, 0.036716461181640625, 0.04589080810546875, 0.055065155029296875, 0.064239501953125, 0.07341384887695312, 0.08258819580078125, 0.09176254272460938, 0.1009368896484375, 0.11011123657226562, 0.11928558349609375, 0.12845993041992188, 0.13763427734375, 0.14680862426757812, 0.15598297119140625, 0.16515731811523438, 0.1743316650390625, 0.18350601196289062, 0.19268035888671875, 0.20185470581054688, 0.211029052734375, 0.22020339965820312, 0.22937774658203125, 0.23855209350585938, 0.2477264404296875, 0.2569007873535156, 0.26607513427734375, 0.2752494812011719, 0.284423828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 7.0, 15.0, 16.0, 22.0, 28.0, 76.0, 111.0, 209.0, 372.0, 699.0, 1447.0, 3778.0, 12051.0, 59563.0, 469761.0, 428514.0, 54250.0, 11114.0, 3544.0, 1407.0, 710.0, 378.0, 190.0, 99.0, 62.0, 36.0, 29.0, 17.0, 10.0, 11.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.19741058349609375, -0.1903533935546875, -0.18329620361328125, -0.176239013671875, -0.16918182373046875, -0.1621246337890625, -0.15506744384765625, -0.14801025390625, -0.14095306396484375, -0.1338958740234375, -0.12683868408203125, -0.119781494140625, -0.11272430419921875, -0.1056671142578125, -0.09860992431640625, -0.091552734375, -0.08449554443359375, -0.0774383544921875, -0.07038116455078125, -0.063323974609375, -0.05626678466796875, -0.0492095947265625, -0.04215240478515625, -0.03509521484375, -0.02803802490234375, -0.0209808349609375, -0.01392364501953125, -0.006866455078125, 0.00019073486328125, 0.0072479248046875, 0.01430511474609375, 0.0213623046875, 0.02841949462890625, 0.0354766845703125, 0.04253387451171875, 0.049591064453125, 0.05664825439453125, 0.0637054443359375, 0.07076263427734375, 0.07781982421875, 0.08487701416015625, 0.0919342041015625, 0.09899139404296875, 0.106048583984375, 0.11310577392578125, 0.1201629638671875, 0.12722015380859375, 0.13427734375, 0.14133453369140625, 0.1483917236328125, 0.15544891357421875, 0.162506103515625, 0.16956329345703125, 0.1766204833984375, 0.18367767333984375, 0.19073486328125, 0.19779205322265625, 0.2048492431640625, 0.21190643310546875, 0.218963623046875, 0.22602081298828125, 0.2330780029296875, 0.24013519287109375, 0.2471923828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 5.0, 8.0, 7.0, 6.0, 11.0, 19.0, 15.0, 19.0, 32.0, 35.0, 41.0, 46.0, 52.0, 44.0, 62.0, 85.0, 73.0, 85.0, 54.0, 52.0, 49.0, 44.0, 29.0, 22.0, 19.0, 17.0, 18.0, 19.0, 10.0, 5.0, 6.0, 6.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.5359134674072266e-05, -4.41940501332283e-05, -4.302896559238434e-05, -4.1863881051540375e-05, -4.069879651069641e-05, -3.953371196985245e-05, -3.8368627429008484e-05, -3.720354288816452e-05, -3.603845834732056e-05, -3.487337380647659e-05, -3.370828926563263e-05, -3.2543204724788666e-05, -3.13781201839447e-05, -3.021303564310074e-05, -2.9047951102256775e-05, -2.788286656141281e-05, -2.6717782020568848e-05, -2.5552697479724884e-05, -2.438761293888092e-05, -2.3222528398036957e-05, -2.2057443857192993e-05, -2.089235931634903e-05, -1.9727274775505066e-05, -1.8562190234661102e-05, -1.739710569381714e-05, -1.6232021152973175e-05, -1.5066936612129211e-05, -1.3901852071285248e-05, -1.2736767530441284e-05, -1.157168298959732e-05, -1.0406598448753357e-05, -9.241513907909393e-06, -8.07642936706543e-06, -6.911344826221466e-06, -5.7462602853775024e-06, -4.581175744533539e-06, -3.416091203689575e-06, -2.2510066628456116e-06, -1.085922122001648e-06, 7.916241884231567e-08, 1.2442469596862793e-06, 2.409331500530243e-06, 3.5744160413742065e-06, 4.73950058221817e-06, 5.904585123062134e-06, 7.069669663906097e-06, 8.234754204750061e-06, 9.399838745594025e-06, 1.0564923286437988e-05, 1.1730007827281952e-05, 1.2895092368125916e-05, 1.4060176908969879e-05, 1.5225261449813843e-05, 1.6390345990657806e-05, 1.755543053150177e-05, 1.8720515072345734e-05, 1.9885599613189697e-05, 2.105068415403366e-05, 2.2215768694877625e-05, 2.3380853235721588e-05, 2.4545937776565552e-05, 2.5711022317409515e-05, 2.687610685825348e-05, 2.8041191399097443e-05, 2.9206275939941406e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 7.0, 12.0, 13.0, 9.0, 20.0, 45.0, 49.0, 84.0, 130.0, 207.0, 294.0, 497.0, 794.0, 1472.0, 2595.0, 5514.0, 12818.0, 35806.0, 132079.0, 442558.0, 297874.0, 74892.0, 22809.0, 8882.0, 4031.0, 2102.0, 1111.0, 703.0, 402.0, 224.0, 182.0, 99.0, 64.0, 53.0, 31.0, 28.0, 16.0, 15.0, 6.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1754150390625, -0.17037391662597656, -0.16533279418945312, -0.1602916717529297, -0.15525054931640625, -0.1502094268798828, -0.14516830444335938, -0.14012718200683594, -0.1350860595703125, -0.13004493713378906, -0.12500381469726562, -0.11996269226074219, -0.11492156982421875, -0.10988044738769531, -0.10483932495117188, -0.09979820251464844, -0.094757080078125, -0.08971595764160156, -0.08467483520507812, -0.07963371276855469, -0.07459259033203125, -0.06955146789550781, -0.06451034545898438, -0.05946922302246094, -0.0544281005859375, -0.04938697814941406, -0.044345855712890625, -0.03930473327636719, -0.03426361083984375, -0.029222488403320312, -0.024181365966796875, -0.019140243530273438, -0.01409912109375, -0.009057998657226562, -0.004016876220703125, 0.0010242462158203125, 0.00606536865234375, 0.011106491088867188, 0.016147613525390625, 0.021188735961914062, 0.0262298583984375, 0.03127098083496094, 0.036312103271484375, 0.04135322570800781, 0.04639434814453125, 0.05143547058105469, 0.056476593017578125, 0.06151771545410156, 0.066558837890625, 0.07159996032714844, 0.07664108276367188, 0.08168220520019531, 0.08672332763671875, 0.09176445007324219, 0.09680557250976562, 0.10184669494628906, 0.1068878173828125, 0.11192893981933594, 0.11697006225585938, 0.12201118469238281, 0.12705230712890625, 0.1320934295654297, 0.13713455200195312, 0.14217567443847656, 0.147216796875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 7.0, 8.0, 4.0, 16.0, 10.0, 17.0, 20.0, 35.0, 31.0, 35.0, 63.0, 79.0, 98.0, 100.0, 90.0, 83.0, 72.0, 60.0, 55.0, 31.0, 35.0, 14.0, 7.0, 9.0, 6.0, 6.0, 5.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1693115234375, -0.1647491455078125, -0.160186767578125, -0.1556243896484375, -0.15106201171875, -0.1464996337890625, -0.141937255859375, -0.1373748779296875, -0.1328125, -0.1282501220703125, -0.123687744140625, -0.1191253662109375, -0.11456298828125, -0.1100006103515625, -0.105438232421875, -0.1008758544921875, -0.0963134765625, -0.0917510986328125, -0.087188720703125, -0.0826263427734375, -0.07806396484375, -0.0735015869140625, -0.068939208984375, -0.0643768310546875, -0.059814453125, -0.0552520751953125, -0.050689697265625, -0.0461273193359375, -0.04156494140625, -0.0370025634765625, -0.032440185546875, -0.0278778076171875, -0.0233154296875, -0.0187530517578125, -0.014190673828125, -0.0096282958984375, -0.00506591796875, -0.0005035400390625, 0.004058837890625, 0.0086212158203125, 0.01318359375, 0.0177459716796875, 0.022308349609375, 0.0268707275390625, 0.03143310546875, 0.0359954833984375, 0.040557861328125, 0.0451202392578125, 0.0496826171875, 0.0542449951171875, 0.058807373046875, 0.0633697509765625, 0.06793212890625, 0.0724945068359375, 0.077056884765625, 0.0816192626953125, 0.086181640625, 0.0907440185546875, 0.095306396484375, 0.0998687744140625, 0.10443115234375, 0.1089935302734375, 0.113555908203125, 0.1181182861328125, 0.1226806640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 7.0, 19.0, 24.0, 46.0, 74.0, 161.0, 215.0, 179.0, 117.0, 70.0, 35.0, 17.0, 14.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7060390710830688, -1.6045560836791992, -1.5030732154846191, -1.4015902280807495, -1.3001073598861694, -1.1986243724822998, -1.0971415042877197, -0.9956585168838501, -0.8941755890846252, -0.7926926612854004, -0.6912097334861755, -0.5897268056869507, -0.48824384808540344, -0.3867608904838562, -0.28527796268463135, -0.1837950348854065, -0.08231210708618164, 0.01917082816362381, 0.12065376341342926, 0.2221367061138153, 0.32361963391304016, 0.4251025915145874, 0.5265855193138123, 0.6280684471130371, 0.729551374912262, 0.8310343027114868, 0.9325172305107117, 1.0340001583099365, 1.1354831457138062, 1.2369661331176758, 1.3384490013122559, 1.439931869506836, 1.5414149761199951, 1.6428979635238647, 1.7443808317184448, 1.8458638191223145, 1.9473466873168945, 2.0488295555114746, 2.150312662124634, 2.251795530319214, 2.353278398513794, 2.454761266708374, 2.556244373321533, 2.6577272415161133, 2.7592101097106934, 2.8606929779052734, 2.9621760845184326, 3.0636589527130127, 3.165142059326172, 3.266624927520752, 3.368108034133911, 3.469590902328491, 3.5710737705230713, 3.6725568771362305, 3.7740397453308105, 3.8755226135253906, 3.9770054817199707, 4.078488349914551, 4.179971218109131, 4.281454086303711, 4.382937431335449, 4.484420299530029, 4.585903167724609, 4.6873860359191895, 4.7888689041137695]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 6.0, 14.0, 13.0, 19.0, 25.0, 24.0, 34.0, 39.0, 37.0, 40.0, 53.0, 52.0, 70.0, 66.0, 77.0, 64.0, 74.0, 32.0, 43.0, 36.0, 28.0, 30.0, 35.0, 19.0, 13.0, 15.0, 12.0, 2.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1835310459136963, -2.1053805351257324, -2.0272300243377686, -1.9490795135498047, -1.8709290027618408, -1.792778491973877, -1.7146281003952026, -1.6364775896072388, -1.558327078819275, -1.480176568031311, -1.4020260572433472, -1.3238755464553833, -1.245725154876709, -1.1675746440887451, -1.0894241333007812, -1.0112736225128174, -0.9331231117248535, -0.8549726009368896, -0.7768220901489258, -0.6986716389656067, -0.6205211281776428, -0.542370617389679, -0.4642201364040375, -0.386069655418396, -0.30791914463043213, -0.22976864874362946, -0.15161815285682678, -0.07346765697002411, 0.0046828389167785645, 0.08283334970474243, 0.1609838306903839, 0.2391343116760254, 0.31728482246398926, 0.3954353332519531, 0.4735858142375946, 0.5517362952232361, 0.6298868060112, 0.7080373167991638, 0.7861877679824829, 0.8643382787704468, 0.9424887895584106, 1.0206393003463745, 1.0987898111343384, 1.1769403219223022, 1.2550907135009766, 1.3332412242889404, 1.4113917350769043, 1.4895422458648682, 1.567692756652832, 1.645843267440796, 1.7239937782287598, 1.8021442890167236, 1.8802947998046875, 1.9584453105926514, 2.0365958213806152, 2.11474609375, 2.192896842956543, 2.271047353744507, 2.3491978645324707, 2.4273483753204346, 2.5054988861083984, 2.5836493968963623, 2.661799907684326, 2.739950180053711, 2.818100690841675]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 4.0, 10.0, 12.0, 16.0, 30.0, 44.0, 68.0, 103.0, 159.0, 278.0, 574.0, 1344.0, 3678.0, 15883.0, 143525.0, 3904759.0, 104174.0, 13457.0, 3653.0, 1252.0, 591.0, 290.0, 161.0, 72.0, 56.0, 28.0, 14.0, 16.0, 11.0, 3.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0595703125, -1.02587890625, -0.9921875, -0.95849609375, -0.9248046875, -0.89111328125, -0.857421875, -0.82373046875, -0.7900390625, -0.75634765625, -0.72265625, -0.68896484375, -0.6552734375, -0.62158203125, -0.587890625, -0.55419921875, -0.5205078125, -0.48681640625, -0.453125, -0.41943359375, -0.3857421875, -0.35205078125, -0.318359375, -0.28466796875, -0.2509765625, -0.21728515625, -0.18359375, -0.14990234375, -0.1162109375, -0.08251953125, -0.048828125, -0.01513671875, 0.0185546875, 0.05224609375, 0.0859375, 0.11962890625, 0.1533203125, 0.18701171875, 0.220703125, 0.25439453125, 0.2880859375, 0.32177734375, 0.35546875, 0.38916015625, 0.4228515625, 0.45654296875, 0.490234375, 0.52392578125, 0.5576171875, 0.59130859375, 0.625, 0.65869140625, 0.6923828125, 0.72607421875, 0.759765625, 0.79345703125, 0.8271484375, 0.86083984375, 0.89453125, 0.92822265625, 0.9619140625, 0.99560546875, 1.029296875, 1.06298828125, 1.0966796875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 4.0, 5.0, 7.0, 15.0, 16.0, 35.0, 30.0, 42.0, 51.0, 84.0, 77.0, 79.0, 78.0, 79.0, 70.0, 69.0, 61.0, 39.0, 36.0, 25.0, 26.0, 14.0, 16.0, 6.0, 5.0, 4.0, 7.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1217041015625, -0.11836814880371094, -0.11503219604492188, -0.11169624328613281, -0.10836029052734375, -0.10502433776855469, -0.10168838500976562, -0.09835243225097656, -0.0950164794921875, -0.09168052673339844, -0.08834457397460938, -0.08500862121582031, -0.08167266845703125, -0.07833671569824219, -0.07500076293945312, -0.07166481018066406, -0.068328857421875, -0.06499290466308594, -0.061656951904296875, -0.05832099914550781, -0.05498504638671875, -0.05164909362792969, -0.048313140869140625, -0.04497718811035156, -0.0416412353515625, -0.03830528259277344, -0.034969329833984375, -0.03163337707519531, -0.02829742431640625, -0.024961471557617188, -0.021625518798828125, -0.018289566040039062, -0.01495361328125, -0.011617660522460938, -0.008281707763671875, -0.0049457550048828125, -0.00160980224609375, 0.0017261505126953125, 0.005062103271484375, 0.008398056030273438, 0.0117340087890625, 0.015069961547851562, 0.018405914306640625, 0.021741867065429688, 0.02507781982421875, 0.028413772583007812, 0.031749725341796875, 0.03508567810058594, 0.038421630859375, 0.04175758361816406, 0.045093536376953125, 0.04842948913574219, 0.05176544189453125, 0.05510139465332031, 0.058437347412109375, 0.06177330017089844, 0.0651092529296875, 0.06844520568847656, 0.07178115844726562, 0.07511711120605469, 0.07845306396484375, 0.08178901672363281, 0.08512496948242188, 0.08846092224121094, 0.091796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 8.0, 7.0, 19.0, 26.0, 31.0, 52.0, 84.0, 169.0, 478.0, 2065.0, 21248.0, 4088356.0, 76758.0, 3625.0, 725.0, 260.0, 143.0, 74.0, 44.0, 37.0, 23.0, 9.0, 11.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.64453125, -2.56353759765625, -2.4825439453125, -2.40155029296875, -2.320556640625, -2.23956298828125, -2.1585693359375, -2.07757568359375, -1.99658203125, -1.91558837890625, -1.8345947265625, -1.75360107421875, -1.672607421875, -1.59161376953125, -1.5106201171875, -1.42962646484375, -1.3486328125, -1.26763916015625, -1.1866455078125, -1.10565185546875, -1.024658203125, -0.94366455078125, -0.8626708984375, -0.78167724609375, -0.70068359375, -0.61968994140625, -0.5386962890625, -0.45770263671875, -0.376708984375, -0.29571533203125, -0.2147216796875, -0.13372802734375, -0.052734375, 0.02825927734375, 0.1092529296875, 0.19024658203125, 0.271240234375, 0.35223388671875, 0.4332275390625, 0.51422119140625, 0.59521484375, 0.67620849609375, 0.7572021484375, 0.83819580078125, 0.919189453125, 1.00018310546875, 1.0811767578125, 1.16217041015625, 1.2431640625, 1.32415771484375, 1.4051513671875, 1.48614501953125, 1.567138671875, 1.64813232421875, 1.7291259765625, 1.81011962890625, 1.89111328125, 1.97210693359375, 2.0531005859375, 2.13409423828125, 2.215087890625, 2.29608154296875, 2.3770751953125, 2.45806884765625, 2.5390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 11.0, 22.0, 42.0, 68.0, 130.0, 407.0, 1774.0, 1030.0, 273.0, 133.0, 60.0, 31.0, 28.0, 18.0, 15.0, 8.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.369140625, -0.35634613037109375, -0.3435516357421875, -0.33075714111328125, -0.317962646484375, -0.30516815185546875, -0.2923736572265625, -0.27957916259765625, -0.26678466796875, -0.25399017333984375, -0.2411956787109375, -0.22840118408203125, -0.215606689453125, -0.20281219482421875, -0.1900177001953125, -0.17722320556640625, -0.1644287109375, -0.15163421630859375, -0.1388397216796875, -0.12604522705078125, -0.113250732421875, -0.10045623779296875, -0.0876617431640625, -0.07486724853515625, -0.06207275390625, -0.04927825927734375, -0.0364837646484375, -0.02368927001953125, -0.010894775390625, 0.00189971923828125, 0.0146942138671875, 0.02748870849609375, 0.040283203125, 0.05307769775390625, 0.0658721923828125, 0.07866668701171875, 0.091461181640625, 0.10425567626953125, 0.1170501708984375, 0.12984466552734375, 0.14263916015625, 0.15543365478515625, 0.1682281494140625, 0.18102264404296875, 0.193817138671875, 0.20661163330078125, 0.2194061279296875, 0.23220062255859375, 0.2449951171875, 0.25778961181640625, 0.2705841064453125, 0.28337860107421875, 0.296173095703125, 0.30896759033203125, 0.3217620849609375, 0.33455657958984375, 0.34735107421875, 0.36014556884765625, 0.3729400634765625, 0.38573455810546875, 0.398529052734375, 0.41132354736328125, 0.4241180419921875, 0.43691253662109375, 0.44970703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 10.0, 26.0, 66.0, 164.0, 317.0, 242.0, 96.0, 41.0, 19.0, 14.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.86831521987915, -4.739267826080322, -4.610220432281494, -4.481173038482666, -4.352125644683838, -4.223078727722168, -4.09403133392334, -3.9649837017059326, -3.8359365463256836, -3.7068891525268555, -3.5778417587280273, -3.448794364929199, -3.31974720954895, -3.190699815750122, -3.061652421951294, -2.932605028152466, -2.8035576343536377, -2.6745102405548096, -2.5454628467559814, -2.4164156913757324, -2.2873682975769043, -2.158320903778076, -2.029273509979248, -1.90022611618042, -1.7711788415908813, -1.6421314477920532, -1.5130841732025146, -1.3840367794036865, -1.2549893856048584, -1.1259421110153198, -0.9968947172164917, -0.8678473830223083, -0.738800048828125, -0.6097527146339417, -0.4807053506374359, -0.3516579866409302, -0.22261065244674683, -0.09356331825256348, 0.03548407554626465, 0.164531409740448, 0.29357874393463135, 0.4226260781288147, 0.551673412322998, 0.6807208061218262, 0.8097681403160095, 0.9388154745101929, 1.067862868309021, 1.1969101428985596, 1.3259575366973877, 1.4550049304962158, 1.5840522050857544, 1.7130995988845825, 1.842146873474121, 1.9711942672729492, 2.1002416610717773, 2.2292890548706055, 2.3583364486694336, 2.4873838424682617, 2.61643123626709, 2.745478630065918, 2.874525785446167, 3.003573179244995, 3.1326205730438232, 3.2616679668426514, 3.3907151222229004]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 10.0, 4.0, 10.0, 11.0, 19.0, 24.0, 15.0, 25.0, 32.0, 59.0, 36.0, 55.0, 56.0, 65.0, 69.0, 57.0, 57.0, 58.0, 46.0, 46.0, 42.0, 34.0, 31.0, 35.0, 19.0, 28.0, 17.0, 13.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08934485912323, -1.0557117462158203, -1.0220786333084106, -0.9884454607963562, -0.9548123478889465, -0.9211792349815369, -0.8875460624694824, -0.8539129495620728, -0.8202798366546631, -0.7866467237472534, -0.7530136108398438, -0.7193804383277893, -0.6857473254203796, -0.65211421251297, -0.6184810400009155, -0.5848479270935059, -0.5512148141860962, -0.5175817012786865, -0.48394855856895447, -0.4503154158592224, -0.41668230295181274, -0.3830491900444031, -0.349416047334671, -0.31578290462493896, -0.2821497917175293, -0.24851666390895844, -0.21488353610038757, -0.1812504082918167, -0.14761728048324585, -0.11398415267467499, -0.08035102486610413, -0.046717897057533264, -0.013084769248962402, 0.02054835855960846, 0.05418148636817932, 0.08781461417675018, 0.12144774198532104, 0.1550808697938919, 0.18871399760246277, 0.22234712541103363, 0.2559802532196045, 0.28961336612701416, 0.3232465088367462, 0.35687965154647827, 0.39051276445388794, 0.4241458773612976, 0.45777902007102966, 0.4914121627807617, 0.5250452756881714, 0.558678388595581, 0.5923115015029907, 0.6259446740150452, 0.6595777869224548, 0.6932108998298645, 0.726844072341919, 0.7604771852493286, 0.7941102981567383, 0.827743411064148, 0.8613765239715576, 0.8950096964836121, 0.9286428093910217, 0.9622759222984314, 0.9959090948104858, 1.0295422077178955, 1.0631753206253052]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 5.0, 11.0, 23.0, 19.0, 18.0, 40.0, 64.0, 71.0, 99.0, 169.0, 253.0, 396.0, 565.0, 885.0, 1554.0, 2717.0, 5307.0, 12258.0, 35164.0, 142347.0, 522189.0, 239921.0, 52776.0, 16829.0, 6831.0, 3307.0, 1820.0, 1022.0, 659.0, 428.0, 249.0, 177.0, 136.0, 75.0, 46.0, 33.0, 26.0, 21.0, 12.0, 8.0, 7.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.55859375, -0.5424766540527344, -0.5263595581054688, -0.5102424621582031, -0.4941253662109375, -0.4780082702636719, -0.46189117431640625, -0.4457740783691406, -0.429656982421875, -0.4135398864746094, -0.39742279052734375, -0.3813056945800781, -0.3651885986328125, -0.3490715026855469, -0.33295440673828125, -0.3168373107910156, -0.30072021484375, -0.2846031188964844, -0.26848602294921875, -0.2523689270019531, -0.2362518310546875, -0.22013473510742188, -0.20401763916015625, -0.18790054321289062, -0.171783447265625, -0.15566635131835938, -0.13954925537109375, -0.12343215942382812, -0.1073150634765625, -0.09119796752929688, -0.07508087158203125, -0.058963775634765625, -0.0428466796875, -0.026729583740234375, -0.01061248779296875, 0.005504608154296875, 0.0216217041015625, 0.037738800048828125, 0.05385589599609375, 0.06997299194335938, 0.086090087890625, 0.10220718383789062, 0.11832427978515625, 0.13444137573242188, 0.1505584716796875, 0.16667556762695312, 0.18279266357421875, 0.19890975952148438, 0.21502685546875, 0.23114395141601562, 0.24726104736328125, 0.2633781433105469, 0.2794952392578125, 0.2956123352050781, 0.31172943115234375, 0.3278465270996094, 0.343963623046875, 0.3600807189941406, 0.37619781494140625, 0.3923149108886719, 0.4084320068359375, 0.4245491027832031, 0.44066619873046875, 0.4567832946777344, 0.472900390625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 17.0, 20.0, 38.0, 48.0, 57.0, 77.0, 79.0, 112.0, 94.0, 82.0, 90.0, 70.0, 59.0, 39.0, 24.0, 20.0, 14.0, 4.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1544189453125, -0.1502523422241211, -0.1460857391357422, -0.14191913604736328, -0.13775253295898438, -0.13358592987060547, -0.12941932678222656, -0.12525272369384766, -0.12108612060546875, -0.11691951751708984, -0.11275291442871094, -0.10858631134033203, -0.10441970825195312, -0.10025310516357422, -0.09608650207519531, -0.0919198989868164, -0.0877532958984375, -0.0835866928100586, -0.07942008972167969, -0.07525348663330078, -0.07108688354492188, -0.06692028045654297, -0.06275367736816406, -0.058587074279785156, -0.05442047119140625, -0.050253868103027344, -0.04608726501464844, -0.04192066192626953, -0.037754058837890625, -0.03358745574951172, -0.029420852661132812, -0.025254249572753906, -0.021087646484375, -0.016921043395996094, -0.012754440307617188, -0.008587837219238281, -0.004421234130859375, -0.00025463104248046875, 0.0039119720458984375, 0.008078575134277344, 0.01224517822265625, 0.016411781311035156, 0.020578384399414062, 0.02474498748779297, 0.028911590576171875, 0.03307819366455078, 0.03724479675292969, 0.041411399841308594, 0.0455780029296875, 0.049744606018066406, 0.05391120910644531, 0.05807781219482422, 0.062244415283203125, 0.06641101837158203, 0.07057762145996094, 0.07474422454833984, 0.07891082763671875, 0.08307743072509766, 0.08724403381347656, 0.09141063690185547, 0.09557723999023438, 0.09974384307861328, 0.10391044616699219, 0.1080770492553711, 0.11224365234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 16.0, 16.0, 16.0, 33.0, 46.0, 36.0, 45.0, 89.0, 145.0, 234.0, 414.0, 731.0, 1450.0, 3115.0, 6936.0, 16487.0, 43181.0, 128447.0, 363211.0, 317673.0, 104890.0, 36048.0, 14083.0, 5687.0, 2584.0, 1265.0, 634.0, 356.0, 216.0, 120.0, 78.0, 66.0, 38.0, 32.0, 18.0, 19.0, 22.0, 11.0, 17.0, 6.0, 6.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.31298828125, -0.3031806945800781, -0.29337310791015625, -0.2835655212402344, -0.2737579345703125, -0.2639503479003906, -0.25414276123046875, -0.24433517456054688, -0.234527587890625, -0.22472000122070312, -0.21491241455078125, -0.20510482788085938, -0.1952972412109375, -0.18548965454101562, -0.17568206787109375, -0.16587448120117188, -0.15606689453125, -0.14625930786132812, -0.13645172119140625, -0.12664413452148438, -0.1168365478515625, -0.10702896118164062, -0.09722137451171875, -0.08741378784179688, -0.077606201171875, -0.06779861450195312, -0.05799102783203125, -0.048183441162109375, -0.0383758544921875, -0.028568267822265625, -0.01876068115234375, -0.008953094482421875, 0.0008544921875, 0.010662078857421875, 0.02046966552734375, 0.030277252197265625, 0.0400848388671875, 0.049892425537109375, 0.05970001220703125, 0.06950759887695312, 0.079315185546875, 0.08912277221679688, 0.09893035888671875, 0.10873794555664062, 0.1185455322265625, 0.12835311889648438, 0.13816070556640625, 0.14796829223632812, 0.15777587890625, 0.16758346557617188, 0.17739105224609375, 0.18719863891601562, 0.1970062255859375, 0.20681381225585938, 0.21662139892578125, 0.22642898559570312, 0.236236572265625, 0.24604415893554688, 0.25585174560546875, 0.2656593322753906, 0.2754669189453125, 0.2852745056152344, 0.29508209228515625, 0.3048896789550781, 0.314697265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 6.0, 8.0, 13.0, 9.0, 16.0, 20.0, 17.0, 24.0, 19.0, 26.0, 28.0, 28.0, 40.0, 32.0, 38.0, 39.0, 31.0, 33.0, 44.0, 32.0, 37.0, 38.0, 39.0, 36.0, 41.0, 28.0, 24.0, 35.0, 25.0, 37.0, 19.0, 10.0, 25.0, 15.0, 13.0, 15.0, 9.0, 15.0, 10.0, 5.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.301513671875, -0.2927284240722656, -0.28394317626953125, -0.2751579284667969, -0.2663726806640625, -0.2575874328613281, -0.24880218505859375, -0.24001693725585938, -0.231231689453125, -0.22244644165039062, -0.21366119384765625, -0.20487594604492188, -0.1960906982421875, -0.18730545043945312, -0.17852020263671875, -0.16973495483398438, -0.16094970703125, -0.15216445922851562, -0.14337921142578125, -0.13459396362304688, -0.1258087158203125, -0.11702346801757812, -0.10823822021484375, -0.09945297241210938, -0.090667724609375, -0.08188247680664062, -0.07309722900390625, -0.06431198120117188, -0.0555267333984375, -0.046741485595703125, -0.03795623779296875, -0.029170989990234375, -0.0203857421875, -0.011600494384765625, -0.00281524658203125, 0.005970001220703125, 0.0147552490234375, 0.023540496826171875, 0.03232574462890625, 0.041110992431640625, 0.049896240234375, 0.058681488037109375, 0.06746673583984375, 0.07625198364257812, 0.0850372314453125, 0.09382247924804688, 0.10260772705078125, 0.11139297485351562, 0.12017822265625, 0.12896347045898438, 0.13774871826171875, 0.14653396606445312, 0.1553192138671875, 0.16410446166992188, 0.17288970947265625, 0.18167495727539062, 0.190460205078125, 0.19924545288085938, 0.20803070068359375, 0.21681594848632812, 0.2256011962890625, 0.23438644409179688, 0.24317169189453125, 0.2519569396972656, 0.2607421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 7.0, 7.0, 2.0, 8.0, 14.0, 13.0, 19.0, 39.0, 63.0, 111.0, 268.0, 715.0, 2088.0, 9453.0, 67438.0, 581348.0, 343061.0, 35531.0, 5920.0, 1493.0, 469.0, 227.0, 101.0, 53.0, 40.0, 20.0, 14.0, 9.0, 11.0, 1.0, 4.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22802734375, -0.22063636779785156, -0.21324539184570312, -0.2058544158935547, -0.19846343994140625, -0.1910724639892578, -0.18368148803710938, -0.17629051208496094, -0.1688995361328125, -0.16150856018066406, -0.15411758422851562, -0.1467266082763672, -0.13933563232421875, -0.1319446563720703, -0.12455368041992188, -0.11716270446777344, -0.109771728515625, -0.10238075256347656, -0.09498977661132812, -0.08759880065917969, -0.08020782470703125, -0.07281684875488281, -0.06542587280273438, -0.05803489685058594, -0.0506439208984375, -0.04325294494628906, -0.035861968994140625, -0.028470993041992188, -0.02108001708984375, -0.013689041137695312, -0.006298065185546875, 0.0010929107666015625, 0.00848388671875, 0.015874862670898438, 0.023265838623046875, 0.030656814575195312, 0.03804779052734375, 0.04543876647949219, 0.052829742431640625, 0.06022071838378906, 0.0676116943359375, 0.07500267028808594, 0.08239364624023438, 0.08978462219238281, 0.09717559814453125, 0.10456657409667969, 0.11195755004882812, 0.11934852600097656, 0.126739501953125, 0.13413047790527344, 0.14152145385742188, 0.1489124298095703, 0.15630340576171875, 0.1636943817138672, 0.17108535766601562, 0.17847633361816406, 0.1858673095703125, 0.19325828552246094, 0.20064926147460938, 0.2080402374267578, 0.21543121337890625, 0.2228221893310547, 0.23021316528320312, 0.23760414123535156, 0.2449951171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 1.0, 0.0, 8.0, 4.0, 8.0, 9.0, 3.0, 15.0, 22.0, 21.0, 27.0, 28.0, 34.0, 31.0, 41.0, 48.0, 54.0, 71.0, 62.0, 72.0, 61.0, 62.0, 51.0, 44.0, 42.0, 29.0, 22.0, 20.0, 18.0, 17.0, 8.0, 14.0, 9.0, 7.0, 9.0, 8.0, 4.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.528594970703125e-05, -3.425776958465576e-05, -3.3229589462280273e-05, -3.2201409339904785e-05, -3.11732292175293e-05, -3.014504909515381e-05, -2.911686897277832e-05, -2.8088688850402832e-05, -2.7060508728027344e-05, -2.6032328605651855e-05, -2.5004148483276367e-05, -2.397596836090088e-05, -2.294778823852539e-05, -2.1919608116149902e-05, -2.0891427993774414e-05, -1.9863247871398926e-05, -1.8835067749023438e-05, -1.780688762664795e-05, -1.677870750427246e-05, -1.5750527381896973e-05, -1.4722347259521484e-05, -1.3694167137145996e-05, -1.2665987014770508e-05, -1.163780689239502e-05, -1.0609626770019531e-05, -9.581446647644043e-06, -8.553266525268555e-06, -7.525086402893066e-06, -6.496906280517578e-06, -5.46872615814209e-06, -4.4405460357666016e-06, -3.4123659133911133e-06, -2.384185791015625e-06, -1.3560056686401367e-06, -3.2782554626464844e-07, 7.003545761108398e-07, 1.7285346984863281e-06, 2.7567148208618164e-06, 3.7848949432373047e-06, 4.813075065612793e-06, 5.841255187988281e-06, 6.8694353103637695e-06, 7.897615432739258e-06, 8.925795555114746e-06, 9.953975677490234e-06, 1.0982155799865723e-05, 1.2010335922241211e-05, 1.30385160446167e-05, 1.4066696166992188e-05, 1.5094876289367676e-05, 1.6123056411743164e-05, 1.7151236534118652e-05, 1.817941665649414e-05, 1.920759677886963e-05, 2.0235776901245117e-05, 2.1263957023620605e-05, 2.2292137145996094e-05, 2.3320317268371582e-05, 2.434849739074707e-05, 2.537667751312256e-05, 2.6404857635498047e-05, 2.7433037757873535e-05, 2.8461217880249023e-05, 2.9489398002624512e-05, 3.0517578125e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 12.0, 24.0, 35.0, 64.0, 99.0, 197.0, 358.0, 707.0, 1501.0, 4625.0, 18940.0, 117603.0, 650489.0, 212782.0, 30544.0, 6626.0, 2131.0, 847.0, 427.0, 209.0, 145.0, 73.0, 30.0, 23.0, 25.0, 8.0, 13.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2705078125, -0.2626991271972656, -0.25489044189453125, -0.24708175659179688, -0.2392730712890625, -0.23146438598632812, -0.22365570068359375, -0.21584701538085938, -0.208038330078125, -0.20022964477539062, -0.19242095947265625, -0.18461227416992188, -0.1768035888671875, -0.16899490356445312, -0.16118621826171875, -0.15337753295898438, -0.14556884765625, -0.13776016235351562, -0.12995147705078125, -0.12214279174804688, -0.1143341064453125, -0.10652542114257812, -0.09871673583984375, -0.09090805053710938, -0.083099365234375, -0.07529067993164062, -0.06748199462890625, -0.059673309326171875, -0.0518646240234375, -0.044055938720703125, -0.03624725341796875, -0.028438568115234375, -0.0206298828125, -0.012821197509765625, -0.00501251220703125, 0.002796173095703125, 0.0106048583984375, 0.018413543701171875, 0.02622222900390625, 0.034030914306640625, 0.041839599609375, 0.049648284912109375, 0.05745697021484375, 0.06526565551757812, 0.0730743408203125, 0.08088302612304688, 0.08869171142578125, 0.09650039672851562, 0.10430908203125, 0.11211776733398438, 0.11992645263671875, 0.12773513793945312, 0.1355438232421875, 0.14335250854492188, 0.15116119384765625, 0.15896987915039062, 0.166778564453125, 0.17458724975585938, 0.18239593505859375, 0.19020462036132812, 0.1980133056640625, 0.20582199096679688, 0.21363067626953125, 0.22143936157226562, 0.229248046875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 11.0, 8.0, 25.0, 38.0, 64.0, 64.0, 100.0, 137.0, 167.0, 113.0, 92.0, 65.0, 35.0, 32.0, 23.0, 15.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22732162475585938, -0.22051239013671875, -0.21370315551757812, -0.2068939208984375, -0.20008468627929688, -0.19327545166015625, -0.18646621704101562, -0.179656982421875, -0.17284774780273438, -0.16603851318359375, -0.15922927856445312, -0.1524200439453125, -0.14561080932617188, -0.13880157470703125, -0.13199234008789062, -0.12518310546875, -0.11837387084960938, -0.11156463623046875, -0.10475540161132812, -0.0979461669921875, -0.09113693237304688, -0.08432769775390625, -0.07751846313476562, -0.070709228515625, -0.06389999389648438, -0.05709075927734375, -0.050281524658203125, -0.0434722900390625, -0.036663055419921875, -0.02985382080078125, -0.023044586181640625, -0.0162353515625, -0.009426116943359375, -0.00261688232421875, 0.004192352294921875, 0.0110015869140625, 0.017810821533203125, 0.02462005615234375, 0.031429290771484375, 0.038238525390625, 0.045047760009765625, 0.05185699462890625, 0.058666229248046875, 0.0654754638671875, 0.07228469848632812, 0.07909393310546875, 0.08590316772460938, 0.09271240234375, 0.09952163696289062, 0.10633087158203125, 0.11314010620117188, 0.1199493408203125, 0.12675857543945312, 0.13356781005859375, 0.14037704467773438, 0.147186279296875, 0.15399551391601562, 0.16080474853515625, 0.16761398315429688, 0.1744232177734375, 0.18123245239257812, 0.18804168701171875, 0.19485092163085938, 0.20166015625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 11.0, 8.0, 30.0, 49.0, 67.0, 140.0, 250.0, 186.0, 113.0, 60.0, 45.0, 16.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8819222450256348, -2.774542808532715, -2.667163372039795, -2.559783935546875, -2.452404260635376, -2.345024824142456, -2.237645387649536, -2.130265951156616, -2.0228865146636963, -1.9155070781707764, -1.808127522468567, -1.700748085975647, -1.593368649482727, -1.4859890937805176, -1.3786096572875977, -1.2712302207946777, -1.1638506650924683, -1.0564712285995483, -0.9490917325019836, -0.841712236404419, -0.734332799911499, -0.6269533038139343, -0.5195738077163696, -0.4121943712234497, -0.304814875125885, -0.1974354088306427, -0.0900559276342392, 0.017323553562164307, 0.12470301985740662, 0.23208248615264893, 0.3394619822502136, 0.44684141874313354, 0.5542209148406982, 0.6616004109382629, 0.7689798474311829, 0.8763593435287476, 0.9837387800216675, 1.091118335723877, 1.1984977722167969, 1.3058772087097168, 1.4132566452026367, 1.5206360816955566, 1.6280156373977661, 1.735395073890686, 1.842774510383606, 1.9501540660858154, 2.0575335025787354, 2.1649129390716553, 2.2722926139831543, 2.379672050476074, 2.487051486968994, 2.594430923461914, 2.701810598373413, 2.809190034866333, 2.916569471359253, 3.023948907852173, 3.1313283443450928, 3.2387077808380127, 3.3460872173309326, 3.4534668922424316, 3.5608463287353516, 3.6682257652282715, 3.7756052017211914, 3.8829846382141113, 3.9903640747070312]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 1.0, 8.0, 10.0, 11.0, 12.0, 19.0, 22.0, 25.0, 28.0, 33.0, 50.0, 36.0, 47.0, 54.0, 62.0, 57.0, 58.0, 55.0, 55.0, 52.0, 42.0, 39.0, 35.0, 32.0, 37.0, 18.0, 25.0, 22.0, 11.0, 17.0, 8.0, 2.0, 6.0, 3.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7582156658172607, -1.6930890083312988, -1.627962350845337, -1.562835693359375, -1.497709035873413, -1.4325823783874512, -1.3674558401107788, -1.302329182624817, -1.237202525138855, -1.172075867652893, -1.1069492101669312, -1.0418225526809692, -0.9766959547996521, -0.9115692973136902, -0.846442699432373, -0.7813160419464111, -0.7161893844604492, -0.6510627269744873, -0.5859360694885254, -0.5208094716072083, -0.45568281412124634, -0.3905561566352844, -0.3254295289516449, -0.26030290126800537, -0.19517624378204346, -0.13004960119724274, -0.06492295861244202, 0.0002036839723587036, 0.06533032655715942, 0.13045698404312134, 0.19558361172676086, 0.2607102394104004, 0.3258371353149414, 0.3909637928009033, 0.45609042048454285, 0.5212170481681824, 0.5863437056541443, 0.6514703631401062, 0.7165969610214233, 0.7817236185073853, 0.8468502759933472, 0.9119769334793091, 0.977103590965271, 1.042230248451233, 1.1073567867279053, 1.1724834442138672, 1.237610101699829, 1.302736759185791, 1.367863416671753, 1.4329900741577148, 1.4981167316436768, 1.5632433891296387, 1.6283700466156006, 1.6934967041015625, 1.7586232423782349, 1.8237498998641968, 1.8888765573501587, 1.9540032148361206, 2.019129753112793, 2.084256410598755, 2.149383068084717, 2.2145097255706787, 2.2796363830566406, 2.3447630405426025, 2.4098896980285645]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 8.0, 9.0, 7.0, 12.0, 15.0, 13.0, 23.0, 40.0, 51.0, 71.0, 123.0, 182.0, 294.0, 551.0, 1215.0, 3491.0, 13877.0, 147908.0, 3972464.0, 41942.0, 7458.0, 2384.0, 980.0, 511.0, 245.0, 141.0, 105.0, 52.0, 33.0, 33.0, 11.0, 4.0, 16.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.068359375, -1.0330963134765625, -0.997833251953125, -0.9625701904296875, -0.92730712890625, -0.8920440673828125, -0.856781005859375, -0.8215179443359375, -0.7862548828125, -0.7509918212890625, -0.715728759765625, -0.6804656982421875, -0.64520263671875, -0.6099395751953125, -0.574676513671875, -0.5394134521484375, -0.504150390625, -0.4688873291015625, -0.433624267578125, -0.3983612060546875, -0.36309814453125, -0.3278350830078125, -0.292572021484375, -0.2573089599609375, -0.2220458984375, -0.1867828369140625, -0.151519775390625, -0.1162567138671875, -0.08099365234375, -0.0457305908203125, -0.010467529296875, 0.0247955322265625, 0.06005859375, 0.0953216552734375, 0.130584716796875, 0.1658477783203125, 0.20111083984375, 0.2363739013671875, 0.271636962890625, 0.3069000244140625, 0.3421630859375, 0.3774261474609375, 0.412689208984375, 0.4479522705078125, 0.48321533203125, 0.5184783935546875, 0.553741455078125, 0.5890045166015625, 0.624267578125, 0.6595306396484375, 0.694793701171875, 0.7300567626953125, 0.76531982421875, 0.8005828857421875, 0.835845947265625, 0.8711090087890625, 0.9063720703125, 0.9416351318359375, 0.976898193359375, 1.0121612548828125, 1.04742431640625, 1.0826873779296875, 1.117950439453125, 1.1532135009765625, 1.1884765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 7.0, 10.0, 12.0, 19.0, 31.0, 34.0, 32.0, 38.0, 56.0, 65.0, 74.0, 86.0, 76.0, 90.0, 58.0, 69.0, 58.0, 45.0, 32.0, 21.0, 21.0, 13.0, 7.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.12939453125, -0.12581825256347656, -0.12224197387695312, -0.11866569519042969, -0.11508941650390625, -0.11151313781738281, -0.10793685913085938, -0.10436058044433594, -0.1007843017578125, -0.09720802307128906, -0.09363174438476562, -0.09005546569824219, -0.08647918701171875, -0.08290290832519531, -0.07932662963867188, -0.07575035095214844, -0.072174072265625, -0.06859779357910156, -0.06502151489257812, -0.06144523620605469, -0.05786895751953125, -0.05429267883300781, -0.050716400146484375, -0.04714012145996094, -0.0435638427734375, -0.03998756408691406, -0.036411285400390625, -0.03283500671386719, -0.02925872802734375, -0.025682449340820312, -0.022106170654296875, -0.018529891967773438, -0.01495361328125, -0.011377334594726562, -0.007801055908203125, -0.0042247772216796875, -0.00064849853515625, 0.0029277801513671875, 0.006504058837890625, 0.010080337524414062, 0.0136566162109375, 0.017232894897460938, 0.020809173583984375, 0.024385452270507812, 0.02796173095703125, 0.03153800964355469, 0.035114288330078125, 0.03869056701660156, 0.042266845703125, 0.04584312438964844, 0.049419403076171875, 0.05299568176269531, 0.05657196044921875, 0.06014823913574219, 0.06372451782226562, 0.06730079650878906, 0.0708770751953125, 0.07445335388183594, 0.07802963256835938, 0.08160591125488281, 0.08518218994140625, 0.08875846862792969, 0.09233474731445312, 0.09591102600097656, 0.0994873046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 10.0, 6.0, 18.0, 18.0, 36.0, 39.0, 47.0, 110.0, 123.0, 199.0, 353.0, 542.0, 949.0, 1754.0, 3382.0, 7304.0, 17701.0, 56132.0, 387202.0, 3438701.0, 212971.0, 40922.0, 13729.0, 5742.0, 2795.0, 1432.0, 801.0, 485.0, 256.0, 155.0, 105.0, 80.0, 53.0, 36.0, 29.0, 23.0, 16.0, 7.0, 10.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39208984375, -0.37776947021484375, -0.3634490966796875, -0.34912872314453125, -0.334808349609375, -0.32048797607421875, -0.3061676025390625, -0.29184722900390625, -0.27752685546875, -0.26320648193359375, -0.2488861083984375, -0.23456573486328125, -0.220245361328125, -0.20592498779296875, -0.1916046142578125, -0.17728424072265625, -0.1629638671875, -0.14864349365234375, -0.1343231201171875, -0.12000274658203125, -0.105682373046875, -0.09136199951171875, -0.0770416259765625, -0.06272125244140625, -0.04840087890625, -0.03408050537109375, -0.0197601318359375, -0.00543975830078125, 0.008880615234375, 0.02320098876953125, 0.0375213623046875, 0.05184173583984375, 0.066162109375, 0.08048248291015625, 0.0948028564453125, 0.10912322998046875, 0.123443603515625, 0.13776397705078125, 0.1520843505859375, 0.16640472412109375, 0.18072509765625, 0.19504547119140625, 0.2093658447265625, 0.22368621826171875, 0.238006591796875, 0.25232696533203125, 0.2666473388671875, 0.28096771240234375, 0.2952880859375, 0.30960845947265625, 0.3239288330078125, 0.33824920654296875, 0.352569580078125, 0.36688995361328125, 0.3812103271484375, 0.39553070068359375, 0.40985107421875, 0.42417144775390625, 0.4384918212890625, 0.45281219482421875, 0.467132568359375, 0.48145294189453125, 0.4957733154296875, 0.5100936889648438, 0.5244140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 5.0, 9.0, 5.0, 10.0, 6.0, 16.0, 15.0, 22.0, 37.0, 56.0, 80.0, 162.0, 386.0, 1607.0, 978.0, 290.0, 148.0, 84.0, 62.0, 33.0, 18.0, 18.0, 15.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2320556640625, -0.22575950622558594, -0.21946334838867188, -0.2131671905517578, -0.20687103271484375, -0.2005748748779297, -0.19427871704101562, -0.18798255920410156, -0.1816864013671875, -0.17539024353027344, -0.16909408569335938, -0.1627979278564453, -0.15650177001953125, -0.1502056121826172, -0.14390945434570312, -0.13761329650878906, -0.131317138671875, -0.12502098083496094, -0.11872482299804688, -0.11242866516113281, -0.10613250732421875, -0.09983634948730469, -0.09354019165039062, -0.08724403381347656, -0.0809478759765625, -0.07465171813964844, -0.06835556030273438, -0.06205940246582031, -0.05576324462890625, -0.04946708679199219, -0.043170928955078125, -0.03687477111816406, -0.03057861328125, -0.024282455444335938, -0.017986297607421875, -0.011690139770507812, -0.00539398193359375, 0.0009021759033203125, 0.007198333740234375, 0.013494491577148438, 0.0197906494140625, 0.026086807250976562, 0.032382965087890625, 0.03867912292480469, 0.04497528076171875, 0.05127143859863281, 0.057567596435546875, 0.06386375427246094, 0.070159912109375, 0.07645606994628906, 0.08275222778320312, 0.08904838562011719, 0.09534454345703125, 0.10164070129394531, 0.10793685913085938, 0.11423301696777344, 0.1205291748046875, 0.12682533264160156, 0.13312149047851562, 0.1394176483154297, 0.14571380615234375, 0.1520099639892578, 0.15830612182617188, 0.16460227966308594, 0.1708984375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 2.0, 3.0, 6.0, 6.0, 15.0, 40.0, 53.0, 109.0, 140.0, 195.0, 169.0, 120.0, 74.0, 25.0, 20.0, 9.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8479150533676147, -1.8002554178237915, -1.7525957822799683, -1.704936146736145, -1.6572763919830322, -1.609616756439209, -1.5619571208953857, -1.5142974853515625, -1.4666378498077393, -1.418978214263916, -1.3713185787200928, -1.3236589431762695, -1.2759993076324463, -1.2283395528793335, -1.1806799173355103, -1.133020281791687, -1.0853606462478638, -1.0377010107040405, -0.9900413751602173, -0.9423816800117493, -0.894722044467926, -0.8470624089241028, -0.7994027137756348, -0.7517430782318115, -0.7040834426879883, -0.656423807144165, -0.6087641716003418, -0.5611044764518738, -0.5134448409080505, -0.4657852053642273, -0.41812554001808167, -0.37046587467193604, -0.32280611991882324, -0.275146484375, -0.22748681902885437, -0.17982716858386993, -0.1321675181388855, -0.08450786769390106, -0.036848217248916626, 0.010811448097229004, 0.058471083641052246, 0.10613073408603668, 0.15379038453102112, 0.20145003497600555, 0.24910968542099, 0.29676932096481323, 0.34442898631095886, 0.3920886516571045, 0.43974828720092773, 0.487407922744751, 0.5350675582885742, 0.5827272534370422, 0.6303868889808655, 0.6780465245246887, 0.7257062196731567, 0.77336585521698, 0.8210254907608032, 0.8686851263046265, 0.9163447618484497, 0.9640044569969177, 1.0116641521453857, 1.059323787689209, 1.1069834232330322, 1.1546430587768555, 1.2023026943206787]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 0.0, 3.0, 7.0, 10.0, 10.0, 9.0, 13.0, 20.0, 14.0, 24.0, 26.0, 32.0, 13.0, 38.0, 34.0, 38.0, 42.0, 33.0, 37.0, 47.0, 39.0, 49.0, 30.0, 35.0, 45.0, 43.0, 38.0, 31.0, 30.0, 31.0, 26.0, 30.0, 24.0, 18.0, 16.0, 14.0, 15.0, 9.0, 9.0, 3.0, 4.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5908243656158447, -0.5731974244117737, -0.5555704832077026, -0.5379435420036316, -0.5203166007995605, -0.5026896595954895, -0.48506271839141846, -0.4674357771873474, -0.44980883598327637, -0.4321818947792053, -0.4145549535751343, -0.39692801237106323, -0.3793010711669922, -0.36167412996292114, -0.3440471887588501, -0.32642024755477905, -0.3087932765483856, -0.2911663353443146, -0.27353939414024353, -0.2559124529361725, -0.23828551173210144, -0.2206585705280304, -0.20303161442279816, -0.1854046732187271, -0.16777773201465607, -0.15015079081058502, -0.13252384960651398, -0.11489690095186234, -0.09726995974779129, -0.07964301854372025, -0.062016069889068604, -0.04438912868499756, -0.026762187480926514, -0.00913524441421032, 0.008491698652505875, 0.026118643581867218, 0.04374558478593826, 0.06137252599000931, 0.07899947464466095, 0.096626415848732, 0.11425335705280304, 0.13188029825687408, 0.14950723946094513, 0.16713419556617737, 0.1847611367702484, 0.20238807797431946, 0.2200150191783905, 0.23764196038246155, 0.2552689015865326, 0.27289584279060364, 0.2905227839946747, 0.3081497251987457, 0.3257766664028168, 0.3434036076068878, 0.36103057861328125, 0.3786575198173523, 0.39628446102142334, 0.4139114022254944, 0.43153834342956543, 0.4491652846336365, 0.4667922258377075, 0.48441916704177856, 0.5020461082458496, 0.5196730494499207, 0.5372999906539917]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 8.0, 10.0, 13.0, 16.0, 17.0, 30.0, 59.0, 78.0, 141.0, 206.0, 272.0, 470.0, 725.0, 1263.0, 2210.0, 4322.0, 9220.0, 22736.0, 75838.0, 331930.0, 436740.0, 109177.0, 30140.0, 11340.0, 5248.0, 2631.0, 1399.0, 832.0, 529.0, 335.0, 182.0, 150.0, 83.0, 66.0, 52.0, 25.0, 13.0, 13.0, 4.0, 5.0, 3.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4267578125, -0.41304779052734375, -0.3993377685546875, -0.38562774658203125, -0.371917724609375, -0.35820770263671875, -0.3444976806640625, -0.33078765869140625, -0.31707763671875, -0.30336761474609375, -0.2896575927734375, -0.27594757080078125, -0.262237548828125, -0.24852752685546875, -0.2348175048828125, -0.22110748291015625, -0.2073974609375, -0.19368743896484375, -0.1799774169921875, -0.16626739501953125, -0.152557373046875, -0.13884735107421875, -0.1251373291015625, -0.11142730712890625, -0.09771728515625, -0.08400726318359375, -0.0702972412109375, -0.05658721923828125, -0.042877197265625, -0.02916717529296875, -0.0154571533203125, -0.00174713134765625, 0.011962890625, 0.02567291259765625, 0.0393829345703125, 0.05309295654296875, 0.066802978515625, 0.08051300048828125, 0.0942230224609375, 0.10793304443359375, 0.12164306640625, 0.13535308837890625, 0.1490631103515625, 0.16277313232421875, 0.176483154296875, 0.19019317626953125, 0.2039031982421875, 0.21761322021484375, 0.2313232421875, 0.24503326416015625, 0.2587432861328125, 0.27245330810546875, 0.286163330078125, 0.29987335205078125, 0.3135833740234375, 0.32729339599609375, 0.34100341796875, 0.35471343994140625, 0.3684234619140625, 0.38213348388671875, 0.395843505859375, 0.40955352783203125, 0.4232635498046875, 0.43697357177734375, 0.45068359375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 10.0, 9.0, 10.0, 13.0, 17.0, 22.0, 29.0, 34.0, 52.0, 58.0, 70.0, 74.0, 68.0, 81.0, 81.0, 81.0, 75.0, 41.0, 47.0, 28.0, 23.0, 19.0, 18.0, 10.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.12445068359375, -0.12069225311279297, -0.11693382263183594, -0.1131753921508789, -0.10941696166992188, -0.10565853118896484, -0.10190010070800781, -0.09814167022705078, -0.09438323974609375, -0.09062480926513672, -0.08686637878417969, -0.08310794830322266, -0.07934951782226562, -0.0755910873413086, -0.07183265686035156, -0.06807422637939453, -0.0643157958984375, -0.06055736541748047, -0.05679893493652344, -0.053040504455566406, -0.049282073974609375, -0.045523643493652344, -0.04176521301269531, -0.03800678253173828, -0.03424835205078125, -0.03048992156982422, -0.026731491088867188, -0.022973060607910156, -0.019214630126953125, -0.015456199645996094, -0.011697769165039062, -0.007939338684082031, -0.004180908203125, -0.00042247772216796875, 0.0033359527587890625, 0.007094383239746094, 0.010852813720703125, 0.014611244201660156, 0.018369674682617188, 0.02212810516357422, 0.02588653564453125, 0.02964496612548828, 0.03340339660644531, 0.037161827087402344, 0.040920257568359375, 0.044678688049316406, 0.04843711853027344, 0.05219554901123047, 0.0559539794921875, 0.05971240997314453, 0.06347084045410156, 0.0672292709350586, 0.07098770141601562, 0.07474613189697266, 0.07850456237792969, 0.08226299285888672, 0.08602142333984375, 0.08977985382080078, 0.09353828430175781, 0.09729671478271484, 0.10105514526367188, 0.1048135757446289, 0.10857200622558594, 0.11233043670654297, 0.1160888671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 11.0, 10.0, 16.0, 27.0, 31.0, 41.0, 57.0, 66.0, 139.0, 196.0, 259.0, 414.0, 676.0, 1198.0, 2017.0, 3920.0, 7150.0, 14302.0, 30676.0, 70656.0, 175920.0, 332688.0, 234149.0, 95667.0, 39889.0, 18527.0, 9022.0, 4619.0, 2565.0, 1368.0, 777.0, 536.0, 273.0, 201.0, 162.0, 81.0, 88.0, 53.0, 33.0, 20.0, 15.0, 10.0, 12.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.2392578125, -0.23215103149414062, -0.22504425048828125, -0.21793746948242188, -0.2108306884765625, -0.20372390747070312, -0.19661712646484375, -0.18951034545898438, -0.182403564453125, -0.17529678344726562, -0.16819000244140625, -0.16108322143554688, -0.1539764404296875, -0.14686965942382812, -0.13976287841796875, -0.13265609741210938, -0.12554931640625, -0.11844253540039062, -0.11133575439453125, -0.10422897338867188, -0.0971221923828125, -0.09001541137695312, -0.08290863037109375, -0.07580184936523438, -0.068695068359375, -0.061588287353515625, -0.05448150634765625, -0.047374725341796875, -0.0402679443359375, -0.033161163330078125, -0.02605438232421875, -0.018947601318359375, -0.0118408203125, -0.004734039306640625, 0.00237274169921875, 0.009479522705078125, 0.0165863037109375, 0.023693084716796875, 0.03079986572265625, 0.037906646728515625, 0.045013427734375, 0.052120208740234375, 0.05922698974609375, 0.06633377075195312, 0.0734405517578125, 0.08054733276367188, 0.08765411376953125, 0.09476089477539062, 0.10186767578125, 0.10897445678710938, 0.11608123779296875, 0.12318801879882812, 0.1302947998046875, 0.13740158081054688, 0.14450836181640625, 0.15161514282226562, 0.158721923828125, 0.16582870483398438, 0.17293548583984375, 0.18004226684570312, 0.1871490478515625, 0.19425582885742188, 0.20136260986328125, 0.20846939086914062, 0.215576171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 2.0, 0.0, 7.0, 8.0, 12.0, 2.0, 11.0, 8.0, 15.0, 13.0, 22.0, 17.0, 16.0, 21.0, 28.0, 35.0, 29.0, 27.0, 25.0, 26.0, 40.0, 38.0, 37.0, 34.0, 39.0, 36.0, 43.0, 34.0, 31.0, 43.0, 32.0, 23.0, 32.0, 30.0, 21.0, 24.0, 10.0, 14.0, 14.0, 24.0, 11.0, 12.0, 9.0, 6.0, 6.0, 5.0, 5.0, 5.0, 9.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.278076171875, -0.26966094970703125, -0.2612457275390625, -0.25283050537109375, -0.244415283203125, -0.23600006103515625, -0.2275848388671875, -0.21916961669921875, -0.21075439453125, -0.20233917236328125, -0.1939239501953125, -0.18550872802734375, -0.177093505859375, -0.16867828369140625, -0.1602630615234375, -0.15184783935546875, -0.1434326171875, -0.13501739501953125, -0.1266021728515625, -0.11818695068359375, -0.109771728515625, -0.10135650634765625, -0.0929412841796875, -0.08452606201171875, -0.07611083984375, -0.06769561767578125, -0.0592803955078125, -0.05086517333984375, -0.042449951171875, -0.03403472900390625, -0.0256195068359375, -0.01720428466796875, -0.0087890625, -0.00037384033203125, 0.0080413818359375, 0.01645660400390625, 0.024871826171875, 0.03328704833984375, 0.0417022705078125, 0.05011749267578125, 0.05853271484375, 0.06694793701171875, 0.0753631591796875, 0.08377838134765625, 0.092193603515625, 0.10060882568359375, 0.1090240478515625, 0.11743927001953125, 0.1258544921875, 0.13426971435546875, 0.1426849365234375, 0.15110015869140625, 0.159515380859375, 0.16793060302734375, 0.1763458251953125, 0.18476104736328125, 0.19317626953125, 0.20159149169921875, 0.2100067138671875, 0.21842193603515625, 0.226837158203125, 0.23525238037109375, 0.2436676025390625, 0.25208282470703125, 0.260498046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 12.0, 12.0, 29.0, 38.0, 71.0, 128.0, 372.0, 873.0, 3758.0, 29311.0, 419876.0, 546919.0, 40511.0, 4768.0, 1137.0, 382.0, 165.0, 83.0, 41.0, 26.0, 16.0, 9.0, 7.0, 2.0, 7.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2841796875, -0.2755851745605469, -0.26699066162109375, -0.2583961486816406, -0.2498016357421875, -0.24120712280273438, -0.23261260986328125, -0.22401809692382812, -0.215423583984375, -0.20682907104492188, -0.19823455810546875, -0.18964004516601562, -0.1810455322265625, -0.17245101928710938, -0.16385650634765625, -0.15526199340820312, -0.14666748046875, -0.13807296752929688, -0.12947845458984375, -0.12088394165039062, -0.1122894287109375, -0.10369491577148438, -0.09510040283203125, -0.08650588989257812, -0.077911376953125, -0.06931686401367188, -0.06072235107421875, -0.052127838134765625, -0.0435333251953125, -0.034938812255859375, -0.02634429931640625, -0.017749786376953125, -0.0091552734375, -0.000560760498046875, 0.00803375244140625, 0.016628265380859375, 0.0252227783203125, 0.033817291259765625, 0.04241180419921875, 0.051006317138671875, 0.059600830078125, 0.06819534301757812, 0.07678985595703125, 0.08538436889648438, 0.0939788818359375, 0.10257339477539062, 0.11116790771484375, 0.11976242065429688, 0.12835693359375, 0.13695144653320312, 0.14554595947265625, 0.15414047241210938, 0.1627349853515625, 0.17132949829101562, 0.17992401123046875, 0.18851852416992188, 0.197113037109375, 0.20570755004882812, 0.21430206298828125, 0.22289657592773438, 0.2314910888671875, 0.24008560180664062, 0.24868011474609375, 0.2572746276855469, 0.265869140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 5.0, 10.0, 7.0, 8.0, 12.0, 18.0, 21.0, 19.0, 28.0, 39.0, 52.0, 74.0, 60.0, 82.0, 78.0, 77.0, 80.0, 52.0, 50.0, 48.0, 44.0, 18.0, 21.0, 21.0, 20.0, 16.0, 6.0, 7.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1604042053222656e-05, -4.039797931909561e-05, -3.919191658496857e-05, -3.798585385084152e-05, -3.677979111671448e-05, -3.557372838258743e-05, -3.436766564846039e-05, -3.3161602914333344e-05, -3.19555401802063e-05, -3.0749477446079254e-05, -2.954341471195221e-05, -2.8337351977825165e-05, -2.713128924369812e-05, -2.5925226509571075e-05, -2.471916377544403e-05, -2.3513101041316986e-05, -2.230703830718994e-05, -2.1100975573062897e-05, -1.9894912838935852e-05, -1.8688850104808807e-05, -1.7482787370681763e-05, -1.6276724636554718e-05, -1.5070661902427673e-05, -1.3864599168300629e-05, -1.2658536434173584e-05, -1.145247370004654e-05, -1.0246410965919495e-05, -9.04034823179245e-06, -7.834285497665405e-06, -6.628222763538361e-06, -5.422160029411316e-06, -4.216097295284271e-06, -3.0100345611572266e-06, -1.8039718270301819e-06, -5.979090929031372e-07, 6.081536412239075e-07, 1.8142163753509521e-06, 3.020279109477997e-06, 4.2263418436050415e-06, 5.432404577732086e-06, 6.638467311859131e-06, 7.844530045986176e-06, 9.05059278011322e-06, 1.0256655514240265e-05, 1.146271824836731e-05, 1.2668780982494354e-05, 1.3874843716621399e-05, 1.5080906450748444e-05, 1.6286969184875488e-05, 1.7493031919002533e-05, 1.8699094653129578e-05, 1.9905157387256622e-05, 2.1111220121383667e-05, 2.231728285551071e-05, 2.3523345589637756e-05, 2.47294083237648e-05, 2.5935471057891846e-05, 2.714153379201889e-05, 2.8347596526145935e-05, 2.955365926027298e-05, 3.0759721994400024e-05, 3.196578472852707e-05, 3.3171847462654114e-05, 3.437791019678116e-05, 3.55839729309082e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 10.0, 26.0, 21.0, 36.0, 64.0, 117.0, 186.0, 331.0, 637.0, 1458.0, 3354.0, 8530.0, 26682.0, 99744.0, 415857.0, 368876.0, 85794.0, 23246.0, 7900.0, 3007.0, 1291.0, 619.0, 302.0, 159.0, 105.0, 65.0, 40.0, 32.0, 19.0, 19.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.212646484375, -0.20704269409179688, -0.20143890380859375, -0.19583511352539062, -0.1902313232421875, -0.18462753295898438, -0.17902374267578125, -0.17341995239257812, -0.167816162109375, -0.16221237182617188, -0.15660858154296875, -0.15100479125976562, -0.1454010009765625, -0.13979721069335938, -0.13419342041015625, -0.12858963012695312, -0.12298583984375, -0.11738204956054688, -0.11177825927734375, -0.10617446899414062, -0.1005706787109375, -0.09496688842773438, -0.08936309814453125, -0.08375930786132812, -0.078155517578125, -0.07255172729492188, -0.06694793701171875, -0.061344146728515625, -0.0557403564453125, -0.050136566162109375, -0.04453277587890625, -0.038928985595703125, -0.0333251953125, -0.027721405029296875, -0.02211761474609375, -0.016513824462890625, -0.0109100341796875, -0.005306243896484375, 0.00029754638671875, 0.005901336669921875, 0.011505126953125, 0.017108917236328125, 0.02271270751953125, 0.028316497802734375, 0.0339202880859375, 0.039524078369140625, 0.04512786865234375, 0.050731658935546875, 0.05633544921875, 0.061939239501953125, 0.06754302978515625, 0.07314682006835938, 0.0787506103515625, 0.08435440063476562, 0.08995819091796875, 0.09556198120117188, 0.101165771484375, 0.10676956176757812, 0.11237335205078125, 0.11797714233398438, 0.1235809326171875, 0.12918472290039062, 0.13478851318359375, 0.14039230346679688, 0.14599609375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 10.0, 6.0, 10.0, 14.0, 11.0, 21.0, 22.0, 29.0, 29.0, 35.0, 49.0, 87.0, 72.0, 89.0, 89.0, 82.0, 76.0, 59.0, 49.0, 44.0, 19.0, 35.0, 14.0, 12.0, 12.0, 8.0, 7.0, 3.0, 1.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09735107421875, -0.0929880142211914, -0.08862495422363281, -0.08426189422607422, -0.07989883422851562, -0.07553577423095703, -0.07117271423339844, -0.06680965423583984, -0.06244659423828125, -0.058083534240722656, -0.05372047424316406, -0.04935741424560547, -0.044994354248046875, -0.04063129425048828, -0.03626823425292969, -0.031905174255371094, -0.0275421142578125, -0.023179054260253906, -0.018815994262695312, -0.014452934265136719, -0.010089874267578125, -0.005726814270019531, -0.0013637542724609375, 0.0029993057250976562, 0.00736236572265625, 0.011725425720214844, 0.016088485717773438, 0.02045154571533203, 0.024814605712890625, 0.02917766571044922, 0.03354072570800781, 0.037903785705566406, 0.042266845703125, 0.046629905700683594, 0.05099296569824219, 0.05535602569580078, 0.059719085693359375, 0.06408214569091797, 0.06844520568847656, 0.07280826568603516, 0.07717132568359375, 0.08153438568115234, 0.08589744567871094, 0.09026050567626953, 0.09462356567382812, 0.09898662567138672, 0.10334968566894531, 0.1077127456665039, 0.1120758056640625, 0.1164388656616211, 0.12080192565917969, 0.12516498565673828, 0.12952804565429688, 0.13389110565185547, 0.13825416564941406, 0.14261722564697266, 0.14698028564453125, 0.15134334564208984, 0.15570640563964844, 0.16006946563720703, 0.16443252563476562, 0.16879558563232422, 0.1731586456298828, 0.1775217056274414, 0.181884765625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 13.0, 13.0, 29.0, 45.0, 70.0, 145.0, 181.0, 192.0, 129.0, 67.0, 47.0, 33.0, 16.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7640862464904785, -3.6674387454986572, -3.570791244506836, -3.4741437435150146, -3.3774962425231934, -3.280848979949951, -3.18420147895813, -3.0875539779663086, -2.9909064769744873, -2.894258975982666, -2.7976114749908447, -2.7009639739990234, -2.6043167114257812, -2.50766921043396, -2.4110217094421387, -2.3143742084503174, -2.217726707458496, -2.121079206466675, -2.0244317054748535, -1.9277843236923218, -1.8311368227005005, -1.7344893217086792, -1.6378419399261475, -1.5411944389343262, -1.4445469379425049, -1.3478994369506836, -1.2512519359588623, -1.1546045541763306, -1.0579570531845093, -0.961309552192688, -0.8646621108055115, -0.768014669418335, -0.6713674068450928, -0.5747199058532715, -0.47807246446609497, -0.38142499327659607, -0.28477752208709717, -0.18813005089759827, -0.09148257970809937, 0.0051648616790771484, 0.10181236267089844, 0.19845983386039734, 0.29510730504989624, 0.39175477623939514, 0.48840224742889404, 0.5850497484207153, 0.6816971898078918, 0.7783446311950684, 0.8749921321868896, 0.9716396331787109, 1.0682871341705322, 1.164934515953064, 1.2615820169448853, 1.3582295179367065, 1.4548768997192383, 1.5515244007110596, 1.6481719017028809, 1.7448194026947021, 1.8414669036865234, 1.9381142854690552, 2.034761905670166, 2.131409168243408, 2.2280566692352295, 2.324704170227051, 2.421351671218872]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 6.0, 11.0, 13.0, 11.0, 25.0, 25.0, 14.0, 24.0, 31.0, 22.0, 25.0, 41.0, 44.0, 50.0, 48.0, 48.0, 36.0, 57.0, 43.0, 55.0, 43.0, 40.0, 33.0, 27.0, 24.0, 28.0, 29.0, 24.0, 25.0, 15.0, 10.0, 7.0, 7.0, 15.0, 3.0, 8.0, 5.0, 7.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.027660846710205, -1.9695684909820557, -1.9114760160446167, -1.8533836603164673, -1.7952911853790283, -1.737198829650879, -1.6791064739227295, -1.62101411819458, -1.5629216432571411, -1.5048292875289917, -1.4467368125915527, -1.3886444568634033, -1.330552101135254, -1.272459626197815, -1.2143672704696655, -1.1562747955322266, -1.0981824398040771, -1.0400900840759277, -0.9819976091384888, -0.9239052534103394, -0.8658128380775452, -0.807720422744751, -0.7496280670166016, -0.6915356516838074, -0.6334432363510132, -0.575350821018219, -0.5172584056854248, -0.4591660499572754, -0.4010736346244812, -0.342981219291687, -0.2848888337612152, -0.2267964482307434, -0.16870403289794922, -0.11061163246631622, -0.05251923203468323, 0.005573168396949768, 0.06366556882858276, 0.12175798416137695, 0.17985036969184875, 0.23794275522232056, 0.29603517055511475, 0.35412758588790894, 0.41221997141838074, 0.47031235694885254, 0.5284047722816467, 0.5864971876144409, 0.6445895433425903, 0.7026819586753845, 0.7607743740081787, 0.8188667893409729, 0.8769592046737671, 0.9350515604019165, 0.9931439757347107, 1.0512363910675049, 1.1093287467956543, 1.1674211025238037, 1.2255135774612427, 1.283605933189392, 1.341698408126831, 1.3997907638549805, 1.4578831195831299, 1.5159755945205688, 1.5740679502487183, 1.6321604251861572, 1.6902527809143066]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 5.0, 11.0, 11.0, 17.0, 25.0, 25.0, 33.0, 42.0, 60.0, 77.0, 135.0, 163.0, 319.0, 509.0, 972.0, 1974.0, 4596.0, 13548.0, 72031.0, 3840924.0, 222575.0, 23250.0, 6713.0, 2858.0, 1389.0, 766.0, 455.0, 257.0, 160.0, 99.0, 70.0, 56.0, 36.0, 35.0, 22.0, 14.0, 10.0, 8.0, 11.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.637451171875, -0.615234375, -0.593017578125, -0.57080078125, -0.548583984375, -0.5263671875, -0.504150390625, -0.48193359375, -0.459716796875, -0.4375, -0.415283203125, -0.39306640625, -0.370849609375, -0.3486328125, -0.326416015625, -0.30419921875, -0.281982421875, -0.259765625, -0.237548828125, -0.21533203125, -0.193115234375, -0.1708984375, -0.148681640625, -0.12646484375, -0.104248046875, -0.08203125, -0.059814453125, -0.03759765625, -0.015380859375, 0.0068359375, 0.029052734375, 0.05126953125, 0.073486328125, 0.095703125, 0.117919921875, 0.14013671875, 0.162353515625, 0.1845703125, 0.206787109375, 0.22900390625, 0.251220703125, 0.2734375, 0.295654296875, 0.31787109375, 0.340087890625, 0.3623046875, 0.384521484375, 0.40673828125, 0.428955078125, 0.451171875, 0.473388671875, 0.49560546875, 0.517822265625, 0.5400390625, 0.562255859375, 0.58447265625, 0.606689453125, 0.62890625, 0.651123046875, 0.67333984375, 0.695556640625, 0.7177734375, 0.739990234375, 0.76220703125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 11.0, 10.0, 12.0, 11.0, 25.0, 37.0, 37.0, 35.0, 46.0, 40.0, 55.0, 56.0, 71.0, 79.0, 67.0, 60.0, 55.0, 60.0, 35.0, 38.0, 33.0, 24.0, 13.0, 15.0, 15.0, 7.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.109619140625, -0.10620784759521484, -0.10279655456542969, -0.09938526153564453, -0.09597396850585938, -0.09256267547607422, -0.08915138244628906, -0.0857400894165039, -0.08232879638671875, -0.0789175033569336, -0.07550621032714844, -0.07209491729736328, -0.06868362426757812, -0.06527233123779297, -0.06186103820800781, -0.058449745178222656, -0.0550384521484375, -0.051627159118652344, -0.04821586608886719, -0.04480457305908203, -0.041393280029296875, -0.03798198699951172, -0.03457069396972656, -0.031159400939941406, -0.02774810791015625, -0.024336814880371094, -0.020925521850585938, -0.01751422882080078, -0.014102935791015625, -0.010691642761230469, -0.0072803497314453125, -0.0038690567016601562, -0.000457763671875, 0.0029535293579101562, 0.0063648223876953125, 0.009776115417480469, 0.013187408447265625, 0.01659870147705078, 0.020009994506835938, 0.023421287536621094, 0.02683258056640625, 0.030243873596191406, 0.03365516662597656, 0.03706645965576172, 0.040477752685546875, 0.04388904571533203, 0.04730033874511719, 0.050711631774902344, 0.0541229248046875, 0.057534217834472656, 0.06094551086425781, 0.06435680389404297, 0.06776809692382812, 0.07117938995361328, 0.07459068298339844, 0.0780019760131836, 0.08141326904296875, 0.0848245620727539, 0.08823585510253906, 0.09164714813232422, 0.09505844116210938, 0.09846973419189453, 0.10188102722167969, 0.10529232025146484, 0.10870361328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 5.0, 4.0, 11.0, 11.0, 18.0, 17.0, 28.0, 36.0, 52.0, 103.0, 193.0, 389.0, 826.0, 2163.0, 5660.0, 20722.0, 209245.0, 3827615.0, 104897.0, 14862.0, 4363.0, 1585.0, 707.0, 271.0, 144.0, 96.0, 61.0, 43.0, 32.0, 31.0, 15.0, 29.0, 9.0, 7.0, 4.0, 3.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.94580078125, -0.9211654663085938, -0.8965301513671875, -0.8718948364257812, -0.847259521484375, -0.8226242065429688, -0.7979888916015625, -0.7733535766601562, -0.74871826171875, -0.7240829467773438, -0.6994476318359375, -0.6748123168945312, -0.650177001953125, -0.6255416870117188, -0.6009063720703125, -0.5762710571289062, -0.5516357421875, -0.5270004272460938, -0.5023651123046875, -0.47772979736328125, -0.453094482421875, -0.42845916748046875, -0.4038238525390625, -0.37918853759765625, -0.35455322265625, -0.32991790771484375, -0.3052825927734375, -0.28064727783203125, -0.256011962890625, -0.23137664794921875, -0.2067413330078125, -0.18210601806640625, -0.157470703125, -0.13283538818359375, -0.1082000732421875, -0.08356475830078125, -0.058929443359375, -0.03429412841796875, -0.0096588134765625, 0.01497650146484375, 0.03961181640625, 0.06424713134765625, 0.0888824462890625, 0.11351776123046875, 0.138153076171875, 0.16278839111328125, 0.1874237060546875, 0.21205902099609375, 0.2366943359375, 0.26132965087890625, 0.2859649658203125, 0.31060028076171875, 0.335235595703125, 0.35987091064453125, 0.3845062255859375, 0.40914154052734375, 0.43377685546875, 0.45841217041015625, 0.4830474853515625, 0.5076828002929688, 0.532318115234375, 0.5569534301757812, 0.5815887451171875, 0.6062240600585938, 0.630859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 3.0, 3.0, 4.0, 5.0, 7.0, 13.0, 10.0, 24.0, 47.0, 75.0, 116.0, 342.0, 1464.0, 1361.0, 324.0, 103.0, 80.0, 25.0, 19.0, 13.0, 8.0, 10.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2076416015625, -0.19860267639160156, -0.18956375122070312, -0.1805248260498047, -0.17148590087890625, -0.1624469757080078, -0.15340805053710938, -0.14436912536621094, -0.1353302001953125, -0.12629127502441406, -0.11725234985351562, -0.10821342468261719, -0.09917449951171875, -0.09013557434082031, -0.08109664916992188, -0.07205772399902344, -0.063018798828125, -0.05397987365722656, -0.044940948486328125, -0.03590202331542969, -0.02686309814453125, -0.017824172973632812, -0.008785247802734375, 0.0002536773681640625, 0.0092926025390625, 0.018331527709960938, 0.027370452880859375, 0.03640937805175781, 0.04544830322265625, 0.05448722839355469, 0.06352615356445312, 0.07256507873535156, 0.08160400390625, 0.09064292907714844, 0.09968185424804688, 0.10872077941894531, 0.11775970458984375, 0.1267986297607422, 0.13583755493164062, 0.14487648010253906, 0.1539154052734375, 0.16295433044433594, 0.17199325561523438, 0.1810321807861328, 0.19007110595703125, 0.1991100311279297, 0.20814895629882812, 0.21718788146972656, 0.226226806640625, 0.23526573181152344, 0.24430465698242188, 0.2533435821533203, 0.26238250732421875, 0.2714214324951172, 0.2804603576660156, 0.28949928283691406, 0.2985382080078125, 0.30757713317871094, 0.3166160583496094, 0.3256549835205078, 0.33469390869140625, 0.3437328338623047, 0.3527717590332031, 0.36181068420410156, 0.370849609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 16.0, 21.0, 30.0, 96.0, 162.0, 229.0, 222.0, 115.0, 51.0, 24.0, 21.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8557887077331543, -2.7802300453186035, -2.7046713829040527, -2.629112482070923, -2.553553819656372, -2.4779951572418213, -2.4024364948272705, -2.3268775939941406, -2.25131893157959, -2.175760269165039, -2.1002016067504883, -2.0246427059173584, -1.9490840435028076, -1.8735253810882568, -1.797966718673706, -1.7224079370498657, -1.646849274635315, -1.5712906122207642, -1.4957318305969238, -1.420173168182373, -1.3446143865585327, -1.269055724143982, -1.1934969425201416, -1.1179382801055908, -1.04237961769104, -0.9668208956718445, -0.8912621736526489, -0.8157035112380981, -0.7401447296142578, -0.664586067199707, -0.5890273451805115, -0.5134686231613159, -0.4379098415374756, -0.36235111951828003, -0.2867923974990845, -0.2112337052822113, -0.13567498326301575, -0.06011626124382019, 0.015442430973052979, 0.09100115299224854, 0.1665598750114441, 0.24211859703063965, 0.3176773190498352, 0.3932360112667084, 0.46879473328590393, 0.5443534851074219, 0.6199121475219727, 0.6954708695411682, 0.7710295915603638, 0.8465883135795593, 0.9221470355987549, 0.9977056980133057, 1.073264479637146, 1.1488231420516968, 1.224381923675537, 1.299940586090088, 1.3754992485046387, 1.4510579109191895, 1.5266166925430298, 1.6021753549575806, 1.677734136581421, 1.7532927989959717, 1.8288514614105225, 1.9044102430343628, 1.9799690246582031]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 5.0, 6.0, 6.0, 7.0, 7.0, 16.0, 14.0, 23.0, 25.0, 28.0, 38.0, 32.0, 39.0, 34.0, 42.0, 41.0, 66.0, 54.0, 54.0, 54.0, 42.0, 49.0, 37.0, 30.0, 35.0, 34.0, 21.0, 35.0, 19.0, 23.0, 20.0, 16.0, 13.0, 5.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.727221667766571, -0.7038155198097229, -0.6804093718528748, -0.6570032835006714, -0.6335971355438232, -0.6101909875869751, -0.586784839630127, -0.5633786916732788, -0.5399725437164307, -0.5165663957595825, -0.49316027760505676, -0.4697541296482086, -0.4463479816913605, -0.4229418635368347, -0.3995357155799866, -0.3761295676231384, -0.35272344946861267, -0.3293173015117645, -0.30591118335723877, -0.2825050354003906, -0.2590988874435425, -0.23569275438785553, -0.21228662133216858, -0.18888047337532043, -0.16547434031963348, -0.14206820726394653, -0.11866205930709839, -0.09525592625141144, -0.07184978574514389, -0.04844364523887634, -0.025037512183189392, -0.0016313642263412476, 0.021774768829345703, 0.04518090933561325, 0.0685870498418808, 0.09199318289756775, 0.1153993234038353, 0.13880546391010284, 0.1622115969657898, 0.18561774492263794, 0.2090238779783249, 0.23243001103401184, 0.25583615899086, 0.27924227714538574, 0.3026484251022339, 0.32605457305908203, 0.3494607210159302, 0.3728668689727783, 0.3962729871273041, 0.4196791350841522, 0.443085253238678, 0.4664914011955261, 0.48989754915237427, 0.5133036971092224, 0.5367097854614258, 0.5601159334182739, 0.5835220813751221, 0.6069282293319702, 0.6303343772888184, 0.6537405252456665, 0.6771466135978699, 0.700552761554718, 0.7239589095115662, 0.7473650574684143, 0.7707712054252625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 4.0, 10.0, 14.0, 11.0, 25.0, 37.0, 53.0, 68.0, 129.0, 200.0, 388.0, 696.0, 1458.0, 3174.0, 8312.0, 26019.0, 126534.0, 613131.0, 211538.0, 38168.0, 10833.0, 4007.0, 1776.0, 861.0, 453.0, 255.0, 137.0, 78.0, 65.0, 31.0, 26.0, 18.0, 11.0, 13.0, 9.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48828125, -0.470611572265625, -0.45294189453125, -0.435272216796875, -0.4176025390625, -0.399932861328125, -0.38226318359375, -0.364593505859375, -0.346923828125, -0.329254150390625, -0.31158447265625, -0.293914794921875, -0.2762451171875, -0.258575439453125, -0.24090576171875, -0.223236083984375, -0.20556640625, -0.187896728515625, -0.17022705078125, -0.152557373046875, -0.1348876953125, -0.117218017578125, -0.09954833984375, -0.081878662109375, -0.064208984375, -0.046539306640625, -0.02886962890625, -0.011199951171875, 0.0064697265625, 0.024139404296875, 0.04180908203125, 0.059478759765625, 0.0771484375, 0.094818115234375, 0.11248779296875, 0.130157470703125, 0.1478271484375, 0.165496826171875, 0.18316650390625, 0.200836181640625, 0.218505859375, 0.236175537109375, 0.25384521484375, 0.271514892578125, 0.2891845703125, 0.306854248046875, 0.32452392578125, 0.342193603515625, 0.35986328125, 0.377532958984375, 0.39520263671875, 0.412872314453125, 0.4305419921875, 0.448211669921875, 0.46588134765625, 0.483551025390625, 0.501220703125, 0.518890380859375, 0.53656005859375, 0.554229736328125, 0.5718994140625, 0.589569091796875, 0.60723876953125, 0.624908447265625, 0.642578125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 16.0, 17.0, 23.0, 41.0, 43.0, 54.0, 73.0, 84.0, 105.0, 95.0, 80.0, 89.0, 83.0, 52.0, 45.0, 21.0, 17.0, 11.0, 10.0, 5.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19580078125, -0.1906719207763672, -0.18554306030273438, -0.18041419982910156, -0.17528533935546875, -0.17015647888183594, -0.16502761840820312, -0.1598987579345703, -0.1547698974609375, -0.1496410369873047, -0.14451217651367188, -0.13938331604003906, -0.13425445556640625, -0.12912559509277344, -0.12399673461914062, -0.11886787414550781, -0.113739013671875, -0.10861015319824219, -0.10348129272460938, -0.09835243225097656, -0.09322357177734375, -0.08809471130371094, -0.08296585083007812, -0.07783699035644531, -0.0727081298828125, -0.06757926940917969, -0.062450408935546875, -0.05732154846191406, -0.05219268798828125, -0.04706382751464844, -0.041934967041015625, -0.03680610656738281, -0.03167724609375, -0.026548385620117188, -0.021419525146484375, -0.016290664672851562, -0.01116180419921875, -0.0060329437255859375, -0.000904083251953125, 0.0042247772216796875, 0.0093536376953125, 0.014482498168945312, 0.019611358642578125, 0.024740219116210938, 0.02986907958984375, 0.03499794006347656, 0.040126800537109375, 0.04525566101074219, 0.050384521484375, 0.05551338195800781, 0.060642242431640625, 0.06577110290527344, 0.07089996337890625, 0.07602882385253906, 0.08115768432617188, 0.08628654479980469, 0.0914154052734375, 0.09654426574707031, 0.10167312622070312, 0.10680198669433594, 0.11193084716796875, 0.11705970764160156, 0.12218856811523438, 0.1273174285888672, 0.1324462890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 12.0, 10.0, 12.0, 23.0, 36.0, 48.0, 87.0, 197.0, 438.0, 975.0, 2916.0, 9492.0, 37452.0, 206576.0, 604296.0, 145703.0, 28732.0, 7510.0, 2369.0, 903.0, 340.0, 149.0, 106.0, 48.0, 33.0, 18.0, 8.0, 10.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.46630859375, -0.4519195556640625, -0.437530517578125, -0.4231414794921875, -0.40875244140625, -0.3943634033203125, -0.379974365234375, -0.3655853271484375, -0.3511962890625, -0.3368072509765625, -0.322418212890625, -0.3080291748046875, -0.29364013671875, -0.2792510986328125, -0.264862060546875, -0.2504730224609375, -0.236083984375, -0.2216949462890625, -0.207305908203125, -0.1929168701171875, -0.17852783203125, -0.1641387939453125, -0.149749755859375, -0.1353607177734375, -0.1209716796875, -0.1065826416015625, -0.092193603515625, -0.0778045654296875, -0.06341552734375, -0.0490264892578125, -0.034637451171875, -0.0202484130859375, -0.005859375, 0.0085296630859375, 0.022918701171875, 0.0373077392578125, 0.05169677734375, 0.0660858154296875, 0.080474853515625, 0.0948638916015625, 0.1092529296875, 0.1236419677734375, 0.138031005859375, 0.1524200439453125, 0.16680908203125, 0.1811981201171875, 0.195587158203125, 0.2099761962890625, 0.224365234375, 0.2387542724609375, 0.253143310546875, 0.2675323486328125, 0.28192138671875, 0.2963104248046875, 0.310699462890625, 0.3250885009765625, 0.3394775390625, 0.3538665771484375, 0.368255615234375, 0.3826446533203125, 0.39703369140625, 0.4114227294921875, 0.425811767578125, 0.4402008056640625, 0.45458984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 3.0, 2.0, 10.0, 8.0, 14.0, 13.0, 14.0, 24.0, 29.0, 31.0, 28.0, 37.0, 38.0, 51.0, 38.0, 42.0, 42.0, 51.0, 53.0, 48.0, 46.0, 44.0, 39.0, 44.0, 37.0, 31.0, 25.0, 32.0, 27.0, 17.0, 18.0, 13.0, 10.0, 10.0, 4.0, 5.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.2989158630371094, -0.28704071044921875, -0.2751655578613281, -0.2632904052734375, -0.2514152526855469, -0.23954010009765625, -0.22766494750976562, -0.215789794921875, -0.20391464233398438, -0.19203948974609375, -0.18016433715820312, -0.1682891845703125, -0.15641403198242188, -0.14453887939453125, -0.13266372680664062, -0.12078857421875, -0.10891342163085938, -0.09703826904296875, -0.08516311645507812, -0.0732879638671875, -0.061412811279296875, -0.04953765869140625, -0.037662506103515625, -0.025787353515625, -0.013912200927734375, -0.00203704833984375, 0.009838104248046875, 0.0217132568359375, 0.033588409423828125, 0.04546356201171875, 0.057338714599609375, 0.0692138671875, 0.08108901977539062, 0.09296417236328125, 0.10483932495117188, 0.1167144775390625, 0.12858963012695312, 0.14046478271484375, 0.15233993530273438, 0.164215087890625, 0.17609024047851562, 0.18796539306640625, 0.19984054565429688, 0.2117156982421875, 0.22359085083007812, 0.23546600341796875, 0.24734115600585938, 0.25921630859375, 0.2710914611816406, 0.28296661376953125, 0.2948417663574219, 0.3067169189453125, 0.3185920715332031, 0.33046722412109375, 0.3423423767089844, 0.354217529296875, 0.3660926818847656, 0.37796783447265625, 0.3898429870605469, 0.4017181396484375, 0.4135932922363281, 0.42546844482421875, 0.4373435974121094, 0.44921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 6.0, 2.0, 10.0, 6.0, 14.0, 16.0, 23.0, 37.0, 63.0, 82.0, 143.0, 239.0, 509.0, 1048.0, 2636.0, 8574.0, 34514.0, 173061.0, 616794.0, 164534.0, 33423.0, 8207.0, 2454.0, 1003.0, 458.0, 226.0, 165.0, 99.0, 63.0, 33.0, 28.0, 21.0, 5.0, 12.0, 8.0, 8.0, 6.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.14599609375, -0.1413593292236328, -0.13672256469726562, -0.13208580017089844, -0.12744903564453125, -0.12281227111816406, -0.11817550659179688, -0.11353874206542969, -0.1089019775390625, -0.10426521301269531, -0.09962844848632812, -0.09499168395996094, -0.09035491943359375, -0.08571815490722656, -0.08108139038085938, -0.07644462585449219, -0.071807861328125, -0.06717109680175781, -0.06253433227539062, -0.05789756774902344, -0.05326080322265625, -0.04862403869628906, -0.043987274169921875, -0.03935050964355469, -0.0347137451171875, -0.030076980590820312, -0.025440216064453125, -0.020803451538085938, -0.01616668701171875, -0.011529922485351562, -0.006893157958984375, -0.0022563934326171875, 0.00238037109375, 0.0070171356201171875, 0.011653900146484375, 0.016290664672851562, 0.02092742919921875, 0.025564193725585938, 0.030200958251953125, 0.03483772277832031, 0.0394744873046875, 0.04411125183105469, 0.048748016357421875, 0.05338478088378906, 0.05802154541015625, 0.06265830993652344, 0.06729507446289062, 0.07193183898925781, 0.076568603515625, 0.08120536804199219, 0.08584213256835938, 0.09047889709472656, 0.09511566162109375, 0.09975242614746094, 0.10438919067382812, 0.10902595520019531, 0.1136627197265625, 0.11829948425292969, 0.12293624877929688, 0.12757301330566406, 0.13220977783203125, 0.13684654235839844, 0.14148330688476562, 0.1461200714111328, 0.1507568359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 7.0, 9.0, 20.0, 20.0, 43.0, 63.0, 84.0, 137.0, 124.0, 138.0, 104.0, 85.0, 60.0, 34.0, 27.0, 13.0, 10.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0650367736816406e-05, -3.8525089621543884e-05, -3.639981150627136e-05, -3.427453339099884e-05, -3.214925527572632e-05, -3.0023977160453796e-05, -2.7898699045181274e-05, -2.5773420929908752e-05, -2.364814281463623e-05, -2.152286469936371e-05, -1.9397586584091187e-05, -1.7272308468818665e-05, -1.5147030353546143e-05, -1.302175223827362e-05, -1.0896474123001099e-05, -8.771196007728577e-06, -6.645917892456055e-06, -4.520639777183533e-06, -2.3953616619110107e-06, -2.7008354663848877e-07, 1.8551945686340332e-06, 3.980472683906555e-06, 6.105750799179077e-06, 8.231028914451599e-06, 1.0356307029724121e-05, 1.2481585144996643e-05, 1.4606863260269165e-05, 1.6732141375541687e-05, 1.885741949081421e-05, 2.098269760608673e-05, 2.3107975721359253e-05, 2.5233253836631775e-05, 2.7358531951904297e-05, 2.948381006717682e-05, 3.160908818244934e-05, 3.373436629772186e-05, 3.5859644412994385e-05, 3.798492252826691e-05, 4.011020064353943e-05, 4.223547875881195e-05, 4.436075687408447e-05, 4.6486034989356995e-05, 4.8611313104629517e-05, 5.073659121990204e-05, 5.286186933517456e-05, 5.498714745044708e-05, 5.7112425565719604e-05, 5.9237703680992126e-05, 6.136298179626465e-05, 6.348825991153717e-05, 6.561353802680969e-05, 6.773881614208221e-05, 6.986409425735474e-05, 7.198937237262726e-05, 7.411465048789978e-05, 7.62399286031723e-05, 7.836520671844482e-05, 8.049048483371735e-05, 8.261576294898987e-05, 8.474104106426239e-05, 8.686631917953491e-05, 8.899159729480743e-05, 9.111687541007996e-05, 9.324215352535248e-05, 9.5367431640625e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 10.0, 12.0, 20.0, 37.0, 57.0, 73.0, 102.0, 135.0, 219.0, 340.0, 572.0, 1279.0, 2994.0, 8658.0, 31208.0, 140131.0, 632530.0, 175981.0, 37543.0, 10025.0, 3489.0, 1339.0, 724.0, 380.0, 215.0, 159.0, 101.0, 43.0, 47.0, 34.0, 20.0, 17.0, 20.0, 7.0, 5.0, 0.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1883544921875, -0.18274307250976562, -0.17713165283203125, -0.17152023315429688, -0.1659088134765625, -0.16029739379882812, -0.15468597412109375, -0.14907455444335938, -0.143463134765625, -0.13785171508789062, -0.13224029541015625, -0.12662887573242188, -0.1210174560546875, -0.11540603637695312, -0.10979461669921875, -0.10418319702148438, -0.09857177734375, -0.09296035766601562, -0.08734893798828125, -0.08173751831054688, -0.0761260986328125, -0.07051467895507812, -0.06490325927734375, -0.059291839599609375, -0.053680419921875, -0.048069000244140625, -0.04245758056640625, -0.036846160888671875, -0.0312347412109375, -0.025623321533203125, -0.02001190185546875, -0.014400482177734375, -0.0087890625, -0.003177642822265625, 0.00243377685546875, 0.008045196533203125, 0.0136566162109375, 0.019268035888671875, 0.02487945556640625, 0.030490875244140625, 0.036102294921875, 0.041713714599609375, 0.04732513427734375, 0.052936553955078125, 0.0585479736328125, 0.06415939331054688, 0.06977081298828125, 0.07538223266601562, 0.08099365234375, 0.08660507202148438, 0.09221649169921875, 0.09782791137695312, 0.1034393310546875, 0.10905075073242188, 0.11466217041015625, 0.12027359008789062, 0.125885009765625, 0.13149642944335938, 0.13710784912109375, 0.14271926879882812, 0.1483306884765625, 0.15394210815429688, 0.15955352783203125, 0.16516494750976562, 0.1707763671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 6.0, 6.0, 14.0, 15.0, 32.0, 39.0, 60.0, 80.0, 119.0, 189.0, 135.0, 114.0, 64.0, 37.0, 32.0, 18.0, 18.0, 9.0, 1.0, 10.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.17591285705566406, -0.16957473754882812, -0.1632366180419922, -0.15689849853515625, -0.1505603790283203, -0.14422225952148438, -0.13788414001464844, -0.1315460205078125, -0.12520790100097656, -0.11886978149414062, -0.11253166198730469, -0.10619354248046875, -0.09985542297363281, -0.09351730346679688, -0.08717918395996094, -0.080841064453125, -0.07450294494628906, -0.06816482543945312, -0.06182670593261719, -0.05548858642578125, -0.04915046691894531, -0.042812347412109375, -0.03647422790527344, -0.0301361083984375, -0.023797988891601562, -0.017459869384765625, -0.011121749877929688, -0.00478363037109375, 0.0015544891357421875, 0.007892608642578125, 0.014230728149414062, 0.02056884765625, 0.026906967163085938, 0.033245086669921875, 0.03958320617675781, 0.04592132568359375, 0.05225944519042969, 0.058597564697265625, 0.06493568420410156, 0.0712738037109375, 0.07761192321777344, 0.08395004272460938, 0.09028816223144531, 0.09662628173828125, 0.10296440124511719, 0.10930252075195312, 0.11564064025878906, 0.121978759765625, 0.12831687927246094, 0.13465499877929688, 0.1409931182861328, 0.14733123779296875, 0.1536693572998047, 0.16000747680664062, 0.16634559631347656, 0.1726837158203125, 0.17902183532714844, 0.18535995483398438, 0.1916980743408203, 0.19803619384765625, 0.2043743133544922, 0.21071243286132812, 0.21705055236816406, 0.223388671875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 11.0, 11.0, 15.0, 39.0, 41.0, 70.0, 78.0, 96.0, 133.0, 141.0, 110.0, 75.0, 65.0, 40.0, 23.0, 13.0, 8.0, 7.0, 1.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5142521858215332, -1.4511297941207886, -1.388007402420044, -1.3248848915100098, -1.2617624998092651, -1.1986401081085205, -1.1355175971984863, -1.0723952054977417, -1.009272813796997, -0.9461504220962524, -0.883027970790863, -0.8199055194854736, -0.756783127784729, -0.6936607360839844, -0.630538284778595, -0.5674158334732056, -0.5042934417724609, -0.4411710202693939, -0.3780485987663269, -0.3149261772632599, -0.25180375576019287, -0.18868133425712585, -0.12555891275405884, -0.06243649125099182, 0.0006859302520751953, 0.06380835175514221, 0.12693077325820923, 0.19005319476127625, 0.25317561626434326, 0.3162980377674103, 0.3794204592704773, 0.4425428807735443, 0.5056650638580322, 0.5687874555587769, 0.6319099068641663, 0.6950323581695557, 0.7581547498703003, 0.8212771415710449, 0.8843995928764343, 0.9475220441818237, 1.0106444358825684, 1.073766827583313, 1.1368892192840576, 1.2000117301940918, 1.2631341218948364, 1.326256513595581, 1.3893790245056152, 1.4525014162063599, 1.5156238079071045, 1.5787461996078491, 1.6418685913085938, 1.704991102218628, 1.7681134939193726, 1.8312358856201172, 1.8943583965301514, 1.957480788230896, 2.0206031799316406, 2.083725690841675, 2.14684796333313, 2.209970474243164, 2.273092746734619, 2.3362152576446533, 2.3993377685546875, 2.4624600410461426, 2.5255825519561768]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 11.0, 11.0, 10.0, 4.0, 14.0, 19.0, 10.0, 28.0, 34.0, 22.0, 19.0, 31.0, 33.0, 48.0, 42.0, 48.0, 42.0, 53.0, 53.0, 56.0, 46.0, 43.0, 46.0, 31.0, 38.0, 35.0, 23.0, 22.0, 23.0, 17.0, 14.0, 16.0, 15.0, 9.0, 8.0, 10.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7291101217269897, -1.6733416318893433, -1.6175731420516968, -1.5618046522140503, -1.5060360431671143, -1.4502675533294678, -1.3944990634918213, -1.3387305736541748, -1.2829620838165283, -1.2271935939788818, -1.1714251041412354, -1.1156566143035889, -1.0598881244659424, -1.004119634628296, -0.9483510255813599, -0.8925825357437134, -0.8368140459060669, -0.7810455560684204, -0.7252770662307739, -0.6695085167884827, -0.6137400269508362, -0.5579715371131897, -0.5022029876708984, -0.44643449783325195, -0.39066600799560547, -0.334897518157959, -0.2791289985179901, -0.22336049377918243, -0.16759198904037476, -0.11182349920272827, -0.0560549795627594, -0.00028645992279052734, 0.05548214912414551, 0.11125065386295319, 0.16701915860176086, 0.22278766334056854, 0.2785561680793762, 0.3343246579170227, 0.3900931775569916, 0.44586169719696045, 0.5016301870346069, 0.5573986768722534, 0.6131671667098999, 0.6689357161521912, 0.7247042059898376, 0.7804726958274841, 0.8362412452697754, 0.8920097351074219, 0.9477782249450684, 1.0035467147827148, 1.0593152046203613, 1.1150836944580078, 1.1708521842956543, 1.2266206741333008, 1.2823892831802368, 1.3381577730178833, 1.3939262628555298, 1.4496947526931763, 1.5054632425308228, 1.5612317323684692, 1.6170003414154053, 1.6727688312530518, 1.7285373210906982, 1.7843058109283447, 1.8400743007659912]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 7.0, 20.0, 14.0, 24.0, 41.0, 52.0, 78.0, 128.0, 183.0, 396.0, 752.0, 1829.0, 6272.0, 46705.0, 4045622.0, 79703.0, 8117.0, 2262.0, 916.0, 474.0, 249.0, 143.0, 75.0, 52.0, 46.0, 35.0, 16.0, 20.0, 7.0, 11.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0009765625, -0.9711685180664062, -0.9413604736328125, -0.9115524291992188, -0.881744384765625, -0.8519363403320312, -0.8221282958984375, -0.7923202514648438, -0.76251220703125, -0.7327041625976562, -0.7028961181640625, -0.6730880737304688, -0.643280029296875, -0.6134719848632812, -0.5836639404296875, -0.5538558959960938, -0.5240478515625, -0.49423980712890625, -0.4644317626953125, -0.43462371826171875, -0.404815673828125, -0.37500762939453125, -0.3451995849609375, -0.31539154052734375, -0.28558349609375, -0.25577545166015625, -0.2259674072265625, -0.19615936279296875, -0.166351318359375, -0.13654327392578125, -0.1067352294921875, -0.07692718505859375, -0.047119140625, -0.01731109619140625, 0.0124969482421875, 0.04230499267578125, 0.072113037109375, 0.10192108154296875, 0.1317291259765625, 0.16153717041015625, 0.19134521484375, 0.22115325927734375, 0.2509613037109375, 0.28076934814453125, 0.310577392578125, 0.34038543701171875, 0.3701934814453125, 0.40000152587890625, 0.4298095703125, 0.45961761474609375, 0.4894256591796875, 0.5192337036132812, 0.549041748046875, 0.5788497924804688, 0.6086578369140625, 0.6384658813476562, 0.66827392578125, 0.6980819702148438, 0.7278900146484375, 0.7576980590820312, 0.787506103515625, 0.8173141479492188, 0.8471221923828125, 0.8769302368164062, 0.90673828125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 11.0, 8.0, 14.0, 19.0, 18.0, 32.0, 35.0, 38.0, 50.0, 36.0, 65.0, 63.0, 66.0, 68.0, 72.0, 52.0, 62.0, 65.0, 38.0, 31.0, 29.0, 33.0, 23.0, 14.0, 8.0, 7.0, 6.0, 8.0, 9.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1204833984375, -0.1166534423828125, -0.112823486328125, -0.1089935302734375, -0.10516357421875, -0.1013336181640625, -0.097503662109375, -0.0936737060546875, -0.08984375, -0.0860137939453125, -0.082183837890625, -0.0783538818359375, -0.07452392578125, -0.0706939697265625, -0.066864013671875, -0.0630340576171875, -0.0592041015625, -0.0553741455078125, -0.051544189453125, -0.0477142333984375, -0.04388427734375, -0.0400543212890625, -0.036224365234375, -0.0323944091796875, -0.028564453125, -0.0247344970703125, -0.020904541015625, -0.0170745849609375, -0.01324462890625, -0.0094146728515625, -0.005584716796875, -0.0017547607421875, 0.0020751953125, 0.0059051513671875, 0.009735107421875, 0.0135650634765625, 0.01739501953125, 0.0212249755859375, 0.025054931640625, 0.0288848876953125, 0.03271484375, 0.0365447998046875, 0.040374755859375, 0.0442047119140625, 0.04803466796875, 0.0518646240234375, 0.055694580078125, 0.0595245361328125, 0.0633544921875, 0.0671844482421875, 0.071014404296875, 0.0748443603515625, 0.07867431640625, 0.0825042724609375, 0.086334228515625, 0.0901641845703125, 0.093994140625, 0.0978240966796875, 0.101654052734375, 0.1054840087890625, 0.10931396484375, 0.1131439208984375, 0.116973876953125, 0.1208038330078125, 0.1246337890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 10.0, 5.0, 13.0, 16.0, 28.0, 38.0, 51.0, 79.0, 109.0, 172.0, 252.0, 417.0, 716.0, 1285.0, 2520.0, 6025.0, 18825.0, 104458.0, 3676172.0, 333582.0, 33003.0, 9112.0, 3552.0, 1571.0, 842.0, 487.0, 321.0, 182.0, 132.0, 90.0, 49.0, 40.0, 36.0, 18.0, 16.0, 16.0, 16.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5754928588867188, -0.5567474365234375, -0.5380020141601562, -0.519256591796875, -0.5005111694335938, -0.4817657470703125, -0.46302032470703125, -0.44427490234375, -0.42552947998046875, -0.4067840576171875, -0.38803863525390625, -0.369293212890625, -0.35054779052734375, -0.3318023681640625, -0.31305694580078125, -0.2943115234375, -0.27556610107421875, -0.2568206787109375, -0.23807525634765625, -0.219329833984375, -0.20058441162109375, -0.1818389892578125, -0.16309356689453125, -0.14434814453125, -0.12560272216796875, -0.1068572998046875, -0.08811187744140625, -0.069366455078125, -0.05062103271484375, -0.0318756103515625, -0.01313018798828125, 0.005615234375, 0.02436065673828125, 0.0431060791015625, 0.06185150146484375, 0.080596923828125, 0.09934234619140625, 0.1180877685546875, 0.13683319091796875, 0.15557861328125, 0.17432403564453125, 0.1930694580078125, 0.21181488037109375, 0.230560302734375, 0.24930572509765625, 0.2680511474609375, 0.28679656982421875, 0.3055419921875, 0.32428741455078125, 0.3430328369140625, 0.36177825927734375, 0.380523681640625, 0.39926910400390625, 0.4180145263671875, 0.43675994873046875, 0.45550537109375, 0.47425079345703125, 0.4929962158203125, 0.5117416381835938, 0.530487060546875, 0.5492324829101562, 0.5679779052734375, 0.5867233276367188, 0.60546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 0.0, 6.0, 3.0, 3.0, 8.0, 6.0, 10.0, 13.0, 16.0, 25.0, 29.0, 56.0, 76.0, 145.0, 274.0, 957.0, 1674.0, 356.0, 148.0, 78.0, 62.0, 35.0, 25.0, 14.0, 9.0, 8.0, 13.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1939697265625, -0.188446044921875, -0.18292236328125, -0.177398681640625, -0.171875, -0.166351318359375, -0.16082763671875, -0.155303955078125, -0.1497802734375, -0.144256591796875, -0.13873291015625, -0.133209228515625, -0.127685546875, -0.122161865234375, -0.11663818359375, -0.111114501953125, -0.1055908203125, -0.100067138671875, -0.09454345703125, -0.089019775390625, -0.08349609375, -0.077972412109375, -0.07244873046875, -0.066925048828125, -0.0614013671875, -0.055877685546875, -0.05035400390625, -0.044830322265625, -0.039306640625, -0.033782958984375, -0.02825927734375, -0.022735595703125, -0.0172119140625, -0.011688232421875, -0.00616455078125, -0.000640869140625, 0.0048828125, 0.010406494140625, 0.01593017578125, 0.021453857421875, 0.0269775390625, 0.032501220703125, 0.03802490234375, 0.043548583984375, 0.049072265625, 0.054595947265625, 0.06011962890625, 0.065643310546875, 0.0711669921875, 0.076690673828125, 0.08221435546875, 0.087738037109375, 0.09326171875, 0.098785400390625, 0.10430908203125, 0.109832763671875, 0.1153564453125, 0.120880126953125, 0.12640380859375, 0.131927490234375, 0.137451171875, 0.142974853515625, 0.14849853515625, 0.154022216796875, 0.1595458984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 7.0, 10.0, 13.0, 45.0, 65.0, 126.0, 190.0, 220.0, 159.0, 81.0, 32.0, 28.0, 14.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.652754545211792, -1.594377040863037, -1.5359995365142822, -1.4776220321655273, -1.4192445278167725, -1.3608670234680176, -1.3024895191192627, -1.2441120147705078, -1.185734510421753, -1.127357006072998, -1.0689795017242432, -1.0106019973754883, -0.9522244930267334, -0.8938469886779785, -0.8354694247245789, -0.777091920375824, -0.7187143564224243, -0.6603368520736694, -0.6019593477249146, -0.5435818433761597, -0.4852043092250824, -0.4268268048763275, -0.36844927072525024, -0.31007176637649536, -0.2516942620277405, -0.1933167576789856, -0.13493923842906952, -0.07656171917915344, -0.01818421483039856, 0.04019328951835632, 0.0985708236694336, 0.15694832801818848, 0.21532583236694336, 0.27370333671569824, 0.3320808410644531, 0.3904583752155304, 0.4488358795642853, 0.5072133541107178, 0.5655909180641174, 0.6239684224128723, 0.6823459267616272, 0.7407234311103821, 0.799100935459137, 0.8574784994125366, 0.9158560037612915, 0.9742335081100464, 1.0326110124588013, 1.0909885168075562, 1.149366021156311, 1.207743525505066, 1.2661210298538208, 1.3244985342025757, 1.3828760385513306, 1.4412535429000854, 1.4996311664581299, 1.5580086708068848, 1.6163861751556396, 1.6747636795043945, 1.7331411838531494, 1.7915186882019043, 1.8498961925506592, 1.908273696899414, 1.966651201248169, 2.025028705596924, 2.0834062099456787]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 9.0, 11.0, 19.0, 17.0, 16.0, 19.0, 16.0, 27.0, 25.0, 28.0, 15.0, 34.0, 39.0, 43.0, 46.0, 51.0, 49.0, 39.0, 53.0, 50.0, 55.0, 39.0, 40.0, 26.0, 31.0, 32.0, 31.0, 26.0, 17.0, 17.0, 15.0, 10.0, 12.0, 7.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.5788618922233582, -0.5618173480033875, -0.5447728633880615, -0.5277283191680908, -0.5106838345527649, -0.4936392903327942, -0.4765947759151459, -0.45955026149749756, -0.44250571727752686, -0.42546120285987854, -0.4084166884422302, -0.3913721442222595, -0.3743276298046112, -0.3572831153869629, -0.3402386009693146, -0.32319408655166626, -0.30614957213401794, -0.28910505771636963, -0.2720605432987213, -0.255016028881073, -0.2379714846611023, -0.22092697024345398, -0.20388245582580566, -0.18683794140815735, -0.16979341208934784, -0.15274889767169952, -0.13570436835289001, -0.1186598539352417, -0.10161533206701279, -0.08457081019878387, -0.06752629578113556, -0.05048177391290665, -0.033437252044677734, -0.01639273203909397, 0.0006517879664897919, 0.017696306109428406, 0.03474082797765732, 0.05178534984588623, 0.06882986426353455, 0.08587438613176346, 0.10291890799999237, 0.11996342986822128, 0.1370079517364502, 0.1540524661540985, 0.17109698057174683, 0.18814150989055634, 0.20518602430820465, 0.22223055362701416, 0.23927506804466248, 0.2563195824623108, 0.2733640968799591, 0.2904086112976074, 0.3074531555175781, 0.32449766993522644, 0.34154218435287476, 0.35858669877052307, 0.3756312131881714, 0.3926757276058197, 0.409720242023468, 0.4267647862434387, 0.44380930066108704, 0.46085381507873535, 0.47789832949638367, 0.494942843914032, 0.5119873881340027]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 3.0, 12.0, 11.0, 17.0, 24.0, 43.0, 69.0, 101.0, 177.0, 315.0, 479.0, 945.0, 1829.0, 3780.0, 9673.0, 27421.0, 102431.0, 457029.0, 337111.0, 71805.0, 20976.0, 7569.0, 3201.0, 1530.0, 860.0, 401.0, 287.0, 178.0, 109.0, 61.0, 40.0, 23.0, 9.0, 11.0, 3.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50732421875, -0.4927787780761719, -0.47823333740234375, -0.4636878967285156, -0.4491424560546875, -0.4345970153808594, -0.42005157470703125, -0.4055061340332031, -0.390960693359375, -0.3764152526855469, -0.36186981201171875, -0.3473243713378906, -0.3327789306640625, -0.3182334899902344, -0.30368804931640625, -0.2891426086425781, -0.27459716796875, -0.2600517272949219, -0.24550628662109375, -0.23096084594726562, -0.2164154052734375, -0.20186996459960938, -0.18732452392578125, -0.17277908325195312, -0.158233642578125, -0.14368820190429688, -0.12914276123046875, -0.11459732055664062, -0.1000518798828125, -0.08550643920898438, -0.07096099853515625, -0.056415557861328125, -0.0418701171875, -0.027324676513671875, -0.01277923583984375, 0.001766204833984375, 0.0163116455078125, 0.030857086181640625, 0.04540252685546875, 0.059947967529296875, 0.074493408203125, 0.08903884887695312, 0.10358428955078125, 0.11812973022460938, 0.1326751708984375, 0.14722061157226562, 0.16176605224609375, 0.17631149291992188, 0.19085693359375, 0.20540237426757812, 0.21994781494140625, 0.23449325561523438, 0.2490386962890625, 0.2635841369628906, 0.27812957763671875, 0.2926750183105469, 0.307220458984375, 0.3217658996582031, 0.33631134033203125, 0.3508567810058594, 0.3654022216796875, 0.3799476623535156, 0.39449310302734375, 0.4090385437011719, 0.423583984375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 6.0, 8.0, 7.0, 14.0, 14.0, 25.0, 30.0, 35.0, 45.0, 57.0, 63.0, 62.0, 65.0, 71.0, 67.0, 65.0, 57.0, 60.0, 42.0, 53.0, 35.0, 18.0, 22.0, 20.0, 13.0, 8.0, 10.0, 5.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13916015625, -0.13504600524902344, -0.13093185424804688, -0.1268177032470703, -0.12270355224609375, -0.11858940124511719, -0.11447525024414062, -0.11036109924316406, -0.1062469482421875, -0.10213279724121094, -0.09801864624023438, -0.09390449523925781, -0.08979034423828125, -0.08567619323730469, -0.08156204223632812, -0.07744789123535156, -0.073333740234375, -0.06921958923339844, -0.06510543823242188, -0.06099128723144531, -0.05687713623046875, -0.05276298522949219, -0.048648834228515625, -0.04453468322753906, -0.0404205322265625, -0.03630638122558594, -0.032192230224609375, -0.028078079223632812, -0.02396392822265625, -0.019849777221679688, -0.015735626220703125, -0.011621475219726562, -0.00750732421875, -0.0033931732177734375, 0.000720977783203125, 0.0048351287841796875, 0.00894927978515625, 0.013063430786132812, 0.017177581787109375, 0.021291732788085938, 0.0254058837890625, 0.029520034790039062, 0.033634185791015625, 0.03774833679199219, 0.04186248779296875, 0.04597663879394531, 0.050090789794921875, 0.05420494079589844, 0.058319091796875, 0.06243324279785156, 0.06654739379882812, 0.07066154479980469, 0.07477569580078125, 0.07888984680175781, 0.08300399780273438, 0.08711814880371094, 0.0912322998046875, 0.09534645080566406, 0.09946060180664062, 0.10357475280761719, 0.10768890380859375, 0.11180305480957031, 0.11591720581054688, 0.12003135681152344, 0.1241455078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 6.0, 7.0, 19.0, 25.0, 37.0, 41.0, 95.0, 166.0, 295.0, 522.0, 1182.0, 2507.0, 6101.0, 15486.0, 46033.0, 166370.0, 498534.0, 220922.0, 58285.0, 19098.0, 7079.0, 3008.0, 1309.0, 654.0, 297.0, 192.0, 100.0, 68.0, 28.0, 30.0, 18.0, 15.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38232421875, -0.3709449768066406, -0.35956573486328125, -0.3481864929199219, -0.3368072509765625, -0.3254280090332031, -0.31404876708984375, -0.3026695251464844, -0.291290283203125, -0.2799110412597656, -0.26853179931640625, -0.2571525573730469, -0.2457733154296875, -0.23439407348632812, -0.22301483154296875, -0.21163558959960938, -0.20025634765625, -0.18887710571289062, -0.17749786376953125, -0.16611862182617188, -0.1547393798828125, -0.14336013793945312, -0.13198089599609375, -0.12060165405273438, -0.109222412109375, -0.09784317016601562, -0.08646392822265625, -0.07508468627929688, -0.0637054443359375, -0.052326202392578125, -0.04094696044921875, -0.029567718505859375, -0.0181884765625, -0.006809234619140625, 0.00457000732421875, 0.015949249267578125, 0.0273284912109375, 0.038707733154296875, 0.05008697509765625, 0.061466217041015625, 0.072845458984375, 0.08422470092773438, 0.09560394287109375, 0.10698318481445312, 0.1183624267578125, 0.12974166870117188, 0.14112091064453125, 0.15250015258789062, 0.16387939453125, 0.17525863647460938, 0.18663787841796875, 0.19801712036132812, 0.2093963623046875, 0.22077560424804688, 0.23215484619140625, 0.24353408813476562, 0.254913330078125, 0.2662925720214844, 0.27767181396484375, 0.2890510559082031, 0.3004302978515625, 0.3118095397949219, 0.32318878173828125, 0.3345680236816406, 0.345947265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 9.0, 10.0, 10.0, 16.0, 13.0, 21.0, 21.0, 24.0, 23.0, 39.0, 36.0, 36.0, 29.0, 43.0, 59.0, 47.0, 55.0, 54.0, 46.0, 50.0, 44.0, 49.0, 39.0, 29.0, 33.0, 28.0, 20.0, 25.0, 14.0, 15.0, 11.0, 7.0, 10.0, 9.0, 2.0, 4.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369873046875, -0.3569450378417969, -0.34401702880859375, -0.3310890197753906, -0.3181610107421875, -0.3052330017089844, -0.29230499267578125, -0.2793769836425781, -0.266448974609375, -0.2535209655761719, -0.24059295654296875, -0.22766494750976562, -0.2147369384765625, -0.20180892944335938, -0.18888092041015625, -0.17595291137695312, -0.16302490234375, -0.15009689331054688, -0.13716888427734375, -0.12424087524414062, -0.1113128662109375, -0.09838485717773438, -0.08545684814453125, -0.07252883911132812, -0.059600830078125, -0.046672821044921875, -0.03374481201171875, -0.020816802978515625, -0.0078887939453125, 0.005039215087890625, 0.01796722412109375, 0.030895233154296875, 0.0438232421875, 0.056751251220703125, 0.06967926025390625, 0.08260726928710938, 0.0955352783203125, 0.10846328735351562, 0.12139129638671875, 0.13431930541992188, 0.147247314453125, 0.16017532348632812, 0.17310333251953125, 0.18603134155273438, 0.1989593505859375, 0.21188735961914062, 0.22481536865234375, 0.23774337768554688, 0.25067138671875, 0.2635993957519531, 0.27652740478515625, 0.2894554138183594, 0.3023834228515625, 0.3153114318847656, 0.32823944091796875, 0.3411674499511719, 0.354095458984375, 0.3670234680175781, 0.37995147705078125, 0.3928794860839844, 0.4058074951171875, 0.4187355041503906, 0.43166351318359375, 0.4445915222167969, 0.45751953125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 9.0, 8.0, 14.0, 16.0, 32.0, 40.0, 62.0, 102.0, 165.0, 300.0, 501.0, 826.0, 1417.0, 2715.0, 5877.0, 30129.0, 720317.0, 261841.0, 14750.0, 4324.0, 2120.0, 1160.0, 683.0, 417.0, 246.0, 170.0, 103.0, 72.0, 45.0, 34.0, 14.0, 14.0, 9.0, 10.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273681640625, -0.2658252716064453, -0.2579689025878906, -0.25011253356933594, -0.24225616455078125, -0.23439979553222656, -0.22654342651367188, -0.2186870574951172, -0.2108306884765625, -0.2029743194580078, -0.19511795043945312, -0.18726158142089844, -0.17940521240234375, -0.17154884338378906, -0.16369247436523438, -0.1558361053466797, -0.147979736328125, -0.1401233673095703, -0.13226699829101562, -0.12441062927246094, -0.11655426025390625, -0.10869789123535156, -0.10084152221679688, -0.09298515319824219, -0.0851287841796875, -0.07727241516113281, -0.06941604614257812, -0.06155967712402344, -0.05370330810546875, -0.04584693908691406, -0.037990570068359375, -0.030134201049804688, -0.02227783203125, -0.014421463012695312, -0.006565093994140625, 0.0012912750244140625, 0.00914764404296875, 0.017004013061523438, 0.024860382080078125, 0.03271675109863281, 0.0405731201171875, 0.04842948913574219, 0.056285858154296875, 0.06414222717285156, 0.07199859619140625, 0.07985496520996094, 0.08771133422851562, 0.09556770324707031, 0.103424072265625, 0.11128044128417969, 0.11913681030273438, 0.12699317932128906, 0.13484954833984375, 0.14270591735839844, 0.15056228637695312, 0.1584186553955078, 0.1662750244140625, 0.1741313934326172, 0.18198776245117188, 0.18984413146972656, 0.19770050048828125, 0.20555686950683594, 0.21341323852539062, 0.2212696075439453, 0.2291259765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 11.0, 9.0, 9.0, 24.0, 29.0, 48.0, 67.0, 92.0, 122.0, 118.0, 124.0, 94.0, 76.0, 52.0, 48.0, 30.0, 10.0, 12.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.909536361694336e-05, -7.709860801696777e-05, -7.510185241699219e-05, -7.31050968170166e-05, -7.110834121704102e-05, -6.911158561706543e-05, -6.711483001708984e-05, -6.511807441711426e-05, -6.312131881713867e-05, -6.112456321716309e-05, -5.91278076171875e-05, -5.7131052017211914e-05, -5.513429641723633e-05, -5.313754081726074e-05, -5.1140785217285156e-05, -4.914402961730957e-05, -4.7147274017333984e-05, -4.51505184173584e-05, -4.315376281738281e-05, -4.1157007217407227e-05, -3.916025161743164e-05, -3.7163496017456055e-05, -3.516674041748047e-05, -3.316998481750488e-05, -3.11732292175293e-05, -2.917647361755371e-05, -2.7179718017578125e-05, -2.518296241760254e-05, -2.3186206817626953e-05, -2.1189451217651367e-05, -1.919269561767578e-05, -1.7195940017700195e-05, -1.519918441772461e-05, -1.3202428817749023e-05, -1.1205673217773438e-05, -9.208917617797852e-06, -7.212162017822266e-06, -5.21540641784668e-06, -3.2186508178710938e-06, -1.2218952178955078e-06, 7.748603820800781e-07, 2.771615982055664e-06, 4.76837158203125e-06, 6.765127182006836e-06, 8.761882781982422e-06, 1.0758638381958008e-05, 1.2755393981933594e-05, 1.475214958190918e-05, 1.6748905181884766e-05, 1.874566078186035e-05, 2.0742416381835938e-05, 2.2739171981811523e-05, 2.473592758178711e-05, 2.6732683181762695e-05, 2.872943878173828e-05, 3.072619438171387e-05, 3.272294998168945e-05, 3.471970558166504e-05, 3.6716461181640625e-05, 3.871321678161621e-05, 4.07099723815918e-05, 4.270672798156738e-05, 4.470348358154297e-05, 4.6700239181518555e-05, 4.869699478149414e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 5.0, 13.0, 15.0, 18.0, 22.0, 34.0, 44.0, 70.0, 77.0, 130.0, 173.0, 244.0, 369.0, 520.0, 718.0, 1022.0, 1752.0, 2696.0, 5197.0, 14453.0, 93854.0, 790546.0, 107408.0, 15696.0, 5353.0, 2799.0, 1740.0, 1117.0, 710.0, 538.0, 348.0, 241.0, 172.0, 115.0, 96.0, 58.0, 44.0, 35.0, 37.0, 17.0, 14.0, 10.0, 12.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.2352294921875, -0.2277679443359375, -0.220306396484375, -0.2128448486328125, -0.20538330078125, -0.1979217529296875, -0.190460205078125, -0.1829986572265625, -0.175537109375, -0.1680755615234375, -0.160614013671875, -0.1531524658203125, -0.14569091796875, -0.1382293701171875, -0.130767822265625, -0.1233062744140625, -0.1158447265625, -0.1083831787109375, -0.100921630859375, -0.0934600830078125, -0.08599853515625, -0.0785369873046875, -0.071075439453125, -0.0636138916015625, -0.05615234375, -0.0486907958984375, -0.041229248046875, -0.0337677001953125, -0.02630615234375, -0.0188446044921875, -0.011383056640625, -0.0039215087890625, 0.0035400390625, 0.0110015869140625, 0.018463134765625, 0.0259246826171875, 0.03338623046875, 0.0408477783203125, 0.048309326171875, 0.0557708740234375, 0.063232421875, 0.0706939697265625, 0.078155517578125, 0.0856170654296875, 0.09307861328125, 0.1005401611328125, 0.108001708984375, 0.1154632568359375, 0.1229248046875, 0.1303863525390625, 0.137847900390625, 0.1453094482421875, 0.15277099609375, 0.1602325439453125, 0.167694091796875, 0.1751556396484375, 0.1826171875, 0.1900787353515625, 0.197540283203125, 0.2050018310546875, 0.21246337890625, 0.2199249267578125, 0.227386474609375, 0.2348480224609375, 0.2423095703125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 10.0, 13.0, 20.0, 45.0, 94.0, 230.0, 277.0, 142.0, 66.0, 39.0, 21.0, 10.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2841796875, -0.2753334045410156, -0.26648712158203125, -0.2576408386230469, -0.2487945556640625, -0.23994827270507812, -0.23110198974609375, -0.22225570678710938, -0.213409423828125, -0.20456314086914062, -0.19571685791015625, -0.18687057495117188, -0.1780242919921875, -0.16917800903320312, -0.16033172607421875, -0.15148544311523438, -0.14263916015625, -0.13379287719726562, -0.12494659423828125, -0.11610031127929688, -0.1072540283203125, -0.09840774536132812, -0.08956146240234375, -0.08071517944335938, -0.071868896484375, -0.06302261352539062, -0.05417633056640625, -0.045330047607421875, -0.0364837646484375, -0.027637481689453125, -0.01879119873046875, -0.009944915771484375, -0.0010986328125, 0.007747650146484375, 0.01659393310546875, 0.025440216064453125, 0.0342864990234375, 0.043132781982421875, 0.05197906494140625, 0.060825347900390625, 0.069671630859375, 0.07851791381835938, 0.08736419677734375, 0.09621047973632812, 0.1050567626953125, 0.11390304565429688, 0.12274932861328125, 0.13159561157226562, 0.14044189453125, 0.14928817749023438, 0.15813446044921875, 0.16698074340820312, 0.1758270263671875, 0.18467330932617188, 0.19351959228515625, 0.20236587524414062, 0.211212158203125, 0.22005844116210938, 0.22890472412109375, 0.23775100708007812, 0.2465972900390625, 0.2554435729980469, 0.26428985595703125, 0.2731361389160156, 0.281982421875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 5.0, 16.0, 35.0, 55.0, 102.0, 180.0, 212.0, 171.0, 96.0, 65.0, 29.0, 15.0, 9.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.796614170074463, -5.679638862609863, -5.5626630783081055, -5.445687770843506, -5.328712463378906, -5.211736679077148, -5.094761371612549, -4.977786064147949, -4.860810279846191, -4.743834972381592, -4.626859188079834, -4.509883880615234, -4.392908573150635, -4.275933265686035, -4.158957481384277, -4.041982173919678, -3.925006866455078, -3.8080313205718994, -3.6910560131073, -3.574080467224121, -3.4571051597595215, -3.3401296138763428, -3.223154067993164, -3.1061787605285645, -2.9892032146453857, -2.872227668762207, -2.7552523612976074, -2.6382768154144287, -2.52130126953125, -2.4043259620666504, -2.2873504161834717, -2.170374870300293, -2.0533998012542725, -1.9364243745803833, -1.8194489479064941, -1.7024734020233154, -1.5854979753494263, -1.468522548675537, -1.3515470027923584, -1.2345715761184692, -1.11759614944458, -1.000620722770691, -0.883645236492157, -0.766669750213623, -0.6496943235397339, -0.5327188968658447, -0.4157434105873108, -0.29876792430877686, -0.1817924976348877, -0.06481704115867615, 0.0521584153175354, 0.16913387179374695, 0.2861093282699585, 0.40308475494384766, 0.5200602412223816, 0.6370357275009155, 0.7540111541748047, 0.8709865808486938, 0.9879620671272278, 1.1049375534057617, 1.2219129800796509, 1.33888840675354, 1.4558639526367188, 1.572839379310608, 1.689814805984497]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 6.0, 8.0, 14.0, 12.0, 12.0, 12.0, 14.0, 16.0, 15.0, 21.0, 24.0, 34.0, 28.0, 34.0, 38.0, 33.0, 37.0, 30.0, 44.0, 35.0, 39.0, 44.0, 33.0, 42.0, 28.0, 36.0, 31.0, 26.0, 24.0, 28.0, 27.0, 19.0, 24.0, 18.0, 15.0, 13.0, 11.0, 13.0, 8.0, 10.0, 11.0, 7.0, 2.0, 3.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 5.0, 1.0], "bins": [-1.6204147338867188, -1.571146011352539, -1.5218771696090698, -1.4726084470748901, -1.423339605331421, -1.3740708827972412, -1.3248021602630615, -1.2755334377288818, -1.2262645959854126, -1.176995873451233, -1.1277270317077637, -1.078458309173584, -1.0291895866394043, -0.9799207448959351, -0.9306520223617554, -0.8813832402229309, -0.8321144580841064, -0.782845675945282, -0.7335768938064575, -0.6843081712722778, -0.6350393891334534, -0.5857706069946289, -0.5365018844604492, -0.48723310232162476, -0.4379643201828003, -0.38869553804397583, -0.33942678570747375, -0.2901580333709717, -0.24088925123214722, -0.19162048399448395, -0.14235171675682068, -0.0930829644203186, -0.04381430149078369, 0.005454465746879578, 0.05472323298454285, 0.10399200022220612, 0.15326076745986938, 0.20252953469753265, 0.2517983019351959, 0.301067054271698, 0.35033583641052246, 0.3996046185493469, 0.448873370885849, 0.4981421232223511, 0.5474109053611755, 0.5966796875, 0.6459484100341797, 0.6952171921730042, 0.7444859743118286, 0.7937547564506531, 0.8430235385894775, 0.8922922611236572, 0.9415610432624817, 0.9908298254013062, 1.0400985479354858, 1.089367389678955, 1.1386361122131348, 1.1879048347473145, 1.2371736764907837, 1.2864423990249634, 1.3357112407684326, 1.3849799633026123, 1.434248685836792, 1.4835174083709717, 1.532786250114441]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 15.0, 11.0, 14.0, 22.0, 28.0, 63.0, 68.0, 124.0, 153.0, 254.0, 396.0, 680.0, 1316.0, 3224.0, 12232.0, 121176.0, 4001787.0, 40299.0, 7198.0, 2447.0, 1027.0, 602.0, 332.0, 252.0, 163.0, 110.0, 74.0, 54.0, 40.0, 25.0, 17.0, 11.0, 10.0, 5.0, 7.0, 8.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.158203125, -1.1212158203125, -1.084228515625, -1.0472412109375, -1.01025390625, -0.9732666015625, -0.936279296875, -0.8992919921875, -0.8623046875, -0.8253173828125, -0.788330078125, -0.7513427734375, -0.71435546875, -0.6773681640625, -0.640380859375, -0.6033935546875, -0.56640625, -0.5294189453125, -0.492431640625, -0.4554443359375, -0.41845703125, -0.3814697265625, -0.344482421875, -0.3074951171875, -0.2705078125, -0.2335205078125, -0.196533203125, -0.1595458984375, -0.12255859375, -0.0855712890625, -0.048583984375, -0.0115966796875, 0.025390625, 0.0623779296875, 0.099365234375, 0.1363525390625, 0.17333984375, 0.2103271484375, 0.247314453125, 0.2843017578125, 0.3212890625, 0.3582763671875, 0.395263671875, 0.4322509765625, 0.46923828125, 0.5062255859375, 0.543212890625, 0.5802001953125, 0.6171875, 0.6541748046875, 0.691162109375, 0.7281494140625, 0.76513671875, 0.8021240234375, 0.839111328125, 0.8760986328125, 0.9130859375, 0.9500732421875, 0.987060546875, 1.0240478515625, 1.06103515625, 1.0980224609375, 1.135009765625, 1.1719970703125, 1.208984375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 13.0, 14.0, 20.0, 24.0, 34.0, 44.0, 47.0, 41.0, 41.0, 66.0, 62.0, 59.0, 69.0, 56.0, 62.0, 65.0, 55.0, 37.0, 31.0, 27.0, 24.0, 19.0, 11.0, 10.0, 12.0, 14.0, 8.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.12646484375, -0.122528076171875, -0.11859130859375, -0.114654541015625, -0.1107177734375, -0.106781005859375, -0.10284423828125, -0.098907470703125, -0.094970703125, -0.091033935546875, -0.08709716796875, -0.083160400390625, -0.0792236328125, -0.075286865234375, -0.07135009765625, -0.067413330078125, -0.0634765625, -0.059539794921875, -0.05560302734375, -0.051666259765625, -0.0477294921875, -0.043792724609375, -0.03985595703125, -0.035919189453125, -0.031982421875, -0.028045654296875, -0.02410888671875, -0.020172119140625, -0.0162353515625, -0.012298583984375, -0.00836181640625, -0.004425048828125, -0.00048828125, 0.003448486328125, 0.00738525390625, 0.011322021484375, 0.0152587890625, 0.019195556640625, 0.02313232421875, 0.027069091796875, 0.031005859375, 0.034942626953125, 0.03887939453125, 0.042816162109375, 0.0467529296875, 0.050689697265625, 0.05462646484375, 0.058563232421875, 0.0625, 0.066436767578125, 0.07037353515625, 0.074310302734375, 0.0782470703125, 0.082183837890625, 0.08612060546875, 0.090057373046875, 0.093994140625, 0.097930908203125, 0.10186767578125, 0.105804443359375, 0.1097412109375, 0.113677978515625, 0.11761474609375, 0.121551513671875, 0.12548828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 8.0, 12.0, 14.0, 12.0, 19.0, 33.0, 29.0, 50.0, 71.0, 97.0, 122.0, 140.0, 248.0, 390.0, 738.0, 1433.0, 3091.0, 7784.0, 24558.0, 140675.0, 3792160.0, 178472.0, 28227.0, 8649.0, 3393.0, 1649.0, 822.0, 447.0, 271.0, 172.0, 112.0, 86.0, 70.0, 60.0, 36.0, 39.0, 22.0, 19.0, 8.0, 12.0, 9.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66650390625, -0.644683837890625, -0.62286376953125, -0.601043701171875, -0.5792236328125, -0.557403564453125, -0.53558349609375, -0.513763427734375, -0.491943359375, -0.470123291015625, -0.44830322265625, -0.426483154296875, -0.4046630859375, -0.382843017578125, -0.36102294921875, -0.339202880859375, -0.3173828125, -0.295562744140625, -0.27374267578125, -0.251922607421875, -0.2301025390625, -0.208282470703125, -0.18646240234375, -0.164642333984375, -0.142822265625, -0.121002197265625, -0.09918212890625, -0.077362060546875, -0.0555419921875, -0.033721923828125, -0.01190185546875, 0.009918212890625, 0.03173828125, 0.053558349609375, 0.07537841796875, 0.097198486328125, 0.1190185546875, 0.140838623046875, 0.16265869140625, 0.184478759765625, 0.206298828125, 0.228118896484375, 0.24993896484375, 0.271759033203125, 0.2935791015625, 0.315399169921875, 0.33721923828125, 0.359039306640625, 0.380859375, 0.402679443359375, 0.42449951171875, 0.446319580078125, 0.4681396484375, 0.489959716796875, 0.51177978515625, 0.533599853515625, 0.555419921875, 0.577239990234375, 0.59906005859375, 0.620880126953125, 0.6427001953125, 0.664520263671875, 0.68634033203125, 0.708160400390625, 0.72998046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 6.0, 15.0, 16.0, 38.0, 49.0, 110.0, 535.0, 2766.0, 303.0, 98.0, 54.0, 33.0, 12.0, 9.0, 9.0, 8.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3388671875, -0.32732391357421875, -0.3157806396484375, -0.30423736572265625, -0.292694091796875, -0.28115081787109375, -0.2696075439453125, -0.25806427001953125, -0.24652099609375, -0.23497772216796875, -0.2234344482421875, -0.21189117431640625, -0.200347900390625, -0.18880462646484375, -0.1772613525390625, -0.16571807861328125, -0.1541748046875, -0.14263153076171875, -0.1310882568359375, -0.11954498291015625, -0.108001708984375, -0.09645843505859375, -0.0849151611328125, -0.07337188720703125, -0.06182861328125, -0.05028533935546875, -0.0387420654296875, -0.02719879150390625, -0.015655517578125, -0.00411224365234375, 0.0074310302734375, 0.01897430419921875, 0.030517578125, 0.04206085205078125, 0.0536041259765625, 0.06514739990234375, 0.076690673828125, 0.08823394775390625, 0.0997772216796875, 0.11132049560546875, 0.12286376953125, 0.13440704345703125, 0.1459503173828125, 0.15749359130859375, 0.169036865234375, 0.18058013916015625, 0.1921234130859375, 0.20366668701171875, 0.2152099609375, 0.22675323486328125, 0.2382965087890625, 0.24983978271484375, 0.261383056640625, 0.27292633056640625, 0.2844696044921875, 0.29601287841796875, 0.30755615234375, 0.31909942626953125, 0.3306427001953125, 0.34218597412109375, 0.353729248046875, 0.36527252197265625, 0.3768157958984375, 0.38835906982421875, 0.39990234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 9.0, 14.0, 19.0, 42.0, 87.0, 147.0, 162.0, 199.0, 132.0, 83.0, 43.0, 19.0, 10.0, 6.0, 7.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1960293054580688, -1.1452975273132324, -1.0945656299591064, -1.04383385181427, -0.9931020140647888, -0.9423701763153076, -0.8916383981704712, -0.84090656042099, -0.7901747226715088, -0.7394428849220276, -0.6887110471725464, -0.63797926902771, -0.5872474312782288, -0.5365155935287476, -0.48578378558158875, -0.43505197763442993, -0.38432013988494873, -0.33358830213546753, -0.2828564941883087, -0.2321246713399887, -0.1813928484916687, -0.1306610107421875, -0.07992920279502869, -0.029197394847869873, 0.021534442901611328, 0.07226626574993134, 0.12299808859825134, 0.17372991144657135, 0.22446173429489136, 0.27519357204437256, 0.32592537999153137, 0.3766571879386902, 0.42738914489746094, 0.47812098264694214, 0.5288528203964233, 0.5795845985412598, 0.630316436290741, 0.6810482740402222, 0.7317800521850586, 0.7825118899345398, 0.833243727684021, 0.8839755654335022, 0.9347074031829834, 0.9854391813278198, 1.0361709594726562, 1.0869028568267822, 1.1376346349716187, 1.188366413116455, 1.239098310470581, 1.2898300886154175, 1.3405619859695435, 1.3912937641143799, 1.4420256614685059, 1.4927574396133423, 1.5434892177581787, 1.5942211151123047, 1.6449528932571411, 1.6956846714019775, 1.7464165687561035, 1.79714834690094, 1.8478801250457764, 1.8986120223999023, 1.9493438005447388, 2.000075578689575, 2.050807476043701]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 6.0, 12.0, 16.0, 24.0, 26.0, 24.0, 39.0, 36.0, 47.0, 44.0, 47.0, 61.0, 60.0, 59.0, 58.0, 66.0, 60.0, 61.0, 35.0, 35.0, 28.0, 31.0, 29.0, 22.0, 18.0, 14.0, 10.0, 11.0, 8.0, 5.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6312740445137024, -0.6070161461830139, -0.5827583074569702, -0.5585004091262817, -0.5342425107955933, -0.5099846124649048, -0.4857267737388611, -0.4614688754081726, -0.4372110068798065, -0.41295313835144043, -0.38869524002075195, -0.36443737149238586, -0.3401795029640198, -0.3159216046333313, -0.2916637361049652, -0.2674058675765991, -0.24314796924591064, -0.21889008581638336, -0.19463220238685608, -0.17037433385849, -0.1461164504289627, -0.12185856699943542, -0.09760069847106934, -0.07334281504154205, -0.04908493161201477, -0.024827051907777786, -0.000569172203540802, 0.023688703775405884, 0.047946587204933167, 0.07220447063446045, 0.09646233916282654, 0.12072022259235382, 0.14497804641723633, 0.1692359298467636, 0.1934938132762909, 0.21775168180465698, 0.24200956523418427, 0.26626744866371155, 0.29052531719207764, 0.3147832155227661, 0.3390410840511322, 0.3632989525794983, 0.38755685091018677, 0.41181471943855286, 0.43607258796691895, 0.4603304862976074, 0.4845883548259735, 0.5088462233543396, 0.5331041216850281, 0.5573620200157166, 0.5816198587417603, 0.6058777570724487, 0.6301356554031372, 0.6543935537338257, 0.6786513924598694, 0.7029092907905579, 0.7271671295166016, 0.75142502784729, 0.7756828665733337, 0.7999407649040222, 0.8241986632347107, 0.8484565019607544, 0.8727144002914429, 0.8969722986221313, 0.9212301969528198]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 3.0, 5.0, 6.0, 8.0, 6.0, 13.0, 31.0, 45.0, 55.0, 77.0, 129.0, 188.0, 283.0, 458.0, 776.0, 1431.0, 2801.0, 6113.0, 15798.0, 50628.0, 212856.0, 505762.0, 180978.0, 44464.0, 13973.0, 5715.0, 2610.0, 1332.0, 720.0, 461.0, 312.0, 181.0, 92.0, 71.0, 52.0, 35.0, 24.0, 16.0, 11.0, 7.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.55615234375, -0.5404624938964844, -0.5247726440429688, -0.5090827941894531, -0.4933929443359375, -0.4777030944824219, -0.46201324462890625, -0.4463233947753906, -0.430633544921875, -0.4149436950683594, -0.39925384521484375, -0.3835639953613281, -0.3678741455078125, -0.3521842956542969, -0.33649444580078125, -0.3208045959472656, -0.30511474609375, -0.2894248962402344, -0.27373504638671875, -0.2580451965332031, -0.2423553466796875, -0.22666549682617188, -0.21097564697265625, -0.19528579711914062, -0.179595947265625, -0.16390609741210938, -0.14821624755859375, -0.13252639770507812, -0.1168365478515625, -0.10114669799804688, -0.08545684814453125, -0.06976699829101562, -0.0540771484375, -0.038387298583984375, -0.02269744873046875, -0.007007598876953125, 0.0086822509765625, 0.024372100830078125, 0.04006195068359375, 0.055751800537109375, 0.071441650390625, 0.08713150024414062, 0.10282135009765625, 0.11851119995117188, 0.1342010498046875, 0.14989089965820312, 0.16558074951171875, 0.18127059936523438, 0.19696044921875, 0.21265029907226562, 0.22834014892578125, 0.24402999877929688, 0.2597198486328125, 0.2754096984863281, 0.29109954833984375, 0.3067893981933594, 0.322479248046875, 0.3381690979003906, 0.35385894775390625, 0.3695487976074219, 0.3852386474609375, 0.4009284973144531, 0.41661834716796875, 0.4323081970214844, 0.447998046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 6.0, 3.0, 9.0, 7.0, 17.0, 25.0, 30.0, 30.0, 36.0, 39.0, 73.0, 55.0, 70.0, 75.0, 72.0, 75.0, 63.0, 62.0, 49.0, 46.0, 39.0, 28.0, 23.0, 16.0, 13.0, 14.0, 10.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1387939453125, -0.13423919677734375, -0.1296844482421875, -0.12512969970703125, -0.120574951171875, -0.11602020263671875, -0.1114654541015625, -0.10691070556640625, -0.10235595703125, -0.09780120849609375, -0.0932464599609375, -0.08869171142578125, -0.084136962890625, -0.07958221435546875, -0.0750274658203125, -0.07047271728515625, -0.06591796875, -0.06136322021484375, -0.0568084716796875, -0.05225372314453125, -0.047698974609375, -0.04314422607421875, -0.0385894775390625, -0.03403472900390625, -0.02947998046875, -0.02492523193359375, -0.0203704833984375, -0.01581573486328125, -0.011260986328125, -0.00670623779296875, -0.0021514892578125, 0.00240325927734375, 0.0069580078125, 0.01151275634765625, 0.0160675048828125, 0.02062225341796875, 0.025177001953125, 0.02973175048828125, 0.0342864990234375, 0.03884124755859375, 0.04339599609375, 0.04795074462890625, 0.0525054931640625, 0.05706024169921875, 0.061614990234375, 0.06616973876953125, 0.0707244873046875, 0.07527923583984375, 0.079833984375, 0.08438873291015625, 0.0889434814453125, 0.09349822998046875, 0.098052978515625, 0.10260772705078125, 0.1071624755859375, 0.11171722412109375, 0.11627197265625, 0.12082672119140625, 0.1253814697265625, 0.12993621826171875, 0.134490966796875, 0.13904571533203125, 0.1436004638671875, 0.14815521240234375, 0.1527099609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 11.0, 20.0, 21.0, 30.0, 32.0, 45.0, 57.0, 111.0, 162.0, 238.0, 413.0, 740.0, 1308.0, 2926.0, 6666.0, 17349.0, 49846.0, 159461.0, 396677.0, 275140.0, 88858.0, 28867.0, 10699.0, 4340.0, 2015.0, 1017.0, 578.0, 301.0, 217.0, 134.0, 82.0, 65.0, 25.0, 21.0, 22.0, 22.0, 12.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3095703125, -0.2998199462890625, -0.290069580078125, -0.2803192138671875, -0.27056884765625, -0.2608184814453125, -0.251068115234375, -0.2413177490234375, -0.2315673828125, -0.2218170166015625, -0.212066650390625, -0.2023162841796875, -0.19256591796875, -0.1828155517578125, -0.173065185546875, -0.1633148193359375, -0.153564453125, -0.1438140869140625, -0.134063720703125, -0.1243133544921875, -0.11456298828125, -0.1048126220703125, -0.095062255859375, -0.0853118896484375, -0.0755615234375, -0.0658111572265625, -0.056060791015625, -0.0463104248046875, -0.03656005859375, -0.0268096923828125, -0.017059326171875, -0.0073089599609375, 0.00244140625, 0.0121917724609375, 0.021942138671875, 0.0316925048828125, 0.04144287109375, 0.0511932373046875, 0.060943603515625, 0.0706939697265625, 0.0804443359375, 0.0901947021484375, 0.099945068359375, 0.1096954345703125, 0.11944580078125, 0.1291961669921875, 0.138946533203125, 0.1486968994140625, 0.158447265625, 0.1681976318359375, 0.177947998046875, 0.1876983642578125, 0.19744873046875, 0.2071990966796875, 0.216949462890625, 0.2266998291015625, 0.2364501953125, 0.2462005615234375, 0.255950927734375, 0.2657012939453125, 0.27545166015625, 0.2852020263671875, 0.294952392578125, 0.3047027587890625, 0.314453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 10.0, 8.0, 16.0, 17.0, 14.0, 19.0, 24.0, 25.0, 35.0, 25.0, 39.0, 28.0, 39.0, 38.0, 35.0, 40.0, 38.0, 54.0, 39.0, 38.0, 39.0, 38.0, 43.0, 32.0, 43.0, 33.0, 23.0, 17.0, 22.0, 19.0, 15.0, 14.0, 11.0, 13.0, 9.0, 8.0, 5.0, 5.0, 2.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3759765625, -0.363250732421875, -0.35052490234375, -0.337799072265625, -0.3250732421875, -0.312347412109375, -0.29962158203125, -0.286895751953125, -0.274169921875, -0.261444091796875, -0.24871826171875, -0.235992431640625, -0.2232666015625, -0.210540771484375, -0.19781494140625, -0.185089111328125, -0.17236328125, -0.159637451171875, -0.14691162109375, -0.134185791015625, -0.1214599609375, -0.108734130859375, -0.09600830078125, -0.083282470703125, -0.070556640625, -0.057830810546875, -0.04510498046875, -0.032379150390625, -0.0196533203125, -0.006927490234375, 0.00579833984375, 0.018524169921875, 0.03125, 0.043975830078125, 0.05670166015625, 0.069427490234375, 0.0821533203125, 0.094879150390625, 0.10760498046875, 0.120330810546875, 0.133056640625, 0.145782470703125, 0.15850830078125, 0.171234130859375, 0.1839599609375, 0.196685791015625, 0.20941162109375, 0.222137451171875, 0.23486328125, 0.247589111328125, 0.26031494140625, 0.273040771484375, 0.2857666015625, 0.298492431640625, 0.31121826171875, 0.323944091796875, 0.336669921875, 0.349395751953125, 0.36212158203125, 0.374847412109375, 0.3875732421875, 0.400299072265625, 0.41302490234375, 0.425750732421875, 0.4384765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 9.0, 5.0, 16.0, 36.0, 54.0, 207.0, 1288.0, 19211.0, 935264.0, 89349.0, 2540.0, 398.0, 101.0, 31.0, 16.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62646484375, -0.6072921752929688, -0.5881195068359375, -0.5689468383789062, -0.549774169921875, -0.5306015014648438, -0.5114288330078125, -0.49225616455078125, -0.47308349609375, -0.45391082763671875, -0.4347381591796875, -0.41556549072265625, -0.396392822265625, -0.37722015380859375, -0.3580474853515625, -0.33887481689453125, -0.3197021484375, -0.30052947998046875, -0.2813568115234375, -0.26218414306640625, -0.243011474609375, -0.22383880615234375, -0.2046661376953125, -0.18549346923828125, -0.16632080078125, -0.14714813232421875, -0.1279754638671875, -0.10880279541015625, -0.089630126953125, -0.07045745849609375, -0.0512847900390625, -0.03211212158203125, -0.012939453125, 0.00623321533203125, 0.0254058837890625, 0.04457855224609375, 0.063751220703125, 0.08292388916015625, 0.1020965576171875, 0.12126922607421875, 0.14044189453125, 0.15961456298828125, 0.1787872314453125, 0.19795989990234375, 0.217132568359375, 0.23630523681640625, 0.2554779052734375, 0.27465057373046875, 0.2938232421875, 0.31299591064453125, 0.3321685791015625, 0.35134124755859375, 0.370513916015625, 0.38968658447265625, 0.4088592529296875, 0.42803192138671875, 0.44720458984375, 0.46637725830078125, 0.4855499267578125, 0.5047225952148438, 0.523895263671875, 0.5430679321289062, 0.5622406005859375, 0.5814132690429688, 0.6005859375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 11.0, 19.0, 41.0, 64.0, 115.0, 195.0, 187.0, 145.0, 108.0, 45.0, 25.0, 25.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012445449829101562, -0.00012071244418621063, -0.00011697039008140564, -0.00011322833597660065, -0.00010948628187179565, -0.00010574422776699066, -0.00010200217366218567, -9.826011955738068e-05, -9.451806545257568e-05, -9.077601134777069e-05, -8.70339572429657e-05, -8.32919031381607e-05, -7.954984903335571e-05, -7.580779492855072e-05, -7.206574082374573e-05, -6.832368671894073e-05, -6.458163261413574e-05, -6.083957850933075e-05, -5.709752440452576e-05, -5.3355470299720764e-05, -4.961341619491577e-05, -4.587136209011078e-05, -4.2129307985305786e-05, -3.8387253880500793e-05, -3.46451997756958e-05, -3.090314567089081e-05, -2.7161091566085815e-05, -2.3419037461280823e-05, -1.967698335647583e-05, -1.5934929251670837e-05, -1.2192875146865845e-05, -8.450821042060852e-06, -4.708766937255859e-06, -9.667128324508667e-07, 2.775341272354126e-06, 6.517395377159119e-06, 1.0259449481964111e-05, 1.4001503586769104e-05, 1.7743557691574097e-05, 2.148561179637909e-05, 2.5227665901184082e-05, 2.8969720005989075e-05, 3.271177411079407e-05, 3.645382821559906e-05, 4.019588232040405e-05, 4.3937936425209045e-05, 4.767999053001404e-05, 5.142204463481903e-05, 5.5164098739624023e-05, 5.8906152844429016e-05, 6.264820694923401e-05, 6.6390261054039e-05, 7.0132315158844e-05, 7.387436926364899e-05, 7.761642336845398e-05, 8.135847747325897e-05, 8.510053157806396e-05, 8.884258568286896e-05, 9.258463978767395e-05, 9.632669389247894e-05, 0.00010006874799728394, 0.00010381080210208893, 0.00010755285620689392, 0.00011129491031169891, 0.0001150369644165039]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 3.0, 7.0, 12.0, 16.0, 13.0, 34.0, 46.0, 52.0, 112.0, 277.0, 894.0, 5610.0, 127711.0, 880880.0, 29334.0, 2570.0, 544.0, 169.0, 86.0, 58.0, 42.0, 31.0, 14.0, 10.0, 8.0, 5.0, 2.0, 9.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.74365234375, -0.7237167358398438, -0.7037811279296875, -0.6838455200195312, -0.663909912109375, -0.6439743041992188, -0.6240386962890625, -0.6041030883789062, -0.58416748046875, -0.5642318725585938, -0.5442962646484375, -0.5243606567382812, -0.504425048828125, -0.48448944091796875, -0.4645538330078125, -0.44461822509765625, -0.4246826171875, -0.40474700927734375, -0.3848114013671875, -0.36487579345703125, -0.344940185546875, -0.32500457763671875, -0.3050689697265625, -0.28513336181640625, -0.26519775390625, -0.24526214599609375, -0.2253265380859375, -0.20539093017578125, -0.185455322265625, -0.16551971435546875, -0.1455841064453125, -0.12564849853515625, -0.105712890625, -0.08577728271484375, -0.0658416748046875, -0.04590606689453125, -0.025970458984375, -0.00603485107421875, 0.0139007568359375, 0.03383636474609375, 0.05377197265625, 0.07370758056640625, 0.0936431884765625, 0.11357879638671875, 0.133514404296875, 0.15345001220703125, 0.1733856201171875, 0.19332122802734375, 0.2132568359375, 0.23319244384765625, 0.2531280517578125, 0.27306365966796875, 0.292999267578125, 0.31293487548828125, 0.3328704833984375, 0.35280609130859375, 0.37274169921875, 0.39267730712890625, 0.4126129150390625, 0.43254852294921875, 0.452484130859375, 0.47241973876953125, 0.4923553466796875, 0.5122909545898438, 0.5322265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 10.0, 13.0, 34.0, 28.0, 77.0, 84.0, 152.0, 217.0, 167.0, 81.0, 56.0, 33.0, 24.0, 12.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180908203125, -0.16830825805664062, -0.15570831298828125, -0.14310836791992188, -0.1305084228515625, -0.11790847778320312, -0.10530853271484375, -0.09270858764648438, -0.080108642578125, -0.06750869750976562, -0.05490875244140625, -0.042308807373046875, -0.0297088623046875, -0.017108917236328125, -0.00450897216796875, 0.008090972900390625, 0.02069091796875, 0.033290863037109375, 0.04589080810546875, 0.058490753173828125, 0.0710906982421875, 0.08369064331054688, 0.09629058837890625, 0.10889053344726562, 0.121490478515625, 0.13409042358398438, 0.14669036865234375, 0.15929031372070312, 0.1718902587890625, 0.18449020385742188, 0.19709014892578125, 0.20969009399414062, 0.2222900390625, 0.23488998413085938, 0.24748992919921875, 0.2600898742675781, 0.2726898193359375, 0.2852897644042969, 0.29788970947265625, 0.3104896545410156, 0.323089599609375, 0.3356895446777344, 0.34828948974609375, 0.3608894348144531, 0.3734893798828125, 0.3860893249511719, 0.39868927001953125, 0.4112892150878906, 0.42388916015625, 0.4364891052246094, 0.44908905029296875, 0.4616889953613281, 0.4742889404296875, 0.4868888854980469, 0.49948883056640625, 0.5120887756347656, 0.524688720703125, 0.5372886657714844, 0.5498886108398438, 0.5624885559082031, 0.5750885009765625, 0.5876884460449219, 0.6002883911132812, 0.6128883361816406, 0.62548828125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 7.0, 3.0, 22.0, 42.0, 129.0, 248.0, 303.0, 168.0, 60.0, 19.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9821116924285889, -1.7673717737197876, -1.5526318550109863, -1.3378918170928955, -1.1231518983840942, -0.908411979675293, -0.6936719417572021, -0.4789320230484009, -0.2641921043395996, -0.04945215582847595, 0.1652877926826477, 0.38002777099609375, 0.594767689704895, 0.8095076084136963, 1.024247646331787, 1.2389875650405884, 1.4537274837493896, 1.668467402458191, 1.8832073211669922, 2.097947359085083, 2.312687397003174, 2.5274271965026855, 2.7421672344207764, 2.956907272338867, 3.171647071838379, 3.3863871097564697, 3.6011269092559814, 3.8158669471740723, 4.030606746673584, 4.245347023010254, 4.460086822509766, 4.674826622009277, 4.889566421508789, 5.104306221008301, 5.319046497344971, 5.533786296844482, 5.748526096343994, 5.963266372680664, 6.178006172180176, 6.3927459716796875, 6.607485771179199, 6.822225570678711, 7.036965847015381, 7.251705646514893, 7.466445446014404, 7.681185722351074, 7.895925521850586, 8.110665321350098, 8.32540512084961, 8.540144920349121, 8.754884719848633, 8.969625473022461, 9.184365272521973, 9.399105072021484, 9.613844871520996, 9.828584671020508, 10.043325424194336, 10.258065223693848, 10.47280502319336, 10.687545776367188, 10.9022855758667, 11.117025375366211, 11.331765174865723, 11.546504974365234, 11.761244773864746]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 7.0, 4.0, 6.0, 1.0, 5.0, 7.0, 7.0, 11.0, 13.0, 22.0, 17.0, 27.0, 27.0, 29.0, 37.0, 25.0, 41.0, 39.0, 44.0, 38.0, 52.0, 39.0, 46.0, 43.0, 48.0, 41.0, 43.0, 29.0, 38.0, 32.0, 42.0, 30.0, 20.0, 19.0, 29.0, 14.0, 9.0, 9.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.325942039489746, -2.249173164367676, -2.1724042892456055, -2.095635175704956, -2.0188663005828857, -1.9420974254608154, -1.8653285503387451, -1.7885596752166748, -1.711790680885315, -1.6350218057632446, -1.5582528114318848, -1.4814839363098145, -1.4047150611877441, -1.3279460668563843, -1.251177191734314, -1.174408197402954, -1.0976393222808838, -1.0208704471588135, -0.9441014528274536, -0.8673325777053833, -0.7905636429786682, -0.7137947082519531, -0.6370258331298828, -0.5602568984031677, -0.48348796367645264, -0.40671902894973755, -0.32995012402534485, -0.25318121910095215, -0.17641228437423706, -0.09964334964752197, -0.022874444723129272, 0.05389446020126343, 0.13066315650939941, 0.2074320763349533, 0.2842009961605072, 0.3609699010848999, 0.437738835811615, 0.5145077705383301, 0.5912766456604004, 0.6680455803871155, 0.7448145151138306, 0.8215834498405457, 0.8983523845672607, 0.975121259689331, 1.0518901348114014, 1.1286591291427612, 1.2054280042648315, 1.2821969985961914, 1.3589658737182617, 1.435734748840332, 1.512503743171692, 1.5892726182937622, 1.666041612625122, 1.7428104877471924, 1.8195793628692627, 1.896348237991333, 1.9731172323226929, 2.0498862266540527, 2.126655101776123, 2.2034239768981934, 2.2801928520202637, 2.356961727142334, 2.4337308406829834, 2.5104997158050537, 2.587268590927124]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 15.0, 35.0, 40.0, 60.0, 104.0, 184.0, 395.0, 960.0, 4039.0, 35075.0, 4080279.0, 65063.0, 5612.0, 1336.0, 509.0, 232.0, 110.0, 73.0, 54.0, 26.0, 14.0, 13.0, 13.0, 8.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7919921875, -1.7386474609375, -1.685302734375, -1.6319580078125, -1.57861328125, -1.5252685546875, -1.471923828125, -1.4185791015625, -1.365234375, -1.3118896484375, -1.258544921875, -1.2052001953125, -1.15185546875, -1.0985107421875, -1.045166015625, -0.9918212890625, -0.9384765625, -0.8851318359375, -0.831787109375, -0.7784423828125, -0.72509765625, -0.6717529296875, -0.618408203125, -0.5650634765625, -0.51171875, -0.4583740234375, -0.405029296875, -0.3516845703125, -0.29833984375, -0.2449951171875, -0.191650390625, -0.1383056640625, -0.0849609375, -0.0316162109375, 0.021728515625, 0.0750732421875, 0.12841796875, 0.1817626953125, 0.235107421875, 0.2884521484375, 0.341796875, 0.3951416015625, 0.448486328125, 0.5018310546875, 0.55517578125, 0.6085205078125, 0.661865234375, 0.7152099609375, 0.7685546875, 0.8218994140625, 0.875244140625, 0.9285888671875, 0.98193359375, 1.0352783203125, 1.088623046875, 1.1419677734375, 1.1953125, 1.2486572265625, 1.302001953125, 1.3553466796875, 1.40869140625, 1.4620361328125, 1.515380859375, 1.5687255859375, 1.6220703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 9.0, 10.0, 16.0, 15.0, 24.0, 38.0, 40.0, 57.0, 50.0, 77.0, 73.0, 74.0, 90.0, 79.0, 77.0, 57.0, 52.0, 35.0, 32.0, 14.0, 17.0, 29.0, 7.0, 12.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2005615234375, -0.19515228271484375, -0.1897430419921875, -0.18433380126953125, -0.178924560546875, -0.17351531982421875, -0.1681060791015625, -0.16269683837890625, -0.15728759765625, -0.15187835693359375, -0.1464691162109375, -0.14105987548828125, -0.135650634765625, -0.13024139404296875, -0.1248321533203125, -0.11942291259765625, -0.114013671875, -0.10860443115234375, -0.1031951904296875, -0.09778594970703125, -0.092376708984375, -0.08696746826171875, -0.0815582275390625, -0.07614898681640625, -0.07073974609375, -0.06533050537109375, -0.0599212646484375, -0.05451202392578125, -0.049102783203125, -0.04369354248046875, -0.0382843017578125, -0.03287506103515625, -0.0274658203125, -0.02205657958984375, -0.0166473388671875, -0.01123809814453125, -0.005828857421875, -0.00041961669921875, 0.0049896240234375, 0.01039886474609375, 0.01580810546875, 0.02121734619140625, 0.0266265869140625, 0.03203582763671875, 0.037445068359375, 0.04285430908203125, 0.0482635498046875, 0.05367279052734375, 0.05908203125, 0.06449127197265625, 0.0699005126953125, 0.07530975341796875, 0.080718994140625, 0.08612823486328125, 0.0915374755859375, 0.09694671630859375, 0.10235595703125, 0.10776519775390625, 0.1131744384765625, 0.11858367919921875, 0.123992919921875, 0.12940216064453125, 0.1348114013671875, 0.14022064208984375, 0.1456298828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 4.0, 10.0, 8.0, 12.0, 22.0, 54.0, 72.0, 125.0, 185.0, 264.0, 410.0, 741.0, 1232.0, 2121.0, 3990.0, 7727.0, 18037.0, 56192.0, 434681.0, 3425653.0, 179557.0, 36034.0, 13244.0, 6264.0, 3183.0, 1868.0, 968.0, 597.0, 364.0, 249.0, 154.0, 90.0, 53.0, 30.0, 21.0, 22.0, 12.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.485595703125, -0.4700965881347656, -0.45459747314453125, -0.4390983581542969, -0.4235992431640625, -0.4081001281738281, -0.39260101318359375, -0.3771018981933594, -0.361602783203125, -0.3461036682128906, -0.33060455322265625, -0.3151054382324219, -0.2996063232421875, -0.2841072082519531, -0.26860809326171875, -0.2531089782714844, -0.23760986328125, -0.22211074829101562, -0.20661163330078125, -0.19111251831054688, -0.1756134033203125, -0.16011428833007812, -0.14461517333984375, -0.12911605834960938, -0.113616943359375, -0.09811782836914062, -0.08261871337890625, -0.06711959838867188, -0.0516204833984375, -0.036121368408203125, -0.02062225341796875, -0.005123138427734375, 0.0103759765625, 0.025875091552734375, 0.04137420654296875, 0.056873321533203125, 0.0723724365234375, 0.08787155151367188, 0.10337066650390625, 0.11886978149414062, 0.134368896484375, 0.14986801147460938, 0.16536712646484375, 0.18086624145507812, 0.1963653564453125, 0.21186447143554688, 0.22736358642578125, 0.24286270141601562, 0.25836181640625, 0.2738609313964844, 0.28936004638671875, 0.3048591613769531, 0.3203582763671875, 0.3358573913574219, 0.35135650634765625, 0.3668556213378906, 0.382354736328125, 0.3978538513183594, 0.41335296630859375, 0.4288520812988281, 0.4443511962890625, 0.4598503112792969, 0.47534942626953125, 0.4908485412597656, 0.50634765625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 5.0, 11.0, 13.0, 22.0, 40.0, 59.0, 129.0, 270.0, 1297.0, 1602.0, 310.0, 118.0, 66.0, 37.0, 22.0, 13.0, 15.0, 9.0, 7.0, 3.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310546875, -0.29947662353515625, -0.2884063720703125, -0.27733612060546875, -0.266265869140625, -0.25519561767578125, -0.2441253662109375, -0.23305511474609375, -0.22198486328125, -0.21091461181640625, -0.1998443603515625, -0.18877410888671875, -0.177703857421875, -0.16663360595703125, -0.1555633544921875, -0.14449310302734375, -0.1334228515625, -0.12235260009765625, -0.1112823486328125, -0.10021209716796875, -0.089141845703125, -0.07807159423828125, -0.0670013427734375, -0.05593109130859375, -0.04486083984375, -0.03379058837890625, -0.0227203369140625, -0.01165008544921875, -0.000579833984375, 0.01049041748046875, 0.0215606689453125, 0.03263092041015625, 0.043701171875, 0.05477142333984375, 0.0658416748046875, 0.07691192626953125, 0.087982177734375, 0.09905242919921875, 0.1101226806640625, 0.12119293212890625, 0.13226318359375, 0.14333343505859375, 0.1544036865234375, 0.16547393798828125, 0.176544189453125, 0.18761444091796875, 0.1986846923828125, 0.20975494384765625, 0.2208251953125, 0.23189544677734375, 0.2429656982421875, 0.25403594970703125, 0.265106201171875, 0.27617645263671875, 0.2872467041015625, 0.29831695556640625, 0.30938720703125, 0.32045745849609375, 0.3315277099609375, 0.34259796142578125, 0.353668212890625, 0.36473846435546875, 0.3758087158203125, 0.38687896728515625, 0.39794921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 8.0, 19.0, 38.0, 142.0, 325.0, 297.0, 113.0, 46.0, 12.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.530750274658203, -6.402678966522217, -6.274608135223389, -6.146536827087402, -6.018465995788574, -5.890394687652588, -5.76232385635376, -5.634252548217773, -5.506181716918945, -5.378110408782959, -5.250039577484131, -5.1219682693481445, -4.993897438049316, -4.86582612991333, -4.737755298614502, -4.609683990478516, -4.481612682342529, -4.353541374206543, -4.225470542907715, -4.0973992347717285, -3.9693284034729004, -3.841257095336914, -3.713186025619507, -3.5851149559020996, -3.4570438861846924, -3.328972816467285, -3.200901746749878, -3.0728306770324707, -2.9447593688964844, -2.8166885375976562, -2.68861722946167, -2.5605461597442627, -2.4324750900268555, -2.3044040203094482, -2.176332950592041, -2.048261880874634, -1.920190691947937, -1.7921196222305298, -1.664048433303833, -1.5359773635864258, -1.407906174659729, -1.2798351049423218, -1.151763916015625, -1.0236928462982178, -0.8956217765808105, -0.7675507068634033, -0.6394795775413513, -0.5114084482192993, -0.3833373785018921, -0.2552662789821625, -0.12719517946243286, 0.0008759200572967529, 0.12894701957702637, 0.2570180892944336, 0.3850892186164856, 0.5131603479385376, 0.6412314176559448, 0.769302487373352, 0.897373616695404, 1.025444746017456, 1.1535158157348633, 1.2815868854522705, 1.4096579551696777, 1.5377291440963745, 1.6658002138137817]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 6.0, 14.0, 10.0, 17.0, 26.0, 18.0, 18.0, 35.0, 27.0, 38.0, 48.0, 32.0, 38.0, 43.0, 47.0, 51.0, 46.0, 46.0, 38.0, 46.0, 37.0, 39.0, 41.0, 33.0, 31.0, 27.0, 20.0, 19.0, 23.0, 13.0, 16.0, 6.0, 9.0, 7.0, 5.0, 4.0, 9.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7322551012039185, -0.7076852917671204, -0.6831154823303223, -0.6585456728935242, -0.6339758634567261, -0.6094059944152832, -0.5848362445831299, -0.560266375541687, -0.5356965661048889, -0.5111267566680908, -0.4865569472312927, -0.46198713779449463, -0.43741729855537415, -0.41284748911857605, -0.38827767968177795, -0.36370784044265747, -0.33913806080818176, -0.31456825137138367, -0.28999844193458557, -0.2654286026954651, -0.240858793258667, -0.2162889838218689, -0.1917191743850708, -0.1671493500471115, -0.14257954061031342, -0.11800972372293472, -0.09343990683555603, -0.06887009739875793, -0.04430028051137924, -0.01973046362400055, 0.004839345812797546, 0.029409170150756836, 0.05397897958755493, 0.07854879647493362, 0.10311861336231232, 0.1276884227991104, 0.1522582471370697, 0.1768280565738678, 0.2013978660106659, 0.22596769034862518, 0.2505375146865845, 0.27510732412338257, 0.29967713356018066, 0.32424694299697876, 0.34881678223609924, 0.37338659167289734, 0.39795640110969543, 0.4225262403488159, 0.4470960199832916, 0.4716658294200897, 0.4962356388568878, 0.5208054780960083, 0.5453752875328064, 0.5699450969696045, 0.5945149064064026, 0.6190847158432007, 0.6436545252799988, 0.6682243347167969, 0.692794144153595, 0.7173639535903931, 0.7419337630271912, 0.7665035724639893, 0.7910734415054321, 0.8156432509422302, 0.8402130603790283]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 2.0, 4.0, 10.0, 14.0, 8.0, 12.0, 33.0, 41.0, 52.0, 90.0, 125.0, 175.0, 318.0, 514.0, 781.0, 1393.0, 2484.0, 4741.0, 9942.0, 24102.0, 67219.0, 202524.0, 381536.0, 226972.0, 76100.0, 26798.0, 11072.0, 5093.0, 2673.0, 1442.0, 797.0, 506.0, 334.0, 210.0, 128.0, 104.0, 58.0, 35.0, 29.0, 28.0, 21.0, 11.0, 5.0, 4.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.465087890625, -0.4520072937011719, -0.43892669677734375, -0.4258460998535156, -0.4127655029296875, -0.3996849060058594, -0.38660430908203125, -0.3735237121582031, -0.360443115234375, -0.3473625183105469, -0.33428192138671875, -0.3212013244628906, -0.3081207275390625, -0.2950401306152344, -0.28195953369140625, -0.2688789367675781, -0.25579833984375, -0.24271774291992188, -0.22963714599609375, -0.21655654907226562, -0.2034759521484375, -0.19039535522460938, -0.17731475830078125, -0.16423416137695312, -0.151153564453125, -0.13807296752929688, -0.12499237060546875, -0.11191177368164062, -0.0988311767578125, -0.08575057983398438, -0.07266998291015625, -0.059589385986328125, -0.0465087890625, -0.033428192138671875, -0.02034759521484375, -0.007266998291015625, 0.0058135986328125, 0.018894195556640625, 0.03197479248046875, 0.045055389404296875, 0.058135986328125, 0.07121658325195312, 0.08429718017578125, 0.09737777709960938, 0.1104583740234375, 0.12353897094726562, 0.13661956787109375, 0.14970016479492188, 0.16278076171875, 0.17586135864257812, 0.18894195556640625, 0.20202255249023438, 0.2151031494140625, 0.22818374633789062, 0.24126434326171875, 0.2543449401855469, 0.267425537109375, 0.2805061340332031, 0.29358673095703125, 0.3066673278808594, 0.3197479248046875, 0.3328285217285156, 0.34590911865234375, 0.3589897155761719, 0.3720703125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 6.0, 12.0, 14.0, 15.0, 18.0, 22.0, 37.0, 30.0, 26.0, 49.0, 61.0, 58.0, 61.0, 61.0, 62.0, 65.0, 59.0, 53.0, 49.0, 52.0, 38.0, 30.0, 25.0, 21.0, 12.0, 17.0, 10.0, 5.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1368408203125, -0.13217544555664062, -0.12751007080078125, -0.12284469604492188, -0.1181793212890625, -0.11351394653320312, -0.10884857177734375, -0.10418319702148438, -0.099517822265625, -0.09485244750976562, -0.09018707275390625, -0.08552169799804688, -0.0808563232421875, -0.07619094848632812, -0.07152557373046875, -0.06686019897460938, -0.06219482421875, -0.057529449462890625, -0.05286407470703125, -0.048198699951171875, -0.0435333251953125, -0.038867950439453125, -0.03420257568359375, -0.029537200927734375, -0.024871826171875, -0.020206451416015625, -0.01554107666015625, -0.010875701904296875, -0.0062103271484375, -0.001544952392578125, 0.00312042236328125, 0.007785797119140625, 0.012451171875, 0.017116546630859375, 0.02178192138671875, 0.026447296142578125, 0.0311126708984375, 0.035778045654296875, 0.04044342041015625, 0.045108795166015625, 0.049774169921875, 0.054439544677734375, 0.05910491943359375, 0.06377029418945312, 0.0684356689453125, 0.07310104370117188, 0.07776641845703125, 0.08243179321289062, 0.08709716796875, 0.09176254272460938, 0.09642791748046875, 0.10109329223632812, 0.1057586669921875, 0.11042404174804688, 0.11508941650390625, 0.11975479125976562, 0.124420166015625, 0.12908554077148438, 0.13375091552734375, 0.13841629028320312, 0.1430816650390625, 0.14774703979492188, 0.15241241455078125, 0.15707778930664062, 0.1617431640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 17.0, 19.0, 20.0, 16.0, 27.0, 35.0, 63.0, 89.0, 130.0, 181.0, 363.0, 569.0, 1088.0, 2116.0, 4624.0, 10130.0, 24381.0, 63275.0, 173159.0, 355654.0, 253740.0, 96026.0, 35655.0, 14577.0, 6404.0, 2929.0, 1439.0, 720.0, 392.0, 234.0, 148.0, 88.0, 52.0, 40.0, 40.0, 20.0, 18.0, 16.0, 11.0, 6.0, 3.0, 10.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.3330078125, -0.32312774658203125, -0.3132476806640625, -0.30336761474609375, -0.293487548828125, -0.28360748291015625, -0.2737274169921875, -0.26384735107421875, -0.25396728515625, -0.24408721923828125, -0.2342071533203125, -0.22432708740234375, -0.214447021484375, -0.20456695556640625, -0.1946868896484375, -0.18480682373046875, -0.1749267578125, -0.16504669189453125, -0.1551666259765625, -0.14528656005859375, -0.135406494140625, -0.12552642822265625, -0.1156463623046875, -0.10576629638671875, -0.09588623046875, -0.08600616455078125, -0.0761260986328125, -0.06624603271484375, -0.056365966796875, -0.04648590087890625, -0.0366058349609375, -0.02672576904296875, -0.016845703125, -0.00696563720703125, 0.0029144287109375, 0.01279449462890625, 0.022674560546875, 0.03255462646484375, 0.0424346923828125, 0.05231475830078125, 0.06219482421875, 0.07207489013671875, 0.0819549560546875, 0.09183502197265625, 0.101715087890625, 0.11159515380859375, 0.1214752197265625, 0.13135528564453125, 0.1412353515625, 0.15111541748046875, 0.1609954833984375, 0.17087554931640625, 0.180755615234375, 0.19063568115234375, 0.2005157470703125, 0.21039581298828125, 0.22027587890625, 0.23015594482421875, 0.2400360107421875, 0.24991607666015625, 0.259796142578125, 0.26967620849609375, 0.2795562744140625, 0.28943634033203125, 0.29931640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 9.0, 12.0, 12.0, 13.0, 3.0, 12.0, 17.0, 18.0, 18.0, 22.0, 20.0, 29.0, 25.0, 38.0, 33.0, 30.0, 29.0, 29.0, 41.0, 37.0, 31.0, 31.0, 39.0, 53.0, 38.0, 41.0, 40.0, 22.0, 30.0, 29.0, 27.0, 18.0, 16.0, 20.0, 15.0, 15.0, 11.0, 6.0, 7.0, 7.0, 13.0, 11.0, 1.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0], "bins": [-0.432373046875, -0.4186210632324219, -0.40486907958984375, -0.3911170959472656, -0.3773651123046875, -0.3636131286621094, -0.34986114501953125, -0.3361091613769531, -0.322357177734375, -0.3086051940917969, -0.29485321044921875, -0.2811012268066406, -0.2673492431640625, -0.2535972595214844, -0.23984527587890625, -0.22609329223632812, -0.21234130859375, -0.19858932495117188, -0.18483734130859375, -0.17108535766601562, -0.1573333740234375, -0.14358139038085938, -0.12982940673828125, -0.11607742309570312, -0.102325439453125, -0.08857345581054688, -0.07482147216796875, -0.061069488525390625, -0.0473175048828125, -0.033565521240234375, -0.01981353759765625, -0.006061553955078125, 0.0076904296875, 0.021442413330078125, 0.03519439697265625, 0.048946380615234375, 0.0626983642578125, 0.07645034790039062, 0.09020233154296875, 0.10395431518554688, 0.117706298828125, 0.13145828247070312, 0.14521026611328125, 0.15896224975585938, 0.1727142333984375, 0.18646621704101562, 0.20021820068359375, 0.21397018432617188, 0.22772216796875, 0.24147415161132812, 0.25522613525390625, 0.2689781188964844, 0.2827301025390625, 0.2964820861816406, 0.31023406982421875, 0.3239860534667969, 0.337738037109375, 0.3514900207519531, 0.36524200439453125, 0.3789939880371094, 0.3927459716796875, 0.4064979553222656, 0.42024993896484375, 0.4340019226074219, 0.44775390625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 6.0, 6.0, 8.0, 19.0, 37.0, 61.0, 95.0, 208.0, 498.0, 1426.0, 5774.0, 43892.0, 412471.0, 513002.0, 60925.0, 7368.0, 1701.0, 544.0, 241.0, 120.0, 56.0, 34.0, 29.0, 9.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253173828125, -0.245025634765625, -0.23687744140625, -0.228729248046875, -0.2205810546875, -0.212432861328125, -0.20428466796875, -0.196136474609375, -0.18798828125, -0.179840087890625, -0.17169189453125, -0.163543701171875, -0.1553955078125, -0.147247314453125, -0.13909912109375, -0.130950927734375, -0.122802734375, -0.114654541015625, -0.10650634765625, -0.098358154296875, -0.0902099609375, -0.082061767578125, -0.07391357421875, -0.065765380859375, -0.0576171875, -0.049468994140625, -0.04132080078125, -0.033172607421875, -0.0250244140625, -0.016876220703125, -0.00872802734375, -0.000579833984375, 0.007568359375, 0.015716552734375, 0.02386474609375, 0.032012939453125, 0.0401611328125, 0.048309326171875, 0.05645751953125, 0.064605712890625, 0.07275390625, 0.080902099609375, 0.08905029296875, 0.097198486328125, 0.1053466796875, 0.113494873046875, 0.12164306640625, 0.129791259765625, 0.137939453125, 0.146087646484375, 0.15423583984375, 0.162384033203125, 0.1705322265625, 0.178680419921875, 0.18682861328125, 0.194976806640625, 0.203125, 0.211273193359375, 0.21942138671875, 0.227569580078125, 0.2357177734375, 0.243865966796875, 0.25201416015625, 0.260162353515625, 0.268310546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 2.0, 11.0, 6.0, 19.0, 12.0, 23.0, 28.0, 36.0, 48.0, 52.0, 65.0, 90.0, 89.0, 85.0, 79.0, 77.0, 62.0, 40.0, 37.0, 45.0, 24.0, 20.0, 17.0, 11.0, 9.0, 4.0, 9.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07099723815918e-05, -3.915838897228241e-05, -3.760680556297302e-05, -3.6055222153663635e-05, -3.450363874435425e-05, -3.295205533504486e-05, -3.1400471925735474e-05, -2.9848888516426086e-05, -2.82973051071167e-05, -2.6745721697807312e-05, -2.5194138288497925e-05, -2.3642554879188538e-05, -2.209097146987915e-05, -2.0539388060569763e-05, -1.8987804651260376e-05, -1.743622124195099e-05, -1.58846378326416e-05, -1.4333054423332214e-05, -1.2781471014022827e-05, -1.122988760471344e-05, -9.678304195404053e-06, -8.126720786094666e-06, -6.575137376785278e-06, -5.023553967475891e-06, -3.471970558166504e-06, -1.9203871488571167e-06, -3.688037395477295e-07, 1.1827796697616577e-06, 2.734363079071045e-06, 4.285946488380432e-06, 5.837529897689819e-06, 7.3891133069992065e-06, 8.940696716308594e-06, 1.0492280125617981e-05, 1.2043863534927368e-05, 1.3595446944236755e-05, 1.5147030353546143e-05, 1.669861376285553e-05, 1.8250197172164917e-05, 1.9801780581474304e-05, 2.135336399078369e-05, 2.290494740009308e-05, 2.4456530809402466e-05, 2.6008114218711853e-05, 2.755969762802124e-05, 2.9111281037330627e-05, 3.0662864446640015e-05, 3.22144478559494e-05, 3.376603126525879e-05, 3.5317614674568176e-05, 3.6869198083877563e-05, 3.842078149318695e-05, 3.997236490249634e-05, 4.1523948311805725e-05, 4.307553172111511e-05, 4.46271151304245e-05, 4.617869853973389e-05, 4.7730281949043274e-05, 4.928186535835266e-05, 5.083344876766205e-05, 5.2385032176971436e-05, 5.393661558628082e-05, 5.548819899559021e-05, 5.70397824048996e-05, 5.8591365814208984e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 4.0, 3.0, 5.0, 9.0, 12.0, 15.0, 36.0, 37.0, 59.0, 97.0, 127.0, 210.0, 325.0, 559.0, 1008.0, 1787.0, 3401.0, 7530.0, 19556.0, 56732.0, 169107.0, 350808.0, 274573.0, 104917.0, 34360.0, 12289.0, 5181.0, 2511.0, 1334.0, 707.0, 470.0, 294.0, 164.0, 88.0, 67.0, 42.0, 23.0, 29.0, 17.0, 19.0, 9.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.142578125, -0.1382274627685547, -0.13387680053710938, -0.12952613830566406, -0.12517547607421875, -0.12082481384277344, -0.11647415161132812, -0.11212348937988281, -0.1077728271484375, -0.10342216491699219, -0.09907150268554688, -0.09472084045410156, -0.09037017822265625, -0.08601951599121094, -0.08166885375976562, -0.07731819152832031, -0.072967529296875, -0.06861686706542969, -0.06426620483398438, -0.05991554260253906, -0.05556488037109375, -0.05121421813964844, -0.046863555908203125, -0.04251289367675781, -0.0381622314453125, -0.03381156921386719, -0.029460906982421875, -0.025110244750976562, -0.02075958251953125, -0.016408920288085938, -0.012058258056640625, -0.0077075958251953125, -0.00335693359375, 0.0009937286376953125, 0.005344390869140625, 0.009695053100585938, 0.01404571533203125, 0.018396377563476562, 0.022747039794921875, 0.027097702026367188, 0.0314483642578125, 0.03579902648925781, 0.040149688720703125, 0.04450035095214844, 0.04885101318359375, 0.05320167541503906, 0.057552337646484375, 0.06190299987792969, 0.066253662109375, 0.07060432434082031, 0.07495498657226562, 0.07930564880371094, 0.08365631103515625, 0.08800697326660156, 0.09235763549804688, 0.09670829772949219, 0.1010589599609375, 0.10540962219238281, 0.10976028442382812, 0.11411094665527344, 0.11846160888671875, 0.12281227111816406, 0.12716293334960938, 0.1315135955810547, 0.1358642578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 2.0, 1.0, 8.0, 7.0, 13.0, 8.0, 14.0, 12.0, 24.0, 22.0, 27.0, 62.0, 52.0, 37.0, 64.0, 68.0, 78.0, 56.0, 66.0, 71.0, 52.0, 46.0, 46.0, 45.0, 22.0, 25.0, 17.0, 17.0, 12.0, 12.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.138427734375, -0.1337451934814453, -0.12906265258789062, -0.12438011169433594, -0.11969757080078125, -0.11501502990722656, -0.11033248901367188, -0.10564994812011719, -0.1009674072265625, -0.09628486633300781, -0.09160232543945312, -0.08691978454589844, -0.08223724365234375, -0.07755470275878906, -0.07287216186523438, -0.06818962097167969, -0.063507080078125, -0.05882453918457031, -0.054141998291015625, -0.04945945739746094, -0.04477691650390625, -0.04009437561035156, -0.035411834716796875, -0.030729293823242188, -0.0260467529296875, -0.021364212036132812, -0.016681671142578125, -0.011999130249023438, -0.00731658935546875, -0.0026340484619140625, 0.002048492431640625, 0.0067310333251953125, 0.01141357421875, 0.016096115112304688, 0.020778656005859375, 0.025461196899414062, 0.03014373779296875, 0.03482627868652344, 0.039508819580078125, 0.04419136047363281, 0.0488739013671875, 0.05355644226074219, 0.058238983154296875, 0.06292152404785156, 0.06760406494140625, 0.07228660583496094, 0.07696914672851562, 0.08165168762207031, 0.086334228515625, 0.09101676940917969, 0.09569931030273438, 0.10038185119628906, 0.10506439208984375, 0.10974693298339844, 0.11442947387695312, 0.11911201477050781, 0.1237945556640625, 0.1284770965576172, 0.13315963745117188, 0.13784217834472656, 0.14252471923828125, 0.14720726013183594, 0.15188980102539062, 0.1565723419189453, 0.1612548828125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 11.0, 16.0, 42.0, 155.0, 289.0, 287.0, 132.0, 55.0, 18.0, 5.0, 3.0, 2.0, 1.0], "bins": [-14.008438110351562, -13.756943702697754, -13.505448341369629, -13.25395393371582, -13.002458572387695, -12.750964164733887, -12.499468803405762, -12.247974395751953, -11.996479034423828, -11.74498462677002, -11.493489265441895, -11.241994857788086, -10.990499496459961, -10.739005088806152, -10.487509727478027, -10.236015319824219, -9.984519958496094, -9.733025550842285, -9.48153018951416, -9.230035781860352, -8.978540420532227, -8.727046012878418, -8.475550651550293, -8.224056243896484, -7.972561836242676, -7.721066951751709, -7.469572067260742, -7.218077182769775, -6.966582298278809, -6.715087413787842, -6.463592529296875, -6.212098121643066, -5.960602760314941, -5.709107875823975, -5.457612991333008, -5.206118106842041, -4.954623222351074, -4.703128337860107, -4.451633453369141, -4.200139045715332, -3.948643922805786, -3.6971490383148193, -3.4456541538238525, -3.194159507751465, -2.942664623260498, -2.6911697387695312, -2.4396748542785645, -2.1881799697875977, -1.9366850852966309, -1.685190200805664, -1.4336953163146973, -1.18220055103302, -0.9307056665420532, -0.6792107820510864, -0.4277160167694092, -0.17622113227844238, 0.07527375221252441, 0.3267686069011688, 0.5782634615898132, 0.8297582864761353, 1.081253170967102, 1.3327480554580688, 1.584242820739746, 1.835737705230713, 2.0872325897216797]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 9.0, 11.0, 8.0, 5.0, 10.0, 19.0, 13.0, 21.0, 8.0, 23.0, 34.0, 27.0, 26.0, 35.0, 39.0, 35.0, 43.0, 35.0, 60.0, 46.0, 44.0, 38.0, 47.0, 44.0, 44.0, 42.0, 39.0, 27.0, 25.0, 23.0, 14.0, 12.0, 22.0, 14.0, 13.0, 9.0, 11.0, 8.0, 12.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.7802035808563232, -2.7022509574890137, -2.624298334121704, -2.5463454723358154, -2.468392848968506, -2.3904402256011963, -2.3124876022338867, -2.234534740447998, -2.1565821170806885, -2.078629493713379, -2.0006768703460693, -1.9227241277694702, -1.844771385192871, -1.7668187618255615, -1.688866138458252, -1.6109133958816528, -1.5329607725143433, -1.4550081491470337, -1.3770554065704346, -1.299102783203125, -1.2211500406265259, -1.1431974172592163, -1.0652446746826172, -0.9872920513153076, -0.9093393683433533, -0.8313866853713989, -0.7534340023994446, -0.6754813194274902, -0.5975286960601807, -0.5195759534835815, -0.441623330116272, -0.3636706471443176, -0.2857179641723633, -0.20776528120040894, -0.12981261312961578, -0.05185994505882263, 0.026092737913131714, 0.10404542088508606, 0.18199807405471802, 0.25995075702667236, 0.3379034399986267, 0.41585612297058105, 0.4938088059425354, 0.5717614889144897, 0.6497141122817993, 0.7276668548583984, 0.805619478225708, 0.8835721611976624, 0.9615248441696167, 1.0394774675369263, 1.1174302101135254, 1.195382833480835, 1.273335576057434, 1.3512881994247437, 1.4292409420013428, 1.5071935653686523, 1.585146188735962, 1.6630988121032715, 1.7410515546798706, 1.8190041780471802, 1.8969569206237793, 1.9749095439910889, 2.0528621673583984, 2.130815029144287, 2.2087676525115967]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 0.0, 5.0, 5.0, 5.0, 12.0, 12.0, 13.0, 26.0, 47.0, 77.0, 129.0, 231.0, 460.0, 1110.0, 3085.0, 13986.0, 4054425.0, 109916.0, 7193.0, 1914.0, 768.0, 331.0, 165.0, 123.0, 80.0, 52.0, 20.0, 26.0, 15.0, 13.0, 11.0, 5.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -0.994110107421875, -0.95404052734375, -0.913970947265625, -0.8739013671875, -0.833831787109375, -0.79376220703125, -0.753692626953125, -0.713623046875, -0.673553466796875, -0.63348388671875, -0.593414306640625, -0.5533447265625, -0.513275146484375, -0.47320556640625, -0.433135986328125, -0.39306640625, -0.352996826171875, -0.31292724609375, -0.272857666015625, -0.2327880859375, -0.192718505859375, -0.15264892578125, -0.112579345703125, -0.072509765625, -0.032440185546875, 0.00762939453125, 0.047698974609375, 0.0877685546875, 0.127838134765625, 0.16790771484375, 0.207977294921875, 0.248046875, 0.288116455078125, 0.32818603515625, 0.368255615234375, 0.4083251953125, 0.448394775390625, 0.48846435546875, 0.528533935546875, 0.568603515625, 0.608673095703125, 0.64874267578125, 0.688812255859375, 0.7288818359375, 0.768951416015625, 0.80902099609375, 0.849090576171875, 0.88916015625, 0.929229736328125, 0.96929931640625, 1.009368896484375, 1.0494384765625, 1.089508056640625, 1.12957763671875, 1.169647216796875, 1.209716796875, 1.249786376953125, 1.28985595703125, 1.329925537109375, 1.3699951171875, 1.410064697265625, 1.45013427734375, 1.490203857421875, 1.5302734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 9.0, 2.0, 3.0, 10.0, 11.0, 8.0, 14.0, 17.0, 15.0, 24.0, 37.0, 36.0, 42.0, 49.0, 56.0, 52.0, 67.0, 43.0, 41.0, 48.0, 68.0, 50.0, 48.0, 45.0, 38.0, 32.0, 29.0, 20.0, 14.0, 25.0, 15.0, 12.0, 8.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1395263671875, -0.13458633422851562, -0.12964630126953125, -0.12470626831054688, -0.1197662353515625, -0.11482620239257812, -0.10988616943359375, -0.10494613647460938, -0.100006103515625, -0.09506607055664062, -0.09012603759765625, -0.08518600463867188, -0.0802459716796875, -0.07530593872070312, -0.07036590576171875, -0.06542587280273438, -0.06048583984375, -0.055545806884765625, -0.05060577392578125, -0.045665740966796875, -0.0407257080078125, -0.035785675048828125, -0.03084564208984375, -0.025905609130859375, -0.020965576171875, -0.016025543212890625, -0.01108551025390625, -0.006145477294921875, -0.0012054443359375, 0.003734588623046875, 0.00867462158203125, 0.013614654541015625, 0.0185546875, 0.023494720458984375, 0.02843475341796875, 0.033374786376953125, 0.0383148193359375, 0.043254852294921875, 0.04819488525390625, 0.053134918212890625, 0.058074951171875, 0.06301498413085938, 0.06795501708984375, 0.07289505004882812, 0.0778350830078125, 0.08277511596679688, 0.08771514892578125, 0.09265518188476562, 0.09759521484375, 0.10253524780273438, 0.10747528076171875, 0.11241531372070312, 0.1173553466796875, 0.12229537963867188, 0.12723541259765625, 0.13217544555664062, 0.137115478515625, 0.14205551147460938, 0.14699554443359375, 0.15193557739257812, 0.1568756103515625, 0.16181564331054688, 0.16675567626953125, 0.17169570922851562, 0.1766357421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 7.0, 10.0, 13.0, 26.0, 24.0, 48.0, 61.0, 86.0, 120.0, 189.0, 264.0, 383.0, 629.0, 976.0, 1525.0, 2617.0, 4821.0, 11207.0, 46896.0, 3354583.0, 713822.0, 35437.0, 9619.0, 4371.0, 2367.0, 1498.0, 900.0, 566.0, 391.0, 248.0, 171.0, 114.0, 97.0, 58.0, 42.0, 24.0, 20.0, 16.0, 18.0, 4.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.445068359375, -0.4285392761230469, -0.41201019287109375, -0.3954811096191406, -0.3789520263671875, -0.3624229431152344, -0.34589385986328125, -0.3293647766113281, -0.312835693359375, -0.2963066101074219, -0.27977752685546875, -0.2632484436035156, -0.2467193603515625, -0.23019027709960938, -0.21366119384765625, -0.19713211059570312, -0.18060302734375, -0.16407394409179688, -0.14754486083984375, -0.13101577758789062, -0.1144866943359375, -0.09795761108398438, -0.08142852783203125, -0.06489944458007812, -0.048370361328125, -0.031841278076171875, -0.01531219482421875, 0.001216888427734375, 0.0177459716796875, 0.034275054931640625, 0.05080413818359375, 0.06733322143554688, 0.0838623046875, 0.10039138793945312, 0.11692047119140625, 0.13344955444335938, 0.1499786376953125, 0.16650772094726562, 0.18303680419921875, 0.19956588745117188, 0.216094970703125, 0.23262405395507812, 0.24915313720703125, 0.2656822204589844, 0.2822113037109375, 0.2987403869628906, 0.31526947021484375, 0.3317985534667969, 0.34832763671875, 0.3648567199707031, 0.38138580322265625, 0.3979148864746094, 0.4144439697265625, 0.4309730529785156, 0.44750213623046875, 0.4640312194824219, 0.480560302734375, 0.4970893859863281, 0.5136184692382812, 0.5301475524902344, 0.5466766357421875, 0.5632057189941406, 0.5797348022460938, 0.5962638854980469, 0.61279296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 1.0, 9.0, 13.0, 10.0, 23.0, 51.0, 97.0, 302.0, 2995.0, 360.0, 98.0, 46.0, 21.0, 12.0, 7.0, 1.0, 5.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11993408203125, -0.11572551727294922, -0.11151695251464844, -0.10730838775634766, -0.10309982299804688, -0.0988912582397461, -0.09468269348144531, -0.09047412872314453, -0.08626556396484375, -0.08205699920654297, -0.07784843444824219, -0.0736398696899414, -0.06943130493164062, -0.06522274017333984, -0.06101417541503906, -0.05680561065673828, -0.0525970458984375, -0.04838848114013672, -0.04417991638183594, -0.039971351623535156, -0.035762786865234375, -0.031554222106933594, -0.027345657348632812, -0.02313709259033203, -0.01892852783203125, -0.014719963073730469, -0.010511398315429688, -0.006302833557128906, -0.002094268798828125, 0.0021142959594726562, 0.0063228607177734375, 0.010531425476074219, 0.014739990234375, 0.01894855499267578, 0.023157119750976562, 0.027365684509277344, 0.031574249267578125, 0.035782814025878906, 0.03999137878417969, 0.04419994354248047, 0.04840850830078125, 0.05261707305908203, 0.05682563781738281, 0.061034202575683594, 0.06524276733398438, 0.06945133209228516, 0.07365989685058594, 0.07786846160888672, 0.0820770263671875, 0.08628559112548828, 0.09049415588378906, 0.09470272064208984, 0.09891128540039062, 0.1031198501586914, 0.10732841491699219, 0.11153697967529297, 0.11574554443359375, 0.11995410919189453, 0.12416267395019531, 0.1283712387084961, 0.13257980346679688, 0.13678836822509766, 0.14099693298339844, 0.14520549774169922, 0.1494140625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 11.0, 17.0, 19.0, 42.0, 58.0, 102.0, 103.0, 130.0, 123.0, 126.0, 67.0, 80.0, 38.0, 24.0, 20.0, 14.0, 12.0, 9.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.7795180678367615, -0.763255774974823, -0.7469934821128845, -0.730731189250946, -0.7144688963890076, -0.6982066035270691, -0.6819443106651306, -0.6656820178031921, -0.6494197249412537, -0.6331574320793152, -0.6168951392173767, -0.6006328463554382, -0.5843705534934998, -0.5681082606315613, -0.5518459677696228, -0.5355836749076843, -0.5193213224411011, -0.5030590295791626, -0.4867967367172241, -0.47053444385528564, -0.45427215099334717, -0.4380098581314087, -0.4217475652694702, -0.40548527240753174, -0.38922297954559326, -0.3729606866836548, -0.3566983938217163, -0.34043610095977783, -0.32417380809783936, -0.3079115152359009, -0.2916492223739624, -0.2753869295120239, -0.25912463665008545, -0.24286234378814697, -0.2266000509262085, -0.21033775806427002, -0.19407546520233154, -0.17781317234039307, -0.1615508645772934, -0.14528857171535492, -0.12902627885341644, -0.11276398599147797, -0.09650169312953949, -0.08023939281702042, -0.06397709995508194, -0.04771480709314346, -0.03145250678062439, -0.015190213918685913, 0.0010720789432525635, 0.01733437366783619, 0.033596668392419815, 0.04985896497964859, 0.06612125784158707, 0.08238355070352554, 0.09864585101604462, 0.1149081438779831, 0.13117043673992157, 0.14743272960186005, 0.16369502246379852, 0.1799573302268982, 0.19621962308883667, 0.21248191595077515, 0.22874420881271362, 0.2450065016746521, 0.2612687945365906]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 4.0, 5.0, 12.0, 8.0, 11.0, 16.0, 8.0, 14.0, 10.0, 17.0, 23.0, 26.0, 24.0, 27.0, 24.0, 33.0, 34.0, 45.0, 41.0, 49.0, 34.0, 28.0, 23.0, 37.0, 38.0, 36.0, 34.0, 24.0, 34.0, 20.0, 32.0, 22.0, 32.0, 27.0, 14.0, 25.0, 18.0, 21.0, 10.0, 7.0, 11.0, 9.0, 5.0, 5.0, 7.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-0.21808671951293945, -0.21139484643936157, -0.2047029733657837, -0.19801108539104462, -0.19131921231746674, -0.18462733924388885, -0.17793545126914978, -0.1712435781955719, -0.16455170512199402, -0.15785983204841614, -0.15116795897483826, -0.14447607100009918, -0.1377841979265213, -0.13109232485294342, -0.12440044432878494, -0.11770856380462646, -0.11101669073104858, -0.1043248176574707, -0.09763293713331223, -0.09094105660915375, -0.08424918353557587, -0.07755731046199799, -0.07086542993783951, -0.06417354941368103, -0.05748167634010315, -0.05078979954123497, -0.04409792274236679, -0.03740604594349861, -0.030714169144630432, -0.024022292345762253, -0.017330415546894073, -0.010638538748025894, -0.003946661949157715, 0.0027452148497104645, 0.009437091648578644, 0.016128968447446823, 0.022820845246315002, 0.029512722045183182, 0.03620459884405136, 0.04289647564291954, 0.04958835244178772, 0.0562802292406559, 0.06297210603952408, 0.06966398656368256, 0.07635585963726044, 0.08304773271083832, 0.0897396132349968, 0.09643149375915527, 0.10312336683273315, 0.10981523990631104, 0.11650712043046951, 0.12319900095462799, 0.12989087402820587, 0.13658274710178375, 0.14327463507652283, 0.1499665081501007, 0.1566583812236786, 0.16335025429725647, 0.17004212737083435, 0.17673401534557343, 0.1834258884191513, 0.1901177614927292, 0.19680964946746826, 0.20350152254104614, 0.21019339561462402]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 9.0, 15.0, 21.0, 21.0, 37.0, 60.0, 91.0, 150.0, 260.0, 423.0, 694.0, 1286.0, 2355.0, 5026.0, 11580.0, 29226.0, 82209.0, 228130.0, 363360.0, 204695.0, 72408.0, 26465.0, 10477.0, 4594.0, 2207.0, 1073.0, 595.0, 404.0, 231.0, 146.0, 109.0, 55.0, 37.0, 26.0, 21.0, 7.0, 6.0, 9.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.384765625, -0.37169647216796875, -0.3586273193359375, -0.34555816650390625, -0.332489013671875, -0.31941986083984375, -0.3063507080078125, -0.29328155517578125, -0.28021240234375, -0.26714324951171875, -0.2540740966796875, -0.24100494384765625, -0.227935791015625, -0.21486663818359375, -0.2017974853515625, -0.18872833251953125, -0.1756591796875, -0.16259002685546875, -0.1495208740234375, -0.13645172119140625, -0.123382568359375, -0.11031341552734375, -0.0972442626953125, -0.08417510986328125, -0.07110595703125, -0.05803680419921875, -0.0449676513671875, -0.03189849853515625, -0.018829345703125, -0.00576019287109375, 0.0073089599609375, 0.02037811279296875, 0.033447265625, 0.04651641845703125, 0.0595855712890625, 0.07265472412109375, 0.085723876953125, 0.09879302978515625, 0.1118621826171875, 0.12493133544921875, 0.13800048828125, 0.15106964111328125, 0.1641387939453125, 0.17720794677734375, 0.190277099609375, 0.20334625244140625, 0.2164154052734375, 0.22948455810546875, 0.2425537109375, 0.25562286376953125, 0.2686920166015625, 0.28176116943359375, 0.294830322265625, 0.30789947509765625, 0.3209686279296875, 0.33403778076171875, 0.34710693359375, 0.36017608642578125, 0.3732452392578125, 0.38631439208984375, 0.399383544921875, 0.41245269775390625, 0.4255218505859375, 0.43859100341796875, 0.45166015625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 10.0, 9.0, 11.0, 10.0, 19.0, 25.0, 24.0, 19.0, 34.0, 29.0, 38.0, 49.0, 53.0, 49.0, 50.0, 57.0, 57.0, 47.0, 49.0, 47.0, 57.0, 36.0, 32.0, 32.0, 28.0, 25.0, 20.0, 21.0, 17.0, 12.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.133544921875, -0.128631591796875, -0.12371826171875, -0.118804931640625, -0.1138916015625, -0.108978271484375, -0.10406494140625, -0.099151611328125, -0.09423828125, -0.089324951171875, -0.08441162109375, -0.079498291015625, -0.0745849609375, -0.069671630859375, -0.06475830078125, -0.059844970703125, -0.054931640625, -0.050018310546875, -0.04510498046875, -0.040191650390625, -0.0352783203125, -0.030364990234375, -0.02545166015625, -0.020538330078125, -0.015625, -0.010711669921875, -0.00579833984375, -0.000885009765625, 0.0040283203125, 0.008941650390625, 0.01385498046875, 0.018768310546875, 0.023681640625, 0.028594970703125, 0.03350830078125, 0.038421630859375, 0.0433349609375, 0.048248291015625, 0.05316162109375, 0.058074951171875, 0.06298828125, 0.067901611328125, 0.07281494140625, 0.077728271484375, 0.0826416015625, 0.087554931640625, 0.09246826171875, 0.097381591796875, 0.102294921875, 0.107208251953125, 0.11212158203125, 0.117034912109375, 0.1219482421875, 0.126861572265625, 0.13177490234375, 0.136688232421875, 0.1416015625, 0.146514892578125, 0.15142822265625, 0.156341552734375, 0.1612548828125, 0.166168212890625, 0.17108154296875, 0.175994873046875, 0.180908203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 11.0, 5.0, 9.0, 6.0, 8.0, 13.0, 16.0, 29.0, 45.0, 60.0, 80.0, 132.0, 173.0, 327.0, 577.0, 1198.0, 2865.0, 7715.0, 23932.0, 91478.0, 402281.0, 391617.0, 89511.0, 23295.0, 7592.0, 2922.0, 1258.0, 548.0, 306.0, 172.0, 108.0, 75.0, 52.0, 40.0, 33.0, 19.0, 18.0, 10.0, 5.0, 9.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423828125, -0.4101524353027344, -0.39647674560546875, -0.3828010559082031, -0.3691253662109375, -0.3554496765136719, -0.34177398681640625, -0.3280982971191406, -0.314422607421875, -0.3007469177246094, -0.28707122802734375, -0.2733955383300781, -0.2597198486328125, -0.24604415893554688, -0.23236846923828125, -0.21869277954101562, -0.20501708984375, -0.19134140014648438, -0.17766571044921875, -0.16399002075195312, -0.1503143310546875, -0.13663864135742188, -0.12296295166015625, -0.10928726196289062, -0.095611572265625, -0.08193588256835938, -0.06826019287109375, -0.054584503173828125, -0.0409088134765625, -0.027233123779296875, -0.01355743408203125, 0.000118255615234375, 0.0137939453125, 0.027469635009765625, 0.04114532470703125, 0.054821014404296875, 0.0684967041015625, 0.08217239379882812, 0.09584808349609375, 0.10952377319335938, 0.123199462890625, 0.13687515258789062, 0.15055084228515625, 0.16422653198242188, 0.1779022216796875, 0.19157791137695312, 0.20525360107421875, 0.21892929077148438, 0.23260498046875, 0.24628067016601562, 0.25995635986328125, 0.2736320495605469, 0.2873077392578125, 0.3009834289550781, 0.31465911865234375, 0.3283348083496094, 0.342010498046875, 0.3556861877441406, 0.36936187744140625, 0.3830375671386719, 0.3967132568359375, 0.4103889465332031, 0.42406463623046875, 0.4377403259277344, 0.451416015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 3.0, 11.0, 8.0, 19.0, 10.0, 16.0, 16.0, 19.0, 22.0, 26.0, 26.0, 29.0, 27.0, 44.0, 36.0, 40.0, 31.0, 45.0, 44.0, 39.0, 48.0, 49.0, 43.0, 33.0, 42.0, 37.0, 28.0, 34.0, 23.0, 25.0, 13.0, 18.0, 9.0, 11.0, 15.0, 15.0, 6.0, 7.0, 7.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55712890625, -0.5382843017578125, -0.519439697265625, -0.5005950927734375, -0.48175048828125, -0.4629058837890625, -0.444061279296875, -0.4252166748046875, -0.4063720703125, -0.3875274658203125, -0.368682861328125, -0.3498382568359375, -0.33099365234375, -0.3121490478515625, -0.293304443359375, -0.2744598388671875, -0.255615234375, -0.2367706298828125, -0.217926025390625, -0.1990814208984375, -0.18023681640625, -0.1613922119140625, -0.142547607421875, -0.1237030029296875, -0.1048583984375, -0.0860137939453125, -0.067169189453125, -0.0483245849609375, -0.02947998046875, -0.0106353759765625, 0.008209228515625, 0.0270538330078125, 0.0458984375, 0.0647430419921875, 0.083587646484375, 0.1024322509765625, 0.12127685546875, 0.1401214599609375, 0.158966064453125, 0.1778106689453125, 0.1966552734375, 0.2154998779296875, 0.234344482421875, 0.2531890869140625, 0.27203369140625, 0.2908782958984375, 0.309722900390625, 0.3285675048828125, 0.347412109375, 0.3662567138671875, 0.385101318359375, 0.4039459228515625, 0.42279052734375, 0.4416351318359375, 0.460479736328125, 0.4793243408203125, 0.4981689453125, 0.5170135498046875, 0.535858154296875, 0.5547027587890625, 0.57354736328125, 0.5923919677734375, 0.611236572265625, 0.6300811767578125, 0.64892578125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 3.0, 3.0, 4.0, 7.0, 7.0, 6.0, 7.0, 13.0, 29.0, 25.0, 34.0, 68.0, 91.0, 145.0, 236.0, 358.0, 708.0, 1599.0, 4815.0, 20832.0, 182744.0, 711160.0, 105004.0, 14220.0, 3581.0, 1314.0, 613.0, 328.0, 170.0, 137.0, 95.0, 53.0, 37.0, 34.0, 27.0, 13.0, 6.0, 6.0, 8.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30859375, -0.2993507385253906, -0.29010772705078125, -0.2808647155761719, -0.2716217041015625, -0.2623786926269531, -0.25313568115234375, -0.24389266967773438, -0.234649658203125, -0.22540664672851562, -0.21616363525390625, -0.20692062377929688, -0.1976776123046875, -0.18843460083007812, -0.17919158935546875, -0.16994857788085938, -0.16070556640625, -0.15146255493164062, -0.14221954345703125, -0.13297653198242188, -0.1237335205078125, -0.11449050903320312, -0.10524749755859375, -0.09600448608398438, -0.086761474609375, -0.07751846313476562, -0.06827545166015625, -0.059032440185546875, -0.0497894287109375, -0.040546417236328125, -0.03130340576171875, -0.022060394287109375, -0.0128173828125, -0.003574371337890625, 0.00566864013671875, 0.014911651611328125, 0.0241546630859375, 0.033397674560546875, 0.04264068603515625, 0.051883697509765625, 0.061126708984375, 0.07036972045898438, 0.07961273193359375, 0.08885574340820312, 0.0980987548828125, 0.10734176635742188, 0.11658477783203125, 0.12582778930664062, 0.13507080078125, 0.14431381225585938, 0.15355682373046875, 0.16279983520507812, 0.1720428466796875, 0.18128585815429688, 0.19052886962890625, 0.19977188110351562, 0.209014892578125, 0.21825790405273438, 0.22750091552734375, 0.23674392700195312, 0.2459869384765625, 0.2552299499511719, 0.26447296142578125, 0.2737159729003906, 0.282958984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 6.0, 21.0, 27.0, 50.0, 62.0, 113.0, 127.0, 137.0, 135.0, 99.0, 86.0, 58.0, 34.0, 16.0, 10.0, 7.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.810924530029297e-05, -9.52649861574173e-05, -9.242072701454163e-05, -8.957646787166595e-05, -8.673220872879028e-05, -8.388794958591461e-05, -8.104369044303894e-05, -7.819943130016327e-05, -7.53551721572876e-05, -7.251091301441193e-05, -6.966665387153625e-05, -6.682239472866058e-05, -6.397813558578491e-05, -6.113387644290924e-05, -5.828961730003357e-05, -5.54453581571579e-05, -5.2601099014282227e-05, -4.9756839871406555e-05, -4.6912580728530884e-05, -4.406832158565521e-05, -4.122406244277954e-05, -3.837980329990387e-05, -3.55355441570282e-05, -3.269128501415253e-05, -2.9847025871276855e-05, -2.7002766728401184e-05, -2.4158507585525513e-05, -2.131424844264984e-05, -1.846998929977417e-05, -1.56257301568985e-05, -1.2781471014022827e-05, -9.937211871147156e-06, -7.092952728271484e-06, -4.248693585395813e-06, -1.4044344425201416e-06, 1.4398247003555298e-06, 4.284083843231201e-06, 7.1283429861068726e-06, 9.972602128982544e-06, 1.2816861271858215e-05, 1.5661120414733887e-05, 1.8505379557609558e-05, 2.134963870048523e-05, 2.41938978433609e-05, 2.7038156986236572e-05, 2.9882416129112244e-05, 3.2726675271987915e-05, 3.5570934414863586e-05, 3.841519355773926e-05, 4.125945270061493e-05, 4.41037118434906e-05, 4.694797098636627e-05, 4.979223012924194e-05, 5.2636489272117615e-05, 5.5480748414993286e-05, 5.832500755786896e-05, 6.116926670074463e-05, 6.40135258436203e-05, 6.685778498649597e-05, 6.970204412937164e-05, 7.254630327224731e-05, 7.539056241512299e-05, 7.823482155799866e-05, 8.107908070087433e-05, 8.392333984375e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 11.0, 13.0, 9.0, 11.0, 16.0, 37.0, 49.0, 56.0, 100.0, 167.0, 253.0, 462.0, 858.0, 1688.0, 3691.0, 9435.0, 30083.0, 118385.0, 470343.0, 309970.0, 70827.0, 19634.0, 6734.0, 2764.0, 1302.0, 654.0, 370.0, 218.0, 133.0, 81.0, 56.0, 36.0, 29.0, 19.0, 10.0, 12.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.2015380859375, -0.1947803497314453, -0.18802261352539062, -0.18126487731933594, -0.17450714111328125, -0.16774940490722656, -0.16099166870117188, -0.1542339324951172, -0.1474761962890625, -0.1407184600830078, -0.13396072387695312, -0.12720298767089844, -0.12044525146484375, -0.11368751525878906, -0.10692977905273438, -0.10017204284667969, -0.093414306640625, -0.08665657043457031, -0.07989883422851562, -0.07314109802246094, -0.06638336181640625, -0.05962562561035156, -0.052867889404296875, -0.04611015319824219, -0.0393524169921875, -0.03259468078613281, -0.025836944580078125, -0.019079208374023438, -0.01232147216796875, -0.0055637359619140625, 0.001194000244140625, 0.007951736450195312, 0.01470947265625, 0.021467208862304688, 0.028224945068359375, 0.03498268127441406, 0.04174041748046875, 0.04849815368652344, 0.055255889892578125, 0.06201362609863281, 0.0687713623046875, 0.07552909851074219, 0.08228683471679688, 0.08904457092285156, 0.09580230712890625, 0.10256004333496094, 0.10931777954101562, 0.11607551574707031, 0.122833251953125, 0.1295909881591797, 0.13634872436523438, 0.14310646057128906, 0.14986419677734375, 0.15662193298339844, 0.16337966918945312, 0.1701374053955078, 0.1768951416015625, 0.1836528778076172, 0.19041061401367188, 0.19716835021972656, 0.20392608642578125, 0.21068382263183594, 0.21744155883789062, 0.2241992950439453, 0.23095703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 8.0, 9.0, 15.0, 22.0, 22.0, 20.0, 26.0, 46.0, 60.0, 82.0, 74.0, 99.0, 98.0, 70.0, 86.0, 70.0, 30.0, 33.0, 28.0, 18.0, 22.0, 12.0, 10.0, 7.0, 11.0, 3.0, 6.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3095703125, -0.3012199401855469, -0.29286956787109375, -0.2845191955566406, -0.2761688232421875, -0.2678184509277344, -0.25946807861328125, -0.2511177062988281, -0.242767333984375, -0.23441696166992188, -0.22606658935546875, -0.21771621704101562, -0.2093658447265625, -0.20101547241210938, -0.19266510009765625, -0.18431472778320312, -0.17596435546875, -0.16761398315429688, -0.15926361083984375, -0.15091323852539062, -0.1425628662109375, -0.13421249389648438, -0.12586212158203125, -0.11751174926757812, -0.109161376953125, -0.10081100463867188, -0.09246063232421875, -0.08411026000976562, -0.0757598876953125, -0.06740951538085938, -0.05905914306640625, -0.050708770751953125, -0.0423583984375, -0.034008026123046875, -0.02565765380859375, -0.017307281494140625, -0.0089569091796875, -0.000606536865234375, 0.00774383544921875, 0.016094207763671875, 0.024444580078125, 0.032794952392578125, 0.04114532470703125, 0.049495697021484375, 0.0578460693359375, 0.06619644165039062, 0.07454681396484375, 0.08289718627929688, 0.09124755859375, 0.09959793090820312, 0.10794830322265625, 0.11629867553710938, 0.1246490478515625, 0.13299942016601562, 0.14134979248046875, 0.14970016479492188, 0.158050537109375, 0.16640090942382812, 0.17475128173828125, 0.18310165405273438, 0.1914520263671875, 0.19980239868164062, 0.20815277099609375, 0.21650314331054688, 0.224853515625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 17.0, 56.0, 100.0, 143.0, 194.0, 183.0, 131.0, 81.0, 43.0, 19.0, 11.0, 10.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.588495254516602, -4.403305530548096, -4.218116283416748, -4.032926559448242, -3.8477370738983154, -3.6625475883483887, -3.477357864379883, -3.292168378829956, -3.1069788932800293, -2.9217894077301025, -2.7365996837615967, -2.55141019821167, -2.366220712661743, -2.1810312271118164, -1.9958415031433105, -1.8106520175933838, -1.625462293624878, -1.4402726888656616, -1.2550832033157349, -1.0698935985565186, -0.884704053401947, -0.6995145082473755, -0.5143249034881592, -0.3291354179382324, -0.1439458131790161, 0.041243746876716614, 0.22643330693244934, 0.41162288188934326, 0.5968124270439148, 0.7820019721984863, 0.9671915769577026, 1.1523810625076294, 1.3375706672668457, 1.522760272026062, 1.7079497575759888, 1.893139362335205, 2.078328847885132, 2.2635183334350586, 2.4487080574035645, 2.633897542953491, 2.819087028503418, 3.0042765140533447, 3.1894662380218506, 3.3746557235717773, 3.559845209121704, 3.745034694671631, 3.9302244186401367, 4.115413665771484, 4.300603866577148, 4.485793590545654, 4.670982837677002, 4.856172561645508, 5.041362285614014, 5.226551532745361, 5.411741256713867, 5.596930503845215, 5.782120227813721, 5.967309951782227, 6.152499198913574, 6.33768892288208, 6.522878646850586, 6.708067893981934, 6.8932576179504395, 7.078447341918945, 7.263636589050293]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 7.0, 7.0, 14.0, 9.0, 24.0, 9.0, 21.0, 14.0, 24.0, 29.0, 34.0, 29.0, 36.0, 28.0, 52.0, 40.0, 38.0, 59.0, 38.0, 43.0, 47.0, 29.0, 43.0, 38.0, 32.0, 25.0, 27.0, 37.0, 20.0, 23.0, 15.0, 9.0, 15.0, 16.0, 10.0, 7.0, 10.0, 8.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.9503173828125, -2.857133626937866, -2.7639496326446533, -2.6707658767700195, -2.5775818824768066, -2.484398126602173, -2.391214370727539, -2.298030376434326, -2.2048466205596924, -2.1116628646850586, -2.0184788703918457, -1.925295114517212, -1.8321112394332886, -1.7389273643493652, -1.6457436084747314, -1.552559733390808, -1.4593758583068848, -1.3661919832229614, -1.273008108139038, -1.1798243522644043, -1.086640477180481, -0.9934566020965576, -0.900272786617279, -0.8070889711380005, -0.7139050960540771, -0.6207212209701538, -0.5275374054908752, -0.4343535602092743, -0.34116971492767334, -0.2479858696460724, -0.15480202436447144, -0.06161820888519287, 0.03156566619873047, 0.12474951148033142, 0.21793335676193237, 0.3111172020435333, 0.4043010473251343, 0.49748489260673523, 0.5906687378883362, 0.6838525533676147, 0.7770364284515381, 0.8702203035354614, 0.96340411901474, 1.0565879344940186, 1.149771809577942, 1.2429556846618652, 1.336139440536499, 1.4293233156204224, 1.5225071907043457, 1.615691065788269, 1.7088749408721924, 1.8020586967468262, 1.8952425718307495, 1.9884264469146729, 2.0816102027893066, 2.1747941970825195, 2.2679779529571533, 2.361161708831787, 2.454345703125, 2.547529458999634, 2.6407132148742676, 2.7338972091674805, 2.8270809650421143, 2.920264720916748, 3.013448715209961]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 9.0, 14.0, 12.0, 26.0, 35.0, 74.0, 102.0, 185.0, 324.0, 632.0, 1287.0, 3489.0, 14055.0, 142589.0, 3950784.0, 66012.0, 9483.0, 2843.0, 1095.0, 512.0, 292.0, 146.0, 100.0, 56.0, 34.0, 22.0, 14.0, 15.0, 15.0, 0.0, 2.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6005859375, -0.5814437866210938, -0.5623016357421875, -0.5431594848632812, -0.524017333984375, -0.5048751831054688, -0.4857330322265625, -0.46659088134765625, -0.44744873046875, -0.42830657958984375, -0.4091644287109375, -0.39002227783203125, -0.370880126953125, -0.35173797607421875, -0.3325958251953125, -0.31345367431640625, -0.2943115234375, -0.27516937255859375, -0.2560272216796875, -0.23688507080078125, -0.217742919921875, -0.19860076904296875, -0.1794586181640625, -0.16031646728515625, -0.14117431640625, -0.12203216552734375, -0.1028900146484375, -0.08374786376953125, -0.064605712890625, -0.04546356201171875, -0.0263214111328125, -0.00717926025390625, 0.011962890625, 0.03110504150390625, 0.0502471923828125, 0.06938934326171875, 0.088531494140625, 0.10767364501953125, 0.1268157958984375, 0.14595794677734375, 0.16510009765625, 0.18424224853515625, 0.2033843994140625, 0.22252655029296875, 0.241668701171875, 0.26081085205078125, 0.2799530029296875, 0.29909515380859375, 0.3182373046875, 0.33737945556640625, 0.3565216064453125, 0.37566375732421875, 0.394805908203125, 0.41394805908203125, 0.4330902099609375, 0.45223236083984375, 0.47137451171875, 0.49051666259765625, 0.5096588134765625, 0.5288009643554688, 0.547943115234375, 0.5670852661132812, 0.5862274169921875, 0.6053695678710938, 0.62451171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 0.0, 11.0, 10.0, 6.0, 7.0, 22.0, 13.0, 25.0, 25.0, 28.0, 30.0, 35.0, 50.0, 50.0, 64.0, 67.0, 66.0, 77.0, 78.0, 60.0, 61.0, 39.0, 35.0, 32.0, 33.0, 22.0, 16.0, 16.0, 11.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156982421875, -0.15033721923828125, -0.1436920166015625, -0.13704681396484375, -0.130401611328125, -0.12375640869140625, -0.1171112060546875, -0.11046600341796875, -0.10382080078125, -0.09717559814453125, -0.0905303955078125, -0.08388519287109375, -0.077239990234375, -0.07059478759765625, -0.0639495849609375, -0.05730438232421875, -0.0506591796875, -0.04401397705078125, -0.0373687744140625, -0.03072357177734375, -0.024078369140625, -0.01743316650390625, -0.0107879638671875, -0.00414276123046875, 0.00250244140625, 0.00914764404296875, 0.0157928466796875, 0.02243804931640625, 0.029083251953125, 0.03572845458984375, 0.0423736572265625, 0.04901885986328125, 0.0556640625, 0.06230926513671875, 0.0689544677734375, 0.07559967041015625, 0.082244873046875, 0.08889007568359375, 0.0955352783203125, 0.10218048095703125, 0.10882568359375, 0.11547088623046875, 0.1221160888671875, 0.12876129150390625, 0.135406494140625, 0.14205169677734375, 0.1486968994140625, 0.15534210205078125, 0.1619873046875, 0.16863250732421875, 0.1752777099609375, 0.18192291259765625, 0.188568115234375, 0.19521331787109375, 0.2018585205078125, 0.20850372314453125, 0.21514892578125, 0.22179412841796875, 0.2284393310546875, 0.23508453369140625, 0.241729736328125, 0.24837493896484375, 0.2550201416015625, 0.26166534423828125, 0.268310546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 5.0, 5.0, 8.0, 17.0, 17.0, 26.0, 26.0, 34.0, 68.0, 73.0, 82.0, 132.0, 179.0, 250.0, 364.0, 546.0, 892.0, 1546.0, 2984.0, 6479.0, 18598.0, 82365.0, 2578721.0, 1396667.0, 73682.0, 17196.0, 6168.0, 2910.0, 1495.0, 864.0, 541.0, 374.0, 272.0, 193.0, 148.0, 104.0, 72.0, 41.0, 28.0, 37.0, 23.0, 12.0, 11.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444580078125, -0.4292335510253906, -0.41388702392578125, -0.3985404968261719, -0.3831939697265625, -0.3678474426269531, -0.35250091552734375, -0.3371543884277344, -0.321807861328125, -0.3064613342285156, -0.29111480712890625, -0.2757682800292969, -0.2604217529296875, -0.24507522583007812, -0.22972869873046875, -0.21438217163085938, -0.19903564453125, -0.18368911743164062, -0.16834259033203125, -0.15299606323242188, -0.1376495361328125, -0.12230300903320312, -0.10695648193359375, -0.09160995483398438, -0.076263427734375, -0.060916900634765625, -0.04557037353515625, -0.030223846435546875, -0.0148773193359375, 0.000469207763671875, 0.01581573486328125, 0.031162261962890625, 0.0465087890625, 0.061855316162109375, 0.07720184326171875, 0.09254837036132812, 0.1078948974609375, 0.12324142456054688, 0.13858795166015625, 0.15393447875976562, 0.169281005859375, 0.18462753295898438, 0.19997406005859375, 0.21532058715820312, 0.2306671142578125, 0.24601364135742188, 0.26136016845703125, 0.2767066955566406, 0.29205322265625, 0.3073997497558594, 0.32274627685546875, 0.3380928039550781, 0.3534393310546875, 0.3687858581542969, 0.38413238525390625, 0.3994789123535156, 0.414825439453125, 0.4301719665527344, 0.44551849365234375, 0.4608650207519531, 0.4762115478515625, 0.4915580749511719, 0.5069046020507812, 0.5222511291503906, 0.53759765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 7.0, 5.0, 6.0, 19.0, 28.0, 38.0, 76.0, 151.0, 417.0, 2150.0, 704.0, 218.0, 89.0, 49.0, 36.0, 18.0, 15.0, 12.0, 10.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1517333984375, -0.14679336547851562, -0.14185333251953125, -0.13691329956054688, -0.1319732666015625, -0.12703323364257812, -0.12209320068359375, -0.11715316772460938, -0.112213134765625, -0.10727310180664062, -0.10233306884765625, -0.09739303588867188, -0.0924530029296875, -0.08751296997070312, -0.08257293701171875, -0.07763290405273438, -0.07269287109375, -0.06775283813476562, -0.06281280517578125, -0.057872772216796875, -0.0529327392578125, -0.047992706298828125, -0.04305267333984375, -0.038112640380859375, -0.033172607421875, -0.028232574462890625, -0.02329254150390625, -0.018352508544921875, -0.0134124755859375, -0.008472442626953125, -0.00353240966796875, 0.001407623291015625, 0.00634765625, 0.011287689208984375, 0.01622772216796875, 0.021167755126953125, 0.0261077880859375, 0.031047821044921875, 0.03598785400390625, 0.040927886962890625, 0.045867919921875, 0.050807952880859375, 0.05574798583984375, 0.060688018798828125, 0.0656280517578125, 0.07056808471679688, 0.07550811767578125, 0.08044815063476562, 0.08538818359375, 0.09032821655273438, 0.09526824951171875, 0.10020828247070312, 0.1051483154296875, 0.11008834838867188, 0.11502838134765625, 0.11996841430664062, 0.124908447265625, 0.12984848022460938, 0.13478851318359375, 0.13972854614257812, 0.1446685791015625, 0.14960861206054688, 0.15454864501953125, 0.15948867797851562, 0.1644287109375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 3.0, 13.0, 9.0, 20.0, 37.0, 58.0, 103.0, 108.0, 136.0, 140.0, 136.0, 105.0, 57.0, 29.0, 15.0, 8.0, 6.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0267754793167114, -0.9971585869789124, -0.9675417542457581, -0.937924861907959, -0.9083080291748047, -0.8786911368370056, -0.8490742444992065, -0.8194574117660522, -0.789840579032898, -0.7602236866950989, -0.7306068539619446, -0.7009899616241455, -0.6713731288909912, -0.6417562365531921, -0.6121393442153931, -0.5825225114822388, -0.5529056191444397, -0.5232887268066406, -0.49367189407348633, -0.46405500173568726, -0.43443816900253296, -0.4048212766647339, -0.3752044141292572, -0.3455875515937805, -0.31597068905830383, -0.28635382652282715, -0.25673696398735046, -0.22712008655071259, -0.1975032240152359, -0.16788636147975922, -0.13826948404312134, -0.10865262150764465, -0.07903575897216797, -0.049418892711400986, -0.019802026450634003, 0.009814843535423279, 0.03943170607089996, 0.06904856860637665, 0.09866544604301453, 0.1282823085784912, 0.1578991711139679, 0.18751603364944458, 0.21713289618492126, 0.24674977362155914, 0.276366651058197, 0.3059834837913513, 0.3356003761291504, 0.3652172386646271, 0.39483410120010376, 0.42445096373558044, 0.45406782627105713, 0.4836847186088562, 0.5133015513420105, 0.5429184436798096, 0.5725352764129639, 0.6021521687507629, 0.631769061088562, 0.6613859534263611, 0.6910027861595154, 0.7206196784973145, 0.7502365112304688, 0.7798534035682678, 0.8094702959060669, 0.8390871286392212, 0.8687039613723755]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 14.0, 11.0, 14.0, 20.0, 15.0, 17.0, 22.0, 22.0, 36.0, 39.0, 43.0, 46.0, 42.0, 43.0, 49.0, 63.0, 44.0, 49.0, 51.0, 48.0, 39.0, 36.0, 50.0, 31.0, 27.0, 23.0, 14.0, 18.0, 18.0, 12.0, 9.0, 14.0, 5.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47379982471466064, -0.4570058286190033, -0.44021180272102356, -0.4234178066253662, -0.4066237807273865, -0.3898297846317291, -0.3730357885360718, -0.35624176263809204, -0.3394477665424347, -0.32265377044677734, -0.3058597445487976, -0.28906574845314026, -0.2722717523574829, -0.2554777264595032, -0.23868373036384583, -0.22188971936702728, -0.20509570837020874, -0.1883016973733902, -0.17150768637657166, -0.1547136902809143, -0.13791967928409576, -0.12112566828727722, -0.10433166474103928, -0.08753766119480133, -0.07074365019798279, -0.053949642926454544, -0.0371556356549263, -0.020361628383398056, -0.003567621111869812, 0.01322638988494873, 0.030020393431186676, 0.04681439697742462, 0.06360840797424316, 0.0804024189710617, 0.09719642251729965, 0.1139904260635376, 0.13078443706035614, 0.14757844805717468, 0.16437244415283203, 0.18116645514965057, 0.19796046614646912, 0.21475447714328766, 0.2315484881401062, 0.24834248423576355, 0.2651364803314209, 0.28193050622940063, 0.298724502325058, 0.31551849842071533, 0.33231252431869507, 0.3491065204143524, 0.36590054631233215, 0.3826945424079895, 0.39948856830596924, 0.4162825644016266, 0.43307656049728394, 0.44987058639526367, 0.466664582490921, 0.48345857858657837, 0.5002526044845581, 0.5170466303825378, 0.5338405966758728, 0.5506346225738525, 0.5674286484718323, 0.5842226147651672, 0.601016640663147]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 2.0, 5.0, 12.0, 18.0, 25.0, 29.0, 39.0, 76.0, 109.0, 202.0, 381.0, 803.0, 1729.0, 4339.0, 12604.0, 40753.0, 153738.0, 424449.0, 293128.0, 80765.0, 22756.0, 7323.0, 2829.0, 1182.0, 569.0, 257.0, 169.0, 89.0, 59.0, 41.0, 21.0, 19.0, 13.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.35137176513671875, -0.3382415771484375, -0.32511138916015625, -0.311981201171875, -0.29885101318359375, -0.2857208251953125, -0.27259063720703125, -0.25946044921875, -0.24633026123046875, -0.2332000732421875, -0.22006988525390625, -0.206939697265625, -0.19380950927734375, -0.1806793212890625, -0.16754913330078125, -0.1544189453125, -0.14128875732421875, -0.1281585693359375, -0.11502838134765625, -0.101898193359375, -0.08876800537109375, -0.0756378173828125, -0.06250762939453125, -0.04937744140625, -0.03624725341796875, -0.0231170654296875, -0.00998687744140625, 0.003143310546875, 0.01627349853515625, 0.0294036865234375, 0.04253387451171875, 0.0556640625, 0.06879425048828125, 0.0819244384765625, 0.09505462646484375, 0.108184814453125, 0.12131500244140625, 0.1344451904296875, 0.14757537841796875, 0.16070556640625, 0.17383575439453125, 0.1869659423828125, 0.20009613037109375, 0.213226318359375, 0.22635650634765625, 0.2394866943359375, 0.25261688232421875, 0.2657470703125, 0.27887725830078125, 0.2920074462890625, 0.30513763427734375, 0.318267822265625, 0.33139801025390625, 0.3445281982421875, 0.35765838623046875, 0.37078857421875, 0.38391876220703125, 0.3970489501953125, 0.41017913818359375, 0.423309326171875, 0.43643951416015625, 0.4495697021484375, 0.46269989013671875, 0.475830078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 2.0, 5.0, 16.0, 11.0, 10.0, 28.0, 31.0, 43.0, 30.0, 33.0, 41.0, 63.0, 60.0, 55.0, 69.0, 63.0, 65.0, 55.0, 59.0, 46.0, 43.0, 45.0, 28.0, 19.0, 19.0, 17.0, 8.0, 14.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.15831375122070312, -0.15134429931640625, -0.14437484741210938, -0.1374053955078125, -0.13043594360351562, -0.12346649169921875, -0.11649703979492188, -0.109527587890625, -0.10255813598632812, -0.09558868408203125, -0.08861923217773438, -0.0816497802734375, -0.07468032836914062, -0.06771087646484375, -0.060741424560546875, -0.05377197265625, -0.046802520751953125, -0.03983306884765625, -0.032863616943359375, -0.0258941650390625, -0.018924713134765625, -0.01195526123046875, -0.004985809326171875, 0.001983642578125, 0.008953094482421875, 0.01592254638671875, 0.022891998291015625, 0.0298614501953125, 0.036830902099609375, 0.04380035400390625, 0.050769805908203125, 0.0577392578125, 0.06470870971679688, 0.07167816162109375, 0.07864761352539062, 0.0856170654296875, 0.09258651733398438, 0.09955596923828125, 0.10652542114257812, 0.113494873046875, 0.12046432495117188, 0.12743377685546875, 0.13440322875976562, 0.1413726806640625, 0.14834213256835938, 0.15531158447265625, 0.16228103637695312, 0.16925048828125, 0.17621994018554688, 0.18318939208984375, 0.19015884399414062, 0.1971282958984375, 0.20409774780273438, 0.21106719970703125, 0.21803665161132812, 0.225006103515625, 0.23197555541992188, 0.23894500732421875, 0.24591445922851562, 0.2528839111328125, 0.2598533630371094, 0.26682281494140625, 0.2737922668457031, 0.28076171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 9.0, 5.0, 9.0, 4.0, 9.0, 10.0, 14.0, 24.0, 28.0, 45.0, 67.0, 152.0, 258.0, 533.0, 1206.0, 3326.0, 12633.0, 95427.0, 770878.0, 141466.0, 15918.0, 3965.0, 1304.0, 580.0, 291.0, 142.0, 88.0, 54.0, 38.0, 14.0, 16.0, 5.0, 9.0, 7.0, 8.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.98193359375, -0.9543304443359375, -0.926727294921875, -0.8991241455078125, -0.87152099609375, -0.8439178466796875, -0.816314697265625, -0.7887115478515625, -0.7611083984375, -0.7335052490234375, -0.705902099609375, -0.6782989501953125, -0.65069580078125, -0.6230926513671875, -0.595489501953125, -0.5678863525390625, -0.540283203125, -0.5126800537109375, -0.485076904296875, -0.4574737548828125, -0.42987060546875, -0.4022674560546875, -0.374664306640625, -0.3470611572265625, -0.3194580078125, -0.2918548583984375, -0.264251708984375, -0.2366485595703125, -0.20904541015625, -0.1814422607421875, -0.153839111328125, -0.1262359619140625, -0.0986328125, -0.0710296630859375, -0.043426513671875, -0.0158233642578125, 0.01177978515625, 0.0393829345703125, 0.066986083984375, 0.0945892333984375, 0.1221923828125, 0.1497955322265625, 0.177398681640625, 0.2050018310546875, 0.23260498046875, 0.2602081298828125, 0.287811279296875, 0.3154144287109375, 0.343017578125, 0.3706207275390625, 0.398223876953125, 0.4258270263671875, 0.45343017578125, 0.4810333251953125, 0.508636474609375, 0.5362396240234375, 0.5638427734375, 0.5914459228515625, 0.619049072265625, 0.6466522216796875, 0.67425537109375, 0.7018585205078125, 0.729461669921875, 0.7570648193359375, 0.78466796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 8.0, 8.0, 16.0, 17.0, 24.0, 32.0, 48.0, 34.0, 50.0, 46.0, 53.0, 59.0, 82.0, 47.0, 69.0, 50.0, 74.0, 41.0, 47.0, 36.0, 23.0, 34.0, 16.0, 16.0, 12.0, 8.0, 11.0, 6.0, 8.0, 1.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.202850341796875, -1.16448974609375, -1.126129150390625, -1.0877685546875, -1.049407958984375, -1.01104736328125, -0.972686767578125, -0.934326171875, -0.895965576171875, -0.85760498046875, -0.819244384765625, -0.7808837890625, -0.742523193359375, -0.70416259765625, -0.665802001953125, -0.62744140625, -0.589080810546875, -0.55072021484375, -0.512359619140625, -0.4739990234375, -0.435638427734375, -0.39727783203125, -0.358917236328125, -0.320556640625, -0.282196044921875, -0.24383544921875, -0.205474853515625, -0.1671142578125, -0.128753662109375, -0.09039306640625, -0.052032470703125, -0.013671875, 0.024688720703125, 0.06304931640625, 0.101409912109375, 0.1397705078125, 0.178131103515625, 0.21649169921875, 0.254852294921875, 0.293212890625, 0.331573486328125, 0.36993408203125, 0.408294677734375, 0.4466552734375, 0.485015869140625, 0.52337646484375, 0.561737060546875, 0.60009765625, 0.638458251953125, 0.67681884765625, 0.715179443359375, 0.7535400390625, 0.791900634765625, 0.83026123046875, 0.868621826171875, 0.906982421875, 0.945343017578125, 0.98370361328125, 1.022064208984375, 1.0604248046875, 1.098785400390625, 1.13714599609375, 1.175506591796875, 1.2138671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 4.0, 2.0, 12.0, 16.0, 23.0, 44.0, 102.0, 231.0, 795.0, 5398.0, 665364.0, 371407.0, 4110.0, 650.0, 210.0, 85.0, 42.0, 23.0, 16.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4613533020019531, -0.43564605712890625, -0.4099388122558594, -0.3842315673828125, -0.3585243225097656, -0.33281707763671875, -0.3071098327636719, -0.281402587890625, -0.2556953430175781, -0.22998809814453125, -0.20428085327148438, -0.1785736083984375, -0.15286636352539062, -0.12715911865234375, -0.10145187377929688, -0.07574462890625, -0.050037384033203125, -0.02433013916015625, 0.001377105712890625, 0.0270843505859375, 0.052791595458984375, 0.07849884033203125, 0.10420608520507812, 0.129913330078125, 0.15562057495117188, 0.18132781982421875, 0.20703506469726562, 0.2327423095703125, 0.2584495544433594, 0.28415679931640625, 0.3098640441894531, 0.3355712890625, 0.3612785339355469, 0.38698577880859375, 0.4126930236816406, 0.4384002685546875, 0.4641075134277344, 0.48981475830078125, 0.5155220031738281, 0.541229248046875, 0.5669364929199219, 0.5926437377929688, 0.6183509826660156, 0.6440582275390625, 0.6697654724121094, 0.6954727172851562, 0.7211799621582031, 0.74688720703125, 0.7725944519042969, 0.7983016967773438, 0.8240089416503906, 0.8497161865234375, 0.8754234313964844, 0.9011306762695312, 0.9268379211425781, 0.952545166015625, 0.9782524108886719, 1.0039596557617188, 1.0296669006347656, 1.0553741455078125, 1.0810813903808594, 1.1067886352539062, 1.1324958801269531, 1.158203125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 3.0, 11.0, 27.0, 35.0, 45.0, 113.0, 182.0, 184.0, 122.0, 116.0, 64.0, 43.0, 25.0, 10.0, 5.0, 6.0, 6.0, 5.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2988529205322266e-05, -4.954729229211807e-05, -4.610605537891388e-05, -4.2664818465709686e-05, -3.922358155250549e-05, -3.57823446393013e-05, -3.234110772609711e-05, -2.8899870812892914e-05, -2.545863389968872e-05, -2.2017396986484528e-05, -1.8576160073280334e-05, -1.5134923160076141e-05, -1.1693686246871948e-05, -8.252449333667755e-06, -4.811212420463562e-06, -1.369975507259369e-06, 2.0712614059448242e-06, 5.512498319149017e-06, 8.95373523235321e-06, 1.2394972145557404e-05, 1.5836209058761597e-05, 1.927744597196579e-05, 2.2718682885169983e-05, 2.6159919798374176e-05, 2.960115671157837e-05, 3.304239362478256e-05, 3.6483630537986755e-05, 3.992486745119095e-05, 4.336610436439514e-05, 4.6807341277599335e-05, 5.024857819080353e-05, 5.368981510400772e-05, 5.7131052017211914e-05, 6.057228893041611e-05, 6.40135258436203e-05, 6.74547627568245e-05, 7.089599967002869e-05, 7.433723658323288e-05, 7.777847349643707e-05, 8.121971040964127e-05, 8.466094732284546e-05, 8.810218423604965e-05, 9.154342114925385e-05, 9.498465806245804e-05, 9.842589497566223e-05, 0.00010186713188886642, 0.00010530836880207062, 0.00010874960571527481, 0.000112190842628479, 0.0001156320795416832, 0.00011907331645488739, 0.00012251455336809158, 0.00012595579028129578, 0.00012939702719449997, 0.00013283826410770416, 0.00013627950102090836, 0.00013972073793411255, 0.00014316197484731674, 0.00014660321176052094, 0.00015004444867372513, 0.00015348568558692932, 0.00015692692250013351, 0.0001603681594133377, 0.0001638093963265419, 0.0001672506332397461]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 11.0, 19.0, 25.0, 40.0, 61.0, 120.0, 202.0, 682.0, 2736.0, 29988.0, 914601.0, 93991.0, 4549.0, 896.0, 292.0, 131.0, 65.0, 54.0, 29.0, 16.0, 16.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.573211669921875, -0.55169677734375, -0.530181884765625, -0.5086669921875, -0.487152099609375, -0.46563720703125, -0.444122314453125, -0.422607421875, -0.401092529296875, -0.37957763671875, -0.358062744140625, -0.3365478515625, -0.315032958984375, -0.29351806640625, -0.272003173828125, -0.25048828125, -0.228973388671875, -0.20745849609375, -0.185943603515625, -0.1644287109375, -0.142913818359375, -0.12139892578125, -0.099884033203125, -0.078369140625, -0.056854248046875, -0.03533935546875, -0.013824462890625, 0.0076904296875, 0.029205322265625, 0.05072021484375, 0.072235107421875, 0.09375, 0.115264892578125, 0.13677978515625, 0.158294677734375, 0.1798095703125, 0.201324462890625, 0.22283935546875, 0.244354248046875, 0.265869140625, 0.287384033203125, 0.30889892578125, 0.330413818359375, 0.3519287109375, 0.373443603515625, 0.39495849609375, 0.416473388671875, 0.43798828125, 0.459503173828125, 0.48101806640625, 0.502532958984375, 0.5240478515625, 0.545562744140625, 0.56707763671875, 0.588592529296875, 0.610107421875, 0.631622314453125, 0.65313720703125, 0.674652099609375, 0.6961669921875, 0.717681884765625, 0.73919677734375, 0.760711669921875, 0.7822265625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 14.0, 39.0, 63.0, 143.0, 242.0, 245.0, 135.0, 65.0, 31.0, 11.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4248046875, -0.3981170654296875, -0.371429443359375, -0.3447418212890625, -0.31805419921875, -0.2913665771484375, -0.264678955078125, -0.2379913330078125, -0.2113037109375, -0.1846160888671875, -0.157928466796875, -0.1312408447265625, -0.10455322265625, -0.0778656005859375, -0.051177978515625, -0.0244903564453125, 0.002197265625, 0.0288848876953125, 0.055572509765625, 0.0822601318359375, 0.10894775390625, 0.1356353759765625, 0.162322998046875, 0.1890106201171875, 0.2156982421875, 0.2423858642578125, 0.269073486328125, 0.2957611083984375, 0.32244873046875, 0.3491363525390625, 0.375823974609375, 0.4025115966796875, 0.42919921875, 0.4558868408203125, 0.482574462890625, 0.5092620849609375, 0.53594970703125, 0.5626373291015625, 0.589324951171875, 0.6160125732421875, 0.6427001953125, 0.6693878173828125, 0.696075439453125, 0.7227630615234375, 0.74945068359375, 0.7761383056640625, 0.802825927734375, 0.8295135498046875, 0.856201171875, 0.8828887939453125, 0.909576416015625, 0.9362640380859375, 0.96295166015625, 0.9896392822265625, 1.016326904296875, 1.0430145263671875, 1.0697021484375, 1.0963897705078125, 1.123077392578125, 1.1497650146484375, 1.17645263671875, 1.2031402587890625, 1.229827880859375, 1.2565155029296875, 1.283203125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 8.0, 6.0, 36.0, 69.0, 171.0, 265.0, 222.0, 130.0, 59.0, 21.0, 11.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.255622863769531, -3.984893798828125, -3.714164972305298, -3.4434361457824707, -3.1727070808410645, -2.901978015899658, -2.631249189376831, -2.360520362854004, -2.0897912979125977, -1.819062352180481, -1.5483334064483643, -1.2776044607162476, -1.0068755149841309, -0.7361465692520142, -0.46541762351989746, -0.19468867778778076, 0.07604026794433594, 0.34676921367645264, 0.6174981594085693, 0.888227105140686, 1.1589560508728027, 1.4296849966049194, 1.7004139423370361, 1.9711428880691528, 2.2418718338012695, 2.512600898742676, 2.783329725265503, 3.05405855178833, 3.3247876167297363, 3.5955166816711426, 3.8662455081939697, 4.136974334716797, 4.407703399658203, 4.678432464599609, 4.949161529541016, 5.219890117645264, 5.49061918258667, 5.761348247528076, 6.032076835632324, 6.3028059005737305, 6.573534965515137, 6.844264030456543, 7.114993095397949, 7.385721683502197, 7.6564507484436035, 7.92717981338501, 8.197908401489258, 8.468637466430664, 8.73936653137207, 9.010095596313477, 9.280824661254883, 9.551553726196289, 9.822282791137695, 10.093010902404785, 10.363739967346191, 10.634469032287598, 10.905198097229004, 11.17592716217041, 11.446656227111816, 11.717385292053223, 11.988113403320312, 12.258842468261719, 12.529571533203125, 12.800300598144531, 13.071029663085938]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 6.0, 9.0, 13.0, 20.0, 26.0, 35.0, 33.0, 42.0, 45.0, 57.0, 70.0, 74.0, 80.0, 61.0, 63.0, 55.0, 50.0, 52.0, 33.0, 24.0, 25.0, 32.0, 18.0, 17.0, 16.0, 6.0, 11.0, 8.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30012321472168, -4.128546714782715, -3.956969976425171, -3.785393238067627, -3.613816738128662, -3.4422402381896973, -3.2706634998321533, -3.0990867614746094, -2.9275102615356445, -2.7559337615966797, -2.5843570232391357, -2.412780284881592, -2.241203784942627, -2.069627285003662, -1.8980505466461182, -1.7264739274978638, -1.5548973083496094, -1.383320689201355, -1.2117440700531006, -1.0401674509048462, -0.8685908317565918, -0.6970142126083374, -0.525437593460083, -0.3538609743118286, -0.18228435516357422, -0.010707736015319824, 0.16086888313293457, 0.33244550228118896, 0.5040221214294434, 0.6755987405776978, 0.8471753597259521, 1.0187519788742065, 1.1903281211853027, 1.3619047403335571, 1.5334813594818115, 1.705057978630066, 1.8766345977783203, 2.048211097717285, 2.219787836074829, 2.391364574432373, 2.562941074371338, 2.7345175743103027, 2.9060943126678467, 3.0776710510253906, 3.2492475509643555, 3.4208240509033203, 3.5924007892608643, 3.763977527618408, 3.935554027557373, 4.107130527496338, 4.278707504272461, 4.450284004211426, 4.621860504150391, 4.7934370040893555, 4.96501350402832, 5.136590480804443, 5.308166980743408, 5.479743480682373, 5.651320457458496, 5.822896957397461, 5.994473457336426, 6.166049957275391, 6.3376264572143555, 6.5092034339904785, 6.680779933929443]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 10.0, 5.0, 7.0, 6.0, 16.0, 24.0, 25.0, 21.0, 39.0, 46.0, 80.0, 161.0, 314.0, 744.0, 2592.0, 16568.0, 4082574.0, 83068.0, 5415.0, 1371.0, 504.0, 239.0, 136.0, 101.0, 65.0, 37.0, 25.0, 33.0, 13.0, 6.0, 11.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.96875, -0.940032958984375, -0.91131591796875, -0.882598876953125, -0.8538818359375, -0.825164794921875, -0.79644775390625, -0.767730712890625, -0.739013671875, -0.710296630859375, -0.68157958984375, -0.652862548828125, -0.6241455078125, -0.595428466796875, -0.56671142578125, -0.537994384765625, -0.50927734375, -0.480560302734375, -0.45184326171875, -0.423126220703125, -0.3944091796875, -0.365692138671875, -0.33697509765625, -0.308258056640625, -0.279541015625, -0.250823974609375, -0.22210693359375, -0.193389892578125, -0.1646728515625, -0.135955810546875, -0.10723876953125, -0.078521728515625, -0.0498046875, -0.021087646484375, 0.00762939453125, 0.036346435546875, 0.0650634765625, 0.093780517578125, 0.12249755859375, 0.151214599609375, 0.179931640625, 0.208648681640625, 0.23736572265625, 0.266082763671875, 0.2947998046875, 0.323516845703125, 0.35223388671875, 0.380950927734375, 0.40966796875, 0.438385009765625, 0.46710205078125, 0.495819091796875, 0.5245361328125, 0.553253173828125, 0.58197021484375, 0.610687255859375, 0.639404296875, 0.668121337890625, 0.69683837890625, 0.725555419921875, 0.7542724609375, 0.782989501953125, 0.81170654296875, 0.840423583984375, 0.869140625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 14.0, 31.0, 37.0, 78.0, 85.0, 99.0, 133.0, 123.0, 116.0, 96.0, 48.0, 35.0, 32.0, 21.0, 12.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324951171875, -0.3095359802246094, -0.29412078857421875, -0.2787055969238281, -0.2632904052734375, -0.24787521362304688, -0.23246002197265625, -0.21704483032226562, -0.201629638671875, -0.18621444702148438, -0.17079925537109375, -0.15538406372070312, -0.1399688720703125, -0.12455368041992188, -0.10913848876953125, -0.09372329711914062, -0.07830810546875, -0.06289291381835938, -0.04747772216796875, -0.032062530517578125, -0.0166473388671875, -0.001232147216796875, 0.01418304443359375, 0.029598236083984375, 0.045013427734375, 0.060428619384765625, 0.07584381103515625, 0.09125900268554688, 0.1066741943359375, 0.12208938598632812, 0.13750457763671875, 0.15291976928710938, 0.1683349609375, 0.18375015258789062, 0.19916534423828125, 0.21458053588867188, 0.2299957275390625, 0.24541091918945312, 0.26082611083984375, 0.2762413024902344, 0.291656494140625, 0.3070716857910156, 0.32248687744140625, 0.3379020690917969, 0.3533172607421875, 0.3687324523925781, 0.38414764404296875, 0.3995628356933594, 0.41497802734375, 0.4303932189941406, 0.44580841064453125, 0.4612236022949219, 0.4766387939453125, 0.4920539855957031, 0.5074691772460938, 0.5228843688964844, 0.538299560546875, 0.5537147521972656, 0.5691299438476562, 0.5845451354980469, 0.5999603271484375, 0.6153755187988281, 0.6307907104492188, 0.6462059020996094, 0.66162109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 13.0, 9.0, 17.0, 22.0, 29.0, 28.0, 50.0, 84.0, 101.0, 134.0, 210.0, 300.0, 443.0, 758.0, 1268.0, 2486.0, 5060.0, 14470.0, 75124.0, 3784488.0, 265599.0, 27448.0, 8069.0, 3469.0, 1733.0, 968.0, 613.0, 391.0, 285.0, 169.0, 126.0, 83.0, 61.0, 39.0, 29.0, 29.0, 21.0, 14.0, 11.0, 7.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.57666015625, -0.5595626831054688, -0.5424652099609375, -0.5253677368164062, -0.508270263671875, -0.49117279052734375, -0.4740753173828125, -0.45697784423828125, -0.43988037109375, -0.42278289794921875, -0.4056854248046875, -0.38858795166015625, -0.371490478515625, -0.35439300537109375, -0.3372955322265625, -0.32019805908203125, -0.3031005859375, -0.28600311279296875, -0.2689056396484375, -0.25180816650390625, -0.234710693359375, -0.21761322021484375, -0.2005157470703125, -0.18341827392578125, -0.16632080078125, -0.14922332763671875, -0.1321258544921875, -0.11502838134765625, -0.097930908203125, -0.08083343505859375, -0.0637359619140625, -0.04663848876953125, -0.029541015625, -0.01244354248046875, 0.0046539306640625, 0.02175140380859375, 0.038848876953125, 0.05594635009765625, 0.0730438232421875, 0.09014129638671875, 0.10723876953125, 0.12433624267578125, 0.1414337158203125, 0.15853118896484375, 0.175628662109375, 0.19272613525390625, 0.2098236083984375, 0.22692108154296875, 0.2440185546875, 0.26111602783203125, 0.2782135009765625, 0.29531097412109375, 0.312408447265625, 0.32950592041015625, 0.3466033935546875, 0.36370086669921875, 0.38079833984375, 0.39789581298828125, 0.4149932861328125, 0.43209075927734375, 0.449188232421875, 0.46628570556640625, 0.4833831787109375, 0.5004806518554688, 0.517578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 13.0, 37.0, 51.0, 122.0, 353.0, 2812.0, 381.0, 111.0, 70.0, 29.0, 17.0, 9.0, 14.0, 11.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11187744140625, -0.10712146759033203, -0.10236549377441406, -0.0976095199584961, -0.09285354614257812, -0.08809757232666016, -0.08334159851074219, -0.07858562469482422, -0.07382965087890625, -0.06907367706298828, -0.06431770324707031, -0.059561729431152344, -0.054805755615234375, -0.050049781799316406, -0.04529380798339844, -0.04053783416748047, -0.0357818603515625, -0.03102588653564453, -0.026269912719726562, -0.021513938903808594, -0.016757965087890625, -0.012001991271972656, -0.0072460174560546875, -0.0024900436401367188, 0.00226593017578125, 0.007021903991699219, 0.011777877807617188, 0.016533851623535156, 0.021289825439453125, 0.026045799255371094, 0.030801773071289062, 0.03555774688720703, 0.040313720703125, 0.04506969451904297, 0.04982566833496094, 0.054581642150878906, 0.059337615966796875, 0.06409358978271484, 0.06884956359863281, 0.07360553741455078, 0.07836151123046875, 0.08311748504638672, 0.08787345886230469, 0.09262943267822266, 0.09738540649414062, 0.1021413803100586, 0.10689735412597656, 0.11165332794189453, 0.1164093017578125, 0.12116527557373047, 0.12592124938964844, 0.1306772232055664, 0.13543319702148438, 0.14018917083740234, 0.1449451446533203, 0.14970111846923828, 0.15445709228515625, 0.15921306610107422, 0.1639690399169922, 0.16872501373291016, 0.17348098754882812, 0.1782369613647461, 0.18299293518066406, 0.18774890899658203, 0.1925048828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 13.0, 28.0, 64.0, 189.0, 246.0, 189.0, 134.0, 49.0, 39.0, 19.0, 8.0, 4.0, 3.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.678025722503662, -1.6373077630996704, -1.5965898036956787, -1.5558717250823975, -1.5151537656784058, -1.474435806274414, -1.4337178468704224, -1.3929998874664307, -1.3522818088531494, -1.3115638494491577, -1.270845890045166, -1.2301278114318848, -1.189409852027893, -1.1486918926239014, -1.1079739332199097, -1.067255973815918, -1.0265380144119263, -0.9858200550079346, -0.9451020359992981, -0.9043840765953064, -0.8636660575866699, -0.8229480981826782, -0.7822301387786865, -0.7415121793746948, -0.7007941603660583, -0.6600762009620667, -0.6193581819534302, -0.5786402225494385, -0.5379222631454468, -0.4972042441368103, -0.4564862847328186, -0.4157682955265045, -0.3750503659248352, -0.3343323767185211, -0.29361438751220703, -0.25289642810821533, -0.21217843890190125, -0.17146044969558716, -0.13074247539043427, -0.09002450108528137, -0.049306511878967285, -0.008588530123233795, 0.032129451632499695, 0.07284743338823318, 0.11356541514396667, 0.15428340435028076, 0.19500137865543365, 0.23571935296058655, 0.27643734216690063, 0.3171553313732147, 0.3578733205795288, 0.3985912799835205, 0.4393092691898346, 0.4800272583961487, 0.5207452178001404, 0.5614632368087769, 0.6021811962127686, 0.6428991556167603, 0.6836171746253967, 0.7243351340293884, 0.7650531530380249, 0.8057711124420166, 0.8464890718460083, 0.88720703125, 0.9279250502586365]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 18.0, 7.0, 10.0, 17.0, 26.0, 21.0, 34.0, 19.0, 20.0, 31.0, 29.0, 37.0, 45.0, 51.0, 35.0, 49.0, 44.0, 38.0, 44.0, 43.0, 44.0, 42.0, 33.0, 40.0, 38.0, 26.0, 28.0, 21.0, 20.0, 20.0, 19.0, 14.0, 10.0, 4.0, 8.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47067564725875854, -0.45612066984176636, -0.44156569242477417, -0.427010715007782, -0.4124557375907898, -0.3979007601737976, -0.3833457827568054, -0.36879080533981323, -0.35423582792282104, -0.33968085050582886, -0.32512587308883667, -0.3105708956718445, -0.2960159182548523, -0.2814609408378601, -0.2669059634208679, -0.25235098600387573, -0.23779603838920593, -0.22324106097221375, -0.20868608355522156, -0.19413110613822937, -0.17957612872123718, -0.165021151304245, -0.150466188788414, -0.13591121137142181, -0.12135623395442963, -0.10680125653743744, -0.09224627912044525, -0.07769130915403366, -0.06313633173704147, -0.048581354320049286, -0.034026384353637695, -0.019471406936645508, -0.00491642951965332, 0.009638546034693718, 0.024193521589040756, 0.038748495280742645, 0.05330347269773483, 0.06785845011472702, 0.08241342008113861, 0.0969683974981308, 0.11152337491512299, 0.12607835233211517, 0.14063332974910736, 0.15518829226493835, 0.16974326968193054, 0.18429824709892273, 0.19885322451591492, 0.2134082019329071, 0.2279631793498993, 0.24251815676689148, 0.25707313418388367, 0.27162811160087585, 0.28618308901786804, 0.30073806643486023, 0.31529301404953003, 0.3298479914665222, 0.3444029688835144, 0.3589579463005066, 0.3735129237174988, 0.38806790113449097, 0.40262287855148315, 0.41717785596847534, 0.43173283338546753, 0.4462878108024597, 0.4608427882194519]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 9.0, 11.0, 20.0, 14.0, 16.0, 31.0, 27.0, 34.0, 68.0, 75.0, 108.0, 170.0, 295.0, 517.0, 1043.0, 2507.0, 6897.0, 23039.0, 97423.0, 421985.0, 378949.0, 84466.0, 20340.0, 5950.0, 2261.0, 994.0, 491.0, 248.0, 161.0, 104.0, 57.0, 58.0, 35.0, 28.0, 30.0, 17.0, 16.0, 11.0, 8.0, 7.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.443115234375, -0.4287986755371094, -0.41448211669921875, -0.4001655578613281, -0.3858489990234375, -0.3715324401855469, -0.35721588134765625, -0.3428993225097656, -0.328582763671875, -0.3142662048339844, -0.29994964599609375, -0.2856330871582031, -0.2713165283203125, -0.2569999694824219, -0.24268341064453125, -0.22836685180664062, -0.21405029296875, -0.19973373413085938, -0.18541717529296875, -0.17110061645507812, -0.1567840576171875, -0.14246749877929688, -0.12815093994140625, -0.11383438110351562, -0.099517822265625, -0.08520126342773438, -0.07088470458984375, -0.056568145751953125, -0.0422515869140625, -0.027935028076171875, -0.01361846923828125, 0.000698089599609375, 0.0150146484375, 0.029331207275390625, 0.04364776611328125, 0.057964324951171875, 0.0722808837890625, 0.08659744262695312, 0.10091400146484375, 0.11523056030273438, 0.129547119140625, 0.14386367797851562, 0.15818023681640625, 0.17249679565429688, 0.1868133544921875, 0.20112991333007812, 0.21544647216796875, 0.22976303100585938, 0.24407958984375, 0.2583961486816406, 0.27271270751953125, 0.2870292663574219, 0.3013458251953125, 0.3156623840332031, 0.32997894287109375, 0.3442955017089844, 0.358612060546875, 0.3729286193847656, 0.38724517822265625, 0.4015617370605469, 0.4158782958984375, 0.4301948547363281, 0.44451141357421875, 0.4588279724121094, 0.47314453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 11.0, 8.0, 25.0, 33.0, 50.0, 71.0, 89.0, 97.0, 124.0, 101.0, 112.0, 85.0, 67.0, 37.0, 23.0, 23.0, 17.0, 14.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31689453125, -0.3018341064453125, -0.286773681640625, -0.2717132568359375, -0.25665283203125, -0.2415924072265625, -0.226531982421875, -0.2114715576171875, -0.1964111328125, -0.1813507080078125, -0.166290283203125, -0.1512298583984375, -0.13616943359375, -0.1211090087890625, -0.106048583984375, -0.0909881591796875, -0.075927734375, -0.0608673095703125, -0.045806884765625, -0.0307464599609375, -0.01568603515625, -0.0006256103515625, 0.014434814453125, 0.0294952392578125, 0.0445556640625, 0.0596160888671875, 0.074676513671875, 0.0897369384765625, 0.10479736328125, 0.1198577880859375, 0.134918212890625, 0.1499786376953125, 0.1650390625, 0.1800994873046875, 0.195159912109375, 0.2102203369140625, 0.22528076171875, 0.2403411865234375, 0.255401611328125, 0.2704620361328125, 0.2855224609375, 0.3005828857421875, 0.315643310546875, 0.3307037353515625, 0.34576416015625, 0.3608245849609375, 0.375885009765625, 0.3909454345703125, 0.406005859375, 0.4210662841796875, 0.436126708984375, 0.4511871337890625, 0.46624755859375, 0.4813079833984375, 0.496368408203125, 0.5114288330078125, 0.5264892578125, 0.5415496826171875, 0.556610107421875, 0.5716705322265625, 0.58673095703125, 0.6017913818359375, 0.616851806640625, 0.6319122314453125, 0.64697265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 3.0, 17.0, 19.0, 21.0, 37.0, 46.0, 76.0, 126.0, 249.0, 457.0, 912.0, 2411.0, 8361.0, 52865.0, 691080.0, 260783.0, 23040.0, 4966.0, 1566.0, 703.0, 307.0, 187.0, 110.0, 74.0, 37.0, 27.0, 19.0, 14.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.88427734375, -0.8588638305664062, -0.8334503173828125, -0.8080368041992188, -0.782623291015625, -0.7572097778320312, -0.7317962646484375, -0.7063827514648438, -0.68096923828125, -0.6555557250976562, -0.6301422119140625, -0.6047286987304688, -0.579315185546875, -0.5539016723632812, -0.5284881591796875, -0.5030746459960938, -0.4776611328125, -0.45224761962890625, -0.4268341064453125, -0.40142059326171875, -0.376007080078125, -0.35059356689453125, -0.3251800537109375, -0.29976654052734375, -0.27435302734375, -0.24893951416015625, -0.2235260009765625, -0.19811248779296875, -0.172698974609375, -0.14728546142578125, -0.1218719482421875, -0.09645843505859375, -0.071044921875, -0.04563140869140625, -0.0202178955078125, 0.00519561767578125, 0.030609130859375, 0.05602264404296875, 0.0814361572265625, 0.10684967041015625, 0.13226318359375, 0.15767669677734375, 0.1830902099609375, 0.20850372314453125, 0.233917236328125, 0.25933074951171875, 0.2847442626953125, 0.31015777587890625, 0.3355712890625, 0.36098480224609375, 0.3863983154296875, 0.41181182861328125, 0.437225341796875, 0.46263885498046875, 0.4880523681640625, 0.5134658813476562, 0.53887939453125, 0.5642929077148438, 0.5897064208984375, 0.6151199340820312, 0.640533447265625, 0.6659469604492188, 0.6913604736328125, 0.7167739868164062, 0.7421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 8.0, 3.0, 5.0, 8.0, 15.0, 18.0, 28.0, 17.0, 42.0, 53.0, 48.0, 44.0, 61.0, 59.0, 65.0, 64.0, 57.0, 60.0, 52.0, 45.0, 56.0, 37.0, 23.0, 22.0, 26.0, 19.0, 19.0, 8.0, 8.0, 4.0, 3.0, 5.0, 4.0, 5.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.087890625, -1.04608154296875, -1.0042724609375, -0.96246337890625, -0.920654296875, -0.87884521484375, -0.8370361328125, -0.79522705078125, -0.75341796875, -0.71160888671875, -0.6697998046875, -0.62799072265625, -0.586181640625, -0.54437255859375, -0.5025634765625, -0.46075439453125, -0.4189453125, -0.37713623046875, -0.3353271484375, -0.29351806640625, -0.251708984375, -0.20989990234375, -0.1680908203125, -0.12628173828125, -0.08447265625, -0.04266357421875, -0.0008544921875, 0.04095458984375, 0.082763671875, 0.12457275390625, 0.1663818359375, 0.20819091796875, 0.25, 0.29180908203125, 0.3336181640625, 0.37542724609375, 0.417236328125, 0.45904541015625, 0.5008544921875, 0.54266357421875, 0.58447265625, 0.62628173828125, 0.6680908203125, 0.70989990234375, 0.751708984375, 0.79351806640625, 0.8353271484375, 0.87713623046875, 0.9189453125, 0.96075439453125, 1.0025634765625, 1.04437255859375, 1.086181640625, 1.12799072265625, 1.1697998046875, 1.21160888671875, 1.25341796875, 1.29522705078125, 1.3370361328125, 1.37884521484375, 1.420654296875, 1.46246337890625, 1.5042724609375, 1.54608154296875, 1.587890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 9.0, 6.0, 12.0, 12.0, 28.0, 59.0, 93.0, 238.0, 643.0, 2283.0, 25706.0, 936885.0, 77546.0, 3615.0, 846.0, 285.0, 115.0, 71.0, 39.0, 20.0, 9.0, 7.0, 8.0, 7.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.484619140625, -0.4697685241699219, -0.45491790771484375, -0.4400672912597656, -0.4252166748046875, -0.4103660583496094, -0.39551544189453125, -0.3806648254394531, -0.365814208984375, -0.3509635925292969, -0.33611297607421875, -0.3212623596191406, -0.3064117431640625, -0.2915611267089844, -0.27671051025390625, -0.2618598937988281, -0.24700927734375, -0.23215866088867188, -0.21730804443359375, -0.20245742797851562, -0.1876068115234375, -0.17275619506835938, -0.15790557861328125, -0.14305496215820312, -0.128204345703125, -0.11335372924804688, -0.09850311279296875, -0.08365249633789062, -0.0688018798828125, -0.053951263427734375, -0.03910064697265625, -0.024250030517578125, -0.0093994140625, 0.005451202392578125, 0.02030181884765625, 0.035152435302734375, 0.0500030517578125, 0.06485366821289062, 0.07970428466796875, 0.09455490112304688, 0.109405517578125, 0.12425613403320312, 0.13910675048828125, 0.15395736694335938, 0.1688079833984375, 0.18365859985351562, 0.19850921630859375, 0.21335983276367188, 0.22821044921875, 0.24306106567382812, 0.25791168212890625, 0.2727622985839844, 0.2876129150390625, 0.3024635314941406, 0.31731414794921875, 0.3321647644042969, 0.347015380859375, 0.3618659973144531, 0.37671661376953125, 0.3915672302246094, 0.4064178466796875, 0.4212684631347656, 0.43611907958984375, 0.4509696960449219, 0.4658203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 9.0, 8.0, 18.0, 17.0, 36.0, 44.0, 51.0, 70.0, 88.0, 130.0, 111.0, 91.0, 80.0, 59.0, 54.0, 37.0, 28.0, 19.0, 9.0, 19.0, 11.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.343292236328125e-05, -7.178541272878647e-05, -7.013790309429169e-05, -6.84903934597969e-05, -6.684288382530212e-05, -6.519537419080734e-05, -6.354786455631256e-05, -6.190035492181778e-05, -6.0252845287323e-05, -5.8605335652828217e-05, -5.6957826018333435e-05, -5.5310316383838654e-05, -5.366280674934387e-05, -5.201529711484909e-05, -5.036778748035431e-05, -4.872027784585953e-05, -4.7072768211364746e-05, -4.5425258576869965e-05, -4.377774894237518e-05, -4.21302393078804e-05, -4.048272967338562e-05, -3.883522003889084e-05, -3.718771040439606e-05, -3.5540200769901276e-05, -3.3892691135406494e-05, -3.224518150091171e-05, -3.059767186641693e-05, -2.895016223192215e-05, -2.7302652597427368e-05, -2.5655142962932587e-05, -2.4007633328437805e-05, -2.2360123693943024e-05, -2.0712614059448242e-05, -1.906510442495346e-05, -1.741759479045868e-05, -1.5770085155963898e-05, -1.4122575521469116e-05, -1.2475065886974335e-05, -1.0827556252479553e-05, -9.180046617984772e-06, -7.53253698348999e-06, -5.885027348995209e-06, -4.237517714500427e-06, -2.5900080800056458e-06, -9.424984455108643e-07, 7.050111889839172e-07, 2.3525208234786987e-06, 4.00003045797348e-06, 5.647540092468262e-06, 7.295049726963043e-06, 8.942559361457825e-06, 1.0590068995952606e-05, 1.2237578630447388e-05, 1.388508826494217e-05, 1.553259789943695e-05, 1.7180107533931732e-05, 1.8827617168426514e-05, 2.0475126802921295e-05, 2.2122636437416077e-05, 2.3770146071910858e-05, 2.541765570640564e-05, 2.706516534090042e-05, 2.8712674975395203e-05, 3.0360184609889984e-05, 3.2007694244384766e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 11.0, 20.0, 32.0, 39.0, 52.0, 92.0, 163.0, 346.0, 600.0, 1410.0, 4160.0, 18859.0, 176557.0, 734510.0, 93981.0, 12280.0, 3109.0, 1158.0, 572.0, 271.0, 133.0, 57.0, 43.0, 23.0, 25.0, 8.0, 9.0, 1.0, 5.0, 6.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2281494140625, -0.2194995880126953, -0.21084976196289062, -0.20219993591308594, -0.19355010986328125, -0.18490028381347656, -0.17625045776367188, -0.1676006317138672, -0.1589508056640625, -0.1503009796142578, -0.14165115356445312, -0.13300132751464844, -0.12435150146484375, -0.11570167541503906, -0.10705184936523438, -0.09840202331542969, -0.089752197265625, -0.08110237121582031, -0.07245254516601562, -0.06380271911621094, -0.05515289306640625, -0.04650306701660156, -0.037853240966796875, -0.029203414916992188, -0.0205535888671875, -0.011903762817382812, -0.003253936767578125, 0.0053958892822265625, 0.01404571533203125, 0.022695541381835938, 0.031345367431640625, 0.03999519348144531, 0.04864501953125, 0.05729484558105469, 0.06594467163085938, 0.07459449768066406, 0.08324432373046875, 0.09189414978027344, 0.10054397583007812, 0.10919380187988281, 0.1178436279296875, 0.1264934539794922, 0.13514328002929688, 0.14379310607910156, 0.15244293212890625, 0.16109275817871094, 0.16974258422851562, 0.1783924102783203, 0.187042236328125, 0.1956920623779297, 0.20434188842773438, 0.21299171447753906, 0.22164154052734375, 0.23029136657714844, 0.23894119262695312, 0.2475910186767578, 0.2562408447265625, 0.2648906707763672, 0.2735404968261719, 0.28219032287597656, 0.29084014892578125, 0.29948997497558594, 0.3081398010253906, 0.3167896270751953, 0.325439453125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 11.0, 15.0, 12.0, 17.0, 26.0, 37.0, 55.0, 61.0, 73.0, 83.0, 106.0, 88.0, 104.0, 80.0, 60.0, 52.0, 31.0, 19.0, 19.0, 14.0, 8.0, 11.0, 8.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.291259765625, -0.28357696533203125, -0.2758941650390625, -0.26821136474609375, -0.260528564453125, -0.25284576416015625, -0.2451629638671875, -0.23748016357421875, -0.22979736328125, -0.22211456298828125, -0.2144317626953125, -0.20674896240234375, -0.199066162109375, -0.19138336181640625, -0.1837005615234375, -0.17601776123046875, -0.1683349609375, -0.16065216064453125, -0.1529693603515625, -0.14528656005859375, -0.137603759765625, -0.12992095947265625, -0.1222381591796875, -0.11455535888671875, -0.10687255859375, -0.09918975830078125, -0.0915069580078125, -0.08382415771484375, -0.076141357421875, -0.06845855712890625, -0.0607757568359375, -0.05309295654296875, -0.04541015625, -0.03772735595703125, -0.0300445556640625, -0.02236175537109375, -0.014678955078125, -0.00699615478515625, 0.0006866455078125, 0.00836944580078125, 0.01605224609375, 0.02373504638671875, 0.0314178466796875, 0.03910064697265625, 0.046783447265625, 0.05446624755859375, 0.0621490478515625, 0.06983184814453125, 0.0775146484375, 0.08519744873046875, 0.0928802490234375, 0.10056304931640625, 0.108245849609375, 0.11592864990234375, 0.1236114501953125, 0.13129425048828125, 0.13897705078125, 0.14665985107421875, 0.1543426513671875, 0.16202545166015625, 0.169708251953125, 0.17739105224609375, 0.1850738525390625, 0.19275665283203125, 0.200439453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 35.0, 61.0, 189.0, 297.0, 251.0, 90.0, 38.0, 19.0, 7.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.559494972229004, -10.306618690490723, -10.053741455078125, -9.800865173339844, -9.547987937927246, -9.295111656188965, -9.042234420776367, -8.789358139038086, -8.536481857299805, -8.283605575561523, -8.030728340148926, -7.777851581573486, -7.524974822998047, -7.272098541259766, -7.019221782684326, -6.766345024108887, -6.513467788696289, -6.26059103012085, -6.00771427154541, -5.754837512969971, -5.501960754394531, -5.24908447265625, -4.9962077140808105, -4.743330955505371, -4.490454196929932, -4.237577438354492, -3.9847006797790527, -3.7318241596221924, -3.478947401046753, -3.2260706424713135, -2.973194122314453, -2.7203173637390137, -2.4674415588378906, -2.214564800262451, -1.9616881608963013, -1.7088115215301514, -1.455934762954712, -1.2030580043792725, -0.9501813650131226, -0.6973047256469727, -0.4444279670715332, -0.19155126810073853, 0.06132543087005615, 0.31420212984085083, 0.5670788288116455, 0.819955587387085, 1.0728322267532349, 1.3257088661193848, 1.5785856246948242, 1.8314623832702637, 2.084339141845703, 2.3372156620025635, 2.590092420578003, 2.8429691791534424, 3.0958456993103027, 3.348722457885742, 3.6015992164611816, 3.854475975036621, 4.1073527336120605, 4.3602294921875, 4.613105773925781, 4.865983009338379, 5.11885929107666, 5.3717360496521, 5.624612808227539]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 10.0, 14.0, 10.0, 6.0, 19.0, 10.0, 18.0, 19.0, 24.0, 34.0, 28.0, 44.0, 37.0, 46.0, 42.0, 48.0, 63.0, 58.0, 41.0, 55.0, 41.0, 49.0, 38.0, 41.0, 41.0, 32.0, 27.0, 10.0, 16.0, 10.0, 16.0, 6.0, 9.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 5.0, 2.0, 6.0], "bins": [-5.251676559448242, -5.118388652801514, -4.985100746154785, -4.851812839508057, -4.718524932861328, -4.5852370262146, -4.451949119567871, -4.318661212921143, -4.185373306274414, -4.0520853996276855, -3.918797492980957, -3.7855095863342285, -3.6522216796875, -3.5189337730407715, -3.385645866394043, -3.2523579597473145, -3.119070291519165, -2.9857823848724365, -2.852494478225708, -2.7192065715789795, -2.585918664932251, -2.4526307582855225, -2.319343090057373, -2.1860551834106445, -2.052767276763916, -1.9194793701171875, -1.786191463470459, -1.6529035568237305, -1.519615650177002, -1.3863277435302734, -1.2530399560928345, -1.119752049446106, -0.9864640235900879, -0.8531761169433594, -0.7198882102966309, -0.5866003632545471, -0.4533124566078186, -0.3200245499610901, -0.18673670291900635, -0.05344879627227783, 0.07983911037445068, 0.213127002120018, 0.3464148938655853, 0.47970277070999146, 0.61299067735672, 0.7462785840034485, 0.8795664310455322, 1.0128543376922607, 1.1461422443389893, 1.2794301509857178, 1.4127180576324463, 1.5460059642791748, 1.6792938709259033, 1.8125817775726318, 1.9458695650100708, 2.0791573524475098, 2.2124452590942383, 2.345733165740967, 2.4790210723876953, 2.612308979034424, 2.7455968856811523, 2.878884792327881, 3.0121726989746094, 3.145460605621338, 3.2787485122680664]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 14.0, 21.0, 24.0, 31.0, 63.0, 103.0, 190.0, 423.0, 851.0, 1957.0, 6247.0, 49217.0, 4013961.0, 107175.0, 9305.0, 2501.0, 1033.0, 500.0, 256.0, 151.0, 102.0, 47.0, 35.0, 16.0, 13.0, 12.0, 8.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.57861328125, -0.5608749389648438, -0.5431365966796875, -0.5253982543945312, -0.507659912109375, -0.48992156982421875, -0.4721832275390625, -0.45444488525390625, -0.43670654296875, -0.41896820068359375, -0.4012298583984375, -0.38349151611328125, -0.365753173828125, -0.34801483154296875, -0.3302764892578125, -0.31253814697265625, -0.2947998046875, -0.27706146240234375, -0.2593231201171875, -0.24158477783203125, -0.223846435546875, -0.20610809326171875, -0.1883697509765625, -0.17063140869140625, -0.15289306640625, -0.13515472412109375, -0.1174163818359375, -0.09967803955078125, -0.081939697265625, -0.06420135498046875, -0.0464630126953125, -0.02872467041015625, -0.010986328125, 0.00675201416015625, 0.0244903564453125, 0.04222869873046875, 0.059967041015625, 0.07770538330078125, 0.0954437255859375, 0.11318206787109375, 0.13092041015625, 0.14865875244140625, 0.1663970947265625, 0.18413543701171875, 0.201873779296875, 0.21961212158203125, 0.2373504638671875, 0.25508880615234375, 0.2728271484375, 0.29056549072265625, 0.3083038330078125, 0.32604217529296875, 0.343780517578125, 0.36151885986328125, 0.3792572021484375, 0.39699554443359375, 0.41473388671875, 0.43247222900390625, 0.4502105712890625, 0.46794891357421875, 0.485687255859375, 0.5034255981445312, 0.5211639404296875, 0.5389022827148438, 0.556640625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 8.0, 9.0, 17.0, 27.0, 40.0, 62.0, 70.0, 62.0, 82.0, 110.0, 107.0, 74.0, 83.0, 63.0, 53.0, 51.0, 19.0, 20.0, 14.0, 10.0, 3.0, 7.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27978515625, -0.2677268981933594, -0.25566864013671875, -0.24361038208007812, -0.2315521240234375, -0.21949386596679688, -0.20743560791015625, -0.19537734985351562, -0.183319091796875, -0.17126083374023438, -0.15920257568359375, -0.14714431762695312, -0.1350860595703125, -0.12302780151367188, -0.11096954345703125, -0.09891128540039062, -0.08685302734375, -0.07479476928710938, -0.06273651123046875, -0.050678253173828125, -0.0386199951171875, -0.026561737060546875, -0.01450347900390625, -0.002445220947265625, 0.009613037109375, 0.021671295166015625, 0.03372955322265625, 0.045787811279296875, 0.0578460693359375, 0.06990432739257812, 0.08196258544921875, 0.09402084350585938, 0.1060791015625, 0.11813735961914062, 0.13019561767578125, 0.14225387573242188, 0.1543121337890625, 0.16637039184570312, 0.17842864990234375, 0.19048690795898438, 0.202545166015625, 0.21460342407226562, 0.22666168212890625, 0.23871994018554688, 0.2507781982421875, 0.2628364562988281, 0.27489471435546875, 0.2869529724121094, 0.29901123046875, 0.3110694885253906, 0.32312774658203125, 0.3351860046386719, 0.3472442626953125, 0.3593025207519531, 0.37136077880859375, 0.3834190368652344, 0.395477294921875, 0.4075355529785156, 0.41959381103515625, 0.4316520690917969, 0.4437103271484375, 0.4557685852050781, 0.46782684326171875, 0.4798851013183594, 0.491943359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 3.0, 4.0, 6.0, 10.0, 10.0, 19.0, 30.0, 39.0, 58.0, 96.0, 129.0, 183.0, 290.0, 513.0, 863.0, 1711.0, 4036.0, 15117.0, 171748.0, 3908080.0, 74756.0, 10162.0, 3046.0, 1421.0, 741.0, 415.0, 260.0, 173.0, 107.0, 82.0, 55.0, 33.0, 32.0, 14.0, 12.0, 11.0, 4.0, 8.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.63623046875, -0.6159515380859375, -0.595672607421875, -0.5753936767578125, -0.55511474609375, -0.5348358154296875, -0.514556884765625, -0.4942779541015625, -0.4739990234375, -0.4537200927734375, -0.433441162109375, -0.4131622314453125, -0.39288330078125, -0.3726043701171875, -0.352325439453125, -0.3320465087890625, -0.311767578125, -0.2914886474609375, -0.271209716796875, -0.2509307861328125, -0.23065185546875, -0.2103729248046875, -0.190093994140625, -0.1698150634765625, -0.1495361328125, -0.1292572021484375, -0.108978271484375, -0.0886993408203125, -0.06842041015625, -0.0481414794921875, -0.027862548828125, -0.0075836181640625, 0.0126953125, 0.0329742431640625, 0.053253173828125, 0.0735321044921875, 0.09381103515625, 0.1140899658203125, 0.134368896484375, 0.1546478271484375, 0.1749267578125, 0.1952056884765625, 0.215484619140625, 0.2357635498046875, 0.25604248046875, 0.2763214111328125, 0.296600341796875, 0.3168792724609375, 0.337158203125, 0.3574371337890625, 0.377716064453125, 0.3979949951171875, 0.41827392578125, 0.4385528564453125, 0.458831787109375, 0.4791107177734375, 0.4993896484375, 0.5196685791015625, 0.539947509765625, 0.5602264404296875, 0.58050537109375, 0.6007843017578125, 0.621063232421875, 0.6413421630859375, 0.66162109375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 12.0, 11.0, 16.0, 30.0, 73.0, 182.0, 802.0, 2429.0, 301.0, 107.0, 43.0, 25.0, 13.0, 11.0, 5.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32568359375, -0.31589508056640625, -0.3061065673828125, -0.29631805419921875, -0.286529541015625, -0.27674102783203125, -0.2669525146484375, -0.25716400146484375, -0.24737548828125, -0.23758697509765625, -0.2277984619140625, -0.21800994873046875, -0.208221435546875, -0.19843292236328125, -0.1886444091796875, -0.17885589599609375, -0.1690673828125, -0.15927886962890625, -0.1494903564453125, -0.13970184326171875, -0.129913330078125, -0.12012481689453125, -0.1103363037109375, -0.10054779052734375, -0.09075927734375, -0.08097076416015625, -0.0711822509765625, -0.06139373779296875, -0.051605224609375, -0.04181671142578125, -0.0320281982421875, -0.02223968505859375, -0.012451171875, -0.00266265869140625, 0.0071258544921875, 0.01691436767578125, 0.026702880859375, 0.03649139404296875, 0.0462799072265625, 0.05606842041015625, 0.06585693359375, 0.07564544677734375, 0.0854339599609375, 0.09522247314453125, 0.105010986328125, 0.11479949951171875, 0.1245880126953125, 0.13437652587890625, 0.1441650390625, 0.15395355224609375, 0.1637420654296875, 0.17353057861328125, 0.183319091796875, 0.19310760498046875, 0.2028961181640625, 0.21268463134765625, 0.22247314453125, 0.23226165771484375, 0.2420501708984375, 0.25183868408203125, 0.261627197265625, 0.27141571044921875, 0.2812042236328125, 0.29099273681640625, 0.30078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 2.0, 6.0, 17.0, 10.0, 15.0, 24.0, 32.0, 46.0, 53.0, 86.0, 126.0, 147.0, 133.0, 112.0, 86.0, 44.0, 28.0, 13.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4222581386566162, -1.3833366632461548, -1.3444151878356934, -1.305493712425232, -1.2665722370147705, -1.227650761604309, -1.1887292861938477, -1.1498078107833862, -1.1108863353729248, -1.0719648599624634, -1.033043384552002, -0.9941219091415405, -0.9552004337310791, -0.9162789583206177, -0.8773574829101562, -0.8384360074996948, -0.7995145320892334, -0.760593056678772, -0.7216715812683105, -0.6827501058578491, -0.6438286304473877, -0.6049071550369263, -0.5659856796264648, -0.5270642042160034, -0.488142728805542, -0.44922125339508057, -0.41029977798461914, -0.3713783025741577, -0.3324568271636963, -0.29353535175323486, -0.25461387634277344, -0.215692400932312, -0.17677092552185059, -0.13784945011138916, -0.09892797470092773, -0.06000649929046631, -0.021085023880004883, 0.017836451530456543, 0.05675792694091797, 0.0956794023513794, 0.13460087776184082, 0.17352235317230225, 0.21244382858276367, 0.2513653039932251, 0.2902867794036865, 0.32920825481414795, 0.3681297302246094, 0.4070512056350708, 0.4459726810455322, 0.48489415645599365, 0.5238156318664551, 0.5627371072769165, 0.6016585826873779, 0.6405800580978394, 0.6795015335083008, 0.7184230089187622, 0.7573444843292236, 0.7962659597396851, 0.8351874351501465, 0.8741089105606079, 0.9130303859710693, 0.9519518613815308, 0.9908733367919922, 1.0297948122024536, 1.068716287612915]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 9.0, 5.0, 14.0, 15.0, 11.0, 12.0, 21.0, 24.0, 17.0, 22.0, 29.0, 29.0, 34.0, 33.0, 33.0, 41.0, 43.0, 43.0, 50.0, 37.0, 38.0, 34.0, 46.0, 36.0, 38.0, 43.0, 30.0, 38.0, 20.0, 28.0, 14.0, 27.0, 14.0, 12.0, 9.0, 13.0, 9.0, 9.0, 10.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.8517274856567383, -0.8287113904953003, -0.8056952953338623, -0.7826792001724243, -0.7596631050109863, -0.7366470098495483, -0.7136309146881104, -0.6906148195266724, -0.6675987243652344, -0.6445826292037964, -0.6215665340423584, -0.5985504388809204, -0.5755343437194824, -0.5525182485580444, -0.5295021533966064, -0.5064860582351685, -0.48346996307373047, -0.4604538679122925, -0.4374377727508545, -0.4144216775894165, -0.3914055824279785, -0.3683894872665405, -0.34537339210510254, -0.32235729694366455, -0.29934120178222656, -0.2763251066207886, -0.2533090114593506, -0.2302929162979126, -0.2072768211364746, -0.18426072597503662, -0.16124463081359863, -0.13822853565216064, -0.11521250009536743, -0.09219640493392944, -0.06918030977249146, -0.04616421461105347, -0.02314811944961548, -0.00013202428817749023, 0.022884070873260498, 0.045900166034698486, 0.06891626119613647, 0.09193235635757446, 0.11494845151901245, 0.13796454668045044, 0.16098064184188843, 0.18399673700332642, 0.2070128321647644, 0.2300289273262024, 0.2530450224876404, 0.27606111764907837, 0.29907721281051636, 0.32209330797195435, 0.34510940313339233, 0.3681254982948303, 0.3911415934562683, 0.4141576886177063, 0.4371737837791443, 0.4601898789405823, 0.48320597410202026, 0.5062220692634583, 0.5292381644248962, 0.5522542595863342, 0.5752703547477722, 0.5982864499092102, 0.6213025450706482]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 7.0, 12.0, 18.0, 29.0, 57.0, 63.0, 163.0, 295.0, 612.0, 1530.0, 4538.0, 18816.0, 113871.0, 579988.0, 275325.0, 40694.0, 8221.0, 2493.0, 919.0, 426.0, 194.0, 124.0, 68.0, 21.0, 19.0, 19.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.765625, -0.7472763061523438, -0.7289276123046875, -0.7105789184570312, -0.692230224609375, -0.6738815307617188, -0.6555328369140625, -0.6371841430664062, -0.61883544921875, -0.6004867553710938, -0.5821380615234375, -0.5637893676757812, -0.545440673828125, -0.5270919799804688, -0.5087432861328125, -0.49039459228515625, -0.4720458984375, -0.45369720458984375, -0.4353485107421875, -0.41699981689453125, -0.398651123046875, -0.38030242919921875, -0.3619537353515625, -0.34360504150390625, -0.32525634765625, -0.30690765380859375, -0.2885589599609375, -0.27021026611328125, -0.251861572265625, -0.23351287841796875, -0.2151641845703125, -0.19681549072265625, -0.178466796875, -0.16011810302734375, -0.1417694091796875, -0.12342071533203125, -0.105072021484375, -0.08672332763671875, -0.0683746337890625, -0.05002593994140625, -0.03167724609375, -0.01332855224609375, 0.0050201416015625, 0.02336883544921875, 0.041717529296875, 0.06006622314453125, 0.0784149169921875, 0.09676361083984375, 0.1151123046875, 0.13346099853515625, 0.1518096923828125, 0.17015838623046875, 0.188507080078125, 0.20685577392578125, 0.2252044677734375, 0.24355316162109375, 0.26190185546875, 0.28025054931640625, 0.2985992431640625, 0.31694793701171875, 0.335296630859375, 0.35364532470703125, 0.3719940185546875, 0.39034271240234375, 0.40869140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 11.0, 14.0, 27.0, 33.0, 24.0, 45.0, 69.0, 55.0, 77.0, 86.0, 63.0, 83.0, 79.0, 64.0, 59.0, 42.0, 46.0, 39.0, 18.0, 16.0, 12.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275390625, -0.2651214599609375, -0.254852294921875, -0.2445831298828125, -0.23431396484375, -0.2240447998046875, -0.213775634765625, -0.2035064697265625, -0.1932373046875, -0.1829681396484375, -0.172698974609375, -0.1624298095703125, -0.15216064453125, -0.1418914794921875, -0.131622314453125, -0.1213531494140625, -0.111083984375, -0.1008148193359375, -0.090545654296875, -0.0802764892578125, -0.07000732421875, -0.0597381591796875, -0.049468994140625, -0.0391998291015625, -0.0289306640625, -0.0186614990234375, -0.008392333984375, 0.0018768310546875, 0.01214599609375, 0.0224151611328125, 0.032684326171875, 0.0429534912109375, 0.05322265625, 0.0634918212890625, 0.073760986328125, 0.0840301513671875, 0.09429931640625, 0.1045684814453125, 0.114837646484375, 0.1251068115234375, 0.1353759765625, 0.1456451416015625, 0.155914306640625, 0.1661834716796875, 0.17645263671875, 0.1867218017578125, 0.196990966796875, 0.2072601318359375, 0.217529296875, 0.2277984619140625, 0.238067626953125, 0.2483367919921875, 0.25860595703125, 0.2688751220703125, 0.279144287109375, 0.2894134521484375, 0.2996826171875, 0.3099517822265625, 0.320220947265625, 0.3304901123046875, 0.34075927734375, 0.3510284423828125, 0.361297607421875, 0.3715667724609375, 0.3818359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 9.0, 7.0, 11.0, 23.0, 37.0, 61.0, 117.0, 197.0, 381.0, 1057.0, 3329.0, 20590.0, 553521.0, 446335.0, 18132.0, 3015.0, 906.0, 379.0, 203.0, 88.0, 48.0, 33.0, 26.0, 19.0, 8.0, 5.0, 4.0, 6.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8603515625, -0.82958984375, -0.798828125, -0.76806640625, -0.7373046875, -0.70654296875, -0.67578125, -0.64501953125, -0.6142578125, -0.58349609375, -0.552734375, -0.52197265625, -0.4912109375, -0.46044921875, -0.4296875, -0.39892578125, -0.3681640625, -0.33740234375, -0.306640625, -0.27587890625, -0.2451171875, -0.21435546875, -0.18359375, -0.15283203125, -0.1220703125, -0.09130859375, -0.060546875, -0.02978515625, 0.0009765625, 0.03173828125, 0.0625, 0.09326171875, 0.1240234375, 0.15478515625, 0.185546875, 0.21630859375, 0.2470703125, 0.27783203125, 0.30859375, 0.33935546875, 0.3701171875, 0.40087890625, 0.431640625, 0.46240234375, 0.4931640625, 0.52392578125, 0.5546875, 0.58544921875, 0.6162109375, 0.64697265625, 0.677734375, 0.70849609375, 0.7392578125, 0.77001953125, 0.80078125, 0.83154296875, 0.8623046875, 0.89306640625, 0.923828125, 0.95458984375, 0.9853515625, 1.01611328125, 1.046875, 1.07763671875, 1.1083984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 7.0, 10.0, 9.0, 20.0, 22.0, 31.0, 18.0, 25.0, 33.0, 38.0, 33.0, 52.0, 50.0, 37.0, 44.0, 37.0, 51.0, 44.0, 34.0, 34.0, 43.0, 40.0, 25.0, 40.0, 34.0, 23.0, 23.0, 21.0, 13.0, 14.0, 14.0, 13.0, 6.0, 10.0, 6.0, 5.0, 4.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.859375, -0.8346405029296875, -0.809906005859375, -0.7851715087890625, -0.76043701171875, -0.7357025146484375, -0.710968017578125, -0.6862335205078125, -0.6614990234375, -0.6367645263671875, -0.612030029296875, -0.5872955322265625, -0.56256103515625, -0.5378265380859375, -0.513092041015625, -0.4883575439453125, -0.463623046875, -0.4388885498046875, -0.414154052734375, -0.3894195556640625, -0.36468505859375, -0.3399505615234375, -0.315216064453125, -0.2904815673828125, -0.2657470703125, -0.2410125732421875, -0.216278076171875, -0.1915435791015625, -0.16680908203125, -0.1420745849609375, -0.117340087890625, -0.0926055908203125, -0.06787109375, -0.0431365966796875, -0.018402099609375, 0.0063323974609375, 0.03106689453125, 0.0558013916015625, 0.080535888671875, 0.1052703857421875, 0.1300048828125, 0.1547393798828125, 0.179473876953125, 0.2042083740234375, 0.22894287109375, 0.2536773681640625, 0.278411865234375, 0.3031463623046875, 0.327880859375, 0.3526153564453125, 0.377349853515625, 0.4020843505859375, 0.42681884765625, 0.4515533447265625, 0.476287841796875, 0.5010223388671875, 0.5257568359375, 0.5504913330078125, 0.575225830078125, 0.5999603271484375, 0.62469482421875, 0.6494293212890625, 0.674163818359375, 0.6988983154296875, 0.7236328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 7.0, 3.0, 6.0, 9.0, 11.0, 16.0, 22.0, 37.0, 39.0, 86.0, 136.0, 223.0, 347.0, 708.0, 1368.0, 3497.0, 10947.0, 55179.0, 446697.0, 455604.0, 55930.0, 11222.0, 3446.0, 1369.0, 669.0, 344.0, 180.0, 140.0, 95.0, 61.0, 35.0, 32.0, 18.0, 23.0, 6.0, 4.0, 9.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.204833984375, -0.19862747192382812, -0.19242095947265625, -0.18621444702148438, -0.1800079345703125, -0.17380142211914062, -0.16759490966796875, -0.16138839721679688, -0.155181884765625, -0.14897537231445312, -0.14276885986328125, -0.13656234741210938, -0.1303558349609375, -0.12414932250976562, -0.11794281005859375, -0.11173629760742188, -0.10552978515625, -0.09932327270507812, -0.09311676025390625, -0.08691024780273438, -0.0807037353515625, -0.07449722290039062, -0.06829071044921875, -0.062084197998046875, -0.055877685546875, -0.049671173095703125, -0.04346466064453125, -0.037258148193359375, -0.0310516357421875, -0.024845123291015625, -0.01863861083984375, -0.012432098388671875, -0.0062255859375, -1.9073486328125e-05, 0.00618743896484375, 0.012393951416015625, 0.0186004638671875, 0.024806976318359375, 0.03101348876953125, 0.037220001220703125, 0.043426513671875, 0.049633026123046875, 0.05583953857421875, 0.062046051025390625, 0.0682525634765625, 0.07445907592773438, 0.08066558837890625, 0.08687210083007812, 0.09307861328125, 0.09928512573242188, 0.10549163818359375, 0.11169815063476562, 0.1179046630859375, 0.12411117553710938, 0.13031768798828125, 0.13652420043945312, 0.142730712890625, 0.14893722534179688, 0.15514373779296875, 0.16135025024414062, 0.1675567626953125, 0.17376327514648438, 0.17996978759765625, 0.18617630004882812, 0.1923828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 13.0, 17.0, 12.0, 22.0, 28.0, 23.0, 44.0, 57.0, 76.0, 87.0, 90.0, 99.0, 84.0, 68.0, 48.0, 46.0, 25.0, 23.0, 32.0, 22.0, 17.0, 9.0, 8.0, 3.0, 4.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.245208740234375e-05, -5.095265805721283e-05, -4.945322871208191e-05, -4.795379936695099e-05, -4.645437002182007e-05, -4.495494067668915e-05, -4.345551133155823e-05, -4.195608198642731e-05, -4.045665264129639e-05, -3.8957223296165466e-05, -3.7457793951034546e-05, -3.5958364605903625e-05, -3.4458935260772705e-05, -3.2959505915641785e-05, -3.1460076570510864e-05, -2.9960647225379944e-05, -2.8461217880249023e-05, -2.6961788535118103e-05, -2.5462359189987183e-05, -2.3962929844856262e-05, -2.2463500499725342e-05, -2.096407115459442e-05, -1.94646418094635e-05, -1.796521246433258e-05, -1.646578311920166e-05, -1.496635377407074e-05, -1.346692442893982e-05, -1.1967495083808899e-05, -1.0468065738677979e-05, -8.968636393547058e-06, -7.469207048416138e-06, -5.969777703285217e-06, -4.470348358154297e-06, -2.9709190130233765e-06, -1.471489667892456e-06, 2.7939677238464355e-08, 1.5273690223693848e-06, 3.026798367500305e-06, 4.526227712631226e-06, 6.025657057762146e-06, 7.525086402893066e-06, 9.024515748023987e-06, 1.0523945093154907e-05, 1.2023374438285828e-05, 1.3522803783416748e-05, 1.5022233128547668e-05, 1.652166247367859e-05, 1.802109181880951e-05, 1.952052116394043e-05, 2.101995050907135e-05, 2.251937985420227e-05, 2.401880919933319e-05, 2.551823854446411e-05, 2.7017667889595032e-05, 2.8517097234725952e-05, 3.0016526579856873e-05, 3.151595592498779e-05, 3.301538527011871e-05, 3.4514814615249634e-05, 3.6014243960380554e-05, 3.7513673305511475e-05, 3.9013102650642395e-05, 4.0512531995773315e-05, 4.2011961340904236e-05, 4.3511390686035156e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 7.0, 8.0, 14.0, 27.0, 41.0, 54.0, 63.0, 95.0, 153.0, 265.0, 446.0, 695.0, 1494.0, 3168.0, 9831.0, 41038.0, 244409.0, 607001.0, 108330.0, 20877.0, 5791.0, 2164.0, 1046.0, 557.0, 375.0, 185.0, 115.0, 81.0, 58.0, 36.0, 39.0, 18.0, 17.0, 6.0, 11.0, 10.0, 9.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1993408203125, -0.19296836853027344, -0.18659591674804688, -0.1802234649658203, -0.17385101318359375, -0.1674785614013672, -0.16110610961914062, -0.15473365783691406, -0.1483612060546875, -0.14198875427246094, -0.13561630249023438, -0.1292438507080078, -0.12287139892578125, -0.11649894714355469, -0.11012649536132812, -0.10375404357910156, -0.097381591796875, -0.09100914001464844, -0.08463668823242188, -0.07826423645019531, -0.07189178466796875, -0.06551933288574219, -0.059146881103515625, -0.05277442932128906, -0.0464019775390625, -0.04002952575683594, -0.033657073974609375, -0.027284622192382812, -0.02091217041015625, -0.014539718627929688, -0.008167266845703125, -0.0017948150634765625, 0.00457763671875, 0.010950088500976562, 0.017322540283203125, 0.023694992065429688, 0.03006744384765625, 0.03643989562988281, 0.042812347412109375, 0.04918479919433594, 0.0555572509765625, 0.06192970275878906, 0.06830215454101562, 0.07467460632324219, 0.08104705810546875, 0.08741950988769531, 0.09379196166992188, 0.10016441345214844, 0.106536865234375, 0.11290931701660156, 0.11928176879882812, 0.1256542205810547, 0.13202667236328125, 0.1383991241455078, 0.14477157592773438, 0.15114402770996094, 0.1575164794921875, 0.16388893127441406, 0.17026138305664062, 0.1766338348388672, 0.18300628662109375, 0.1893787384033203, 0.19575119018554688, 0.20212364196777344, 0.20849609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 10.0, 8.0, 16.0, 20.0, 13.0, 13.0, 19.0, 44.0, 30.0, 46.0, 53.0, 56.0, 75.0, 72.0, 57.0, 85.0, 61.0, 46.0, 44.0, 38.0, 36.0, 29.0, 29.0, 12.0, 12.0, 21.0, 7.0, 8.0, 5.0, 9.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1417236328125, -0.13650131225585938, -0.13127899169921875, -0.12605667114257812, -0.1208343505859375, -0.11561203002929688, -0.11038970947265625, -0.10516738891601562, -0.099945068359375, -0.09472274780273438, -0.08950042724609375, -0.08427810668945312, -0.0790557861328125, -0.07383346557617188, -0.06861114501953125, -0.06338882446289062, -0.05816650390625, -0.052944183349609375, -0.04772186279296875, -0.042499542236328125, -0.0372772216796875, -0.032054901123046875, -0.02683258056640625, -0.021610260009765625, -0.016387939453125, -0.011165618896484375, -0.00594329833984375, -0.000720977783203125, 0.0045013427734375, 0.009723663330078125, 0.01494598388671875, 0.020168304443359375, 0.025390625, 0.030612945556640625, 0.03583526611328125, 0.041057586669921875, 0.0462799072265625, 0.051502227783203125, 0.05672454833984375, 0.061946868896484375, 0.067169189453125, 0.07239151000976562, 0.07761383056640625, 0.08283615112304688, 0.0880584716796875, 0.09328079223632812, 0.09850311279296875, 0.10372543334960938, 0.10894775390625, 0.11417007446289062, 0.11939239501953125, 0.12461471557617188, 0.1298370361328125, 0.13505935668945312, 0.14028167724609375, 0.14550399780273438, 0.150726318359375, 0.15594863891601562, 0.16117095947265625, 0.16639328002929688, 0.1716156005859375, 0.17683792114257812, 0.18206024169921875, 0.18728256225585938, 0.1925048828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 8.0, 14.0, 30.0, 36.0, 73.0, 133.0, 171.0, 168.0, 128.0, 86.0, 60.0, 36.0, 17.0, 14.0, 5.0, 8.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.891074180603027, -5.74791955947876, -5.604764461517334, -5.461609840393066, -5.318454742431641, -5.175300121307373, -5.032145023345947, -4.88899040222168, -4.745835304260254, -4.602680683135986, -4.4595255851745605, -4.316370964050293, -4.173215866088867, -4.0300612449646, -3.886906385421753, -3.7437515258789062, -3.6005969047546387, -3.457442045211792, -3.3142871856689453, -3.1711323261260986, -3.027977466583252, -2.8848228454589844, -2.7416679859161377, -2.598513126373291, -2.4553582668304443, -2.3122034072875977, -2.169048547744751, -2.0258936882019043, -1.8827389478683472, -1.7395840883255005, -1.5964293479919434, -1.4532744884490967, -1.310119390487671, -1.1669645309448242, -1.0238096714019775, -0.8806549310684204, -0.7375000715255737, -0.594345211982727, -0.45119041204452515, -0.30803561210632324, -0.16488075256347656, -0.02172592282295227, 0.12142890691757202, 0.2645837366580963, 0.4077385663986206, 0.5508934259414673, 0.6940482258796692, 0.8372030258178711, 0.9803578853607178, 1.1235127449035645, 1.2666676044464111, 1.4098223447799683, 1.552977204322815, 1.6961320638656616, 1.8392868041992188, 1.9824416637420654, 2.125596523284912, 2.268751382827759, 2.4119062423706055, 2.555061101913452, 2.698215961456299, 2.8413705825805664, 2.984525442123413, 3.1276803016662598, 3.2708351612091064]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 8.0, 6.0, 8.0, 11.0, 14.0, 16.0, 16.0, 23.0, 32.0, 29.0, 26.0, 40.0, 46.0, 46.0, 47.0, 57.0, 66.0, 57.0, 49.0, 57.0, 52.0, 49.0, 32.0, 39.0, 37.0, 23.0, 26.0, 18.0, 11.0, 10.0, 8.0, 6.0, 2.0, 5.0, 6.0, 4.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.542490482330322, -4.4160685539245605, -4.289646625518799, -4.163224697113037, -4.036802291870117, -3.9103806018829346, -3.7839584350585938, -3.657536506652832, -3.5311145782470703, -3.4046926498413086, -3.278270721435547, -3.151848554611206, -3.0254266262054443, -2.8990046977996826, -2.772582530975342, -2.64616060256958, -2.5197386741638184, -2.3933167457580566, -2.266894817352295, -2.140472650527954, -2.0140507221221924, -1.8876287937164307, -1.7612067461013794, -1.6347846984863281, -1.5083627700805664, -1.3819408416748047, -1.2555187940597534, -1.1290967464447021, -1.0026748180389404, -0.8762528300285339, -0.7498308420181274, -0.623408854007721, -0.49698686599731445, -0.37056487798690796, -0.24414288997650146, -0.11772090196609497, 0.008701086044311523, 0.13512307405471802, 0.2615450620651245, 0.387967050075531, 0.5143890380859375, 0.640811026096344, 0.7672330141067505, 0.893655002117157, 1.0200769901275635, 1.1464989185333252, 1.2729209661483765, 1.3993430137634277, 1.5257649421691895, 1.6521868705749512, 1.7786089181900024, 1.9050309658050537, 2.0314528942108154, 2.157874822616577, 2.284296989440918, 2.4107189178466797, 2.5371408462524414, 2.663562774658203, 2.789984703063965, 2.9164068698883057, 3.0428287982940674, 3.169250726699829, 3.29567289352417, 3.4220948219299316, 3.5485167503356934]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 14.0, 14.0, 37.0, 52.0, 86.0, 127.0, 236.0, 476.0, 1057.0, 2927.0, 10152.0, 63439.0, 3188530.0, 888781.0, 28197.0, 6310.0, 2063.0, 884.0, 384.0, 225.0, 109.0, 63.0, 40.0, 15.0, 17.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6220703125, -0.6036834716796875, -0.585296630859375, -0.5669097900390625, -0.54852294921875, -0.5301361083984375, -0.511749267578125, -0.4933624267578125, -0.4749755859375, -0.4565887451171875, -0.438201904296875, -0.4198150634765625, -0.40142822265625, -0.3830413818359375, -0.364654541015625, -0.3462677001953125, -0.327880859375, -0.3094940185546875, -0.291107177734375, -0.2727203369140625, -0.25433349609375, -0.2359466552734375, -0.217559814453125, -0.1991729736328125, -0.1807861328125, -0.1623992919921875, -0.144012451171875, -0.1256256103515625, -0.10723876953125, -0.0888519287109375, -0.070465087890625, -0.0520782470703125, -0.03369140625, -0.0153045654296875, 0.003082275390625, 0.0214691162109375, 0.03985595703125, 0.0582427978515625, 0.076629638671875, 0.0950164794921875, 0.1134033203125, 0.1317901611328125, 0.150177001953125, 0.1685638427734375, 0.18695068359375, 0.2053375244140625, 0.223724365234375, 0.2421112060546875, 0.260498046875, 0.2788848876953125, 0.297271728515625, 0.3156585693359375, 0.33404541015625, 0.3524322509765625, 0.370819091796875, 0.3892059326171875, 0.4075927734375, 0.4259796142578125, 0.444366455078125, 0.4627532958984375, 0.48114013671875, 0.4995269775390625, 0.517913818359375, 0.5363006591796875, 0.5546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 11.0, 7.0, 9.0, 15.0, 20.0, 26.0, 41.0, 31.0, 50.0, 69.0, 70.0, 94.0, 84.0, 71.0, 61.0, 67.0, 62.0, 44.0, 52.0, 34.0, 33.0, 18.0, 11.0, 11.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2086181640625, -0.1991443634033203, -0.18967056274414062, -0.18019676208496094, -0.17072296142578125, -0.16124916076660156, -0.15177536010742188, -0.1423015594482422, -0.1328277587890625, -0.12335395812988281, -0.11388015747070312, -0.10440635681152344, -0.09493255615234375, -0.08545875549316406, -0.07598495483398438, -0.06651115417480469, -0.057037353515625, -0.04756355285644531, -0.038089752197265625, -0.028615951538085938, -0.01914215087890625, -0.009668350219726562, -0.000194549560546875, 0.009279251098632812, 0.0187530517578125, 0.028226852416992188, 0.037700653076171875, 0.04717445373535156, 0.05664825439453125, 0.06612205505371094, 0.07559585571289062, 0.08506965637207031, 0.09454345703125, 0.10401725769042969, 0.11349105834960938, 0.12296485900878906, 0.13243865966796875, 0.14191246032714844, 0.15138626098632812, 0.1608600616455078, 0.1703338623046875, 0.1798076629638672, 0.18928146362304688, 0.19875526428222656, 0.20822906494140625, 0.21770286560058594, 0.22717666625976562, 0.2366504669189453, 0.246124267578125, 0.2555980682373047, 0.2650718688964844, 0.27454566955566406, 0.28401947021484375, 0.29349327087402344, 0.3029670715332031, 0.3124408721923828, 0.3219146728515625, 0.3313884735107422, 0.3408622741699219, 0.35033607482910156, 0.35980987548828125, 0.36928367614746094, 0.3787574768066406, 0.3882312774658203, 0.397705078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 7.0, 7.0, 12.0, 9.0, 25.0, 35.0, 69.0, 136.0, 328.0, 812.0, 2518.0, 8399.0, 40952.0, 946707.0, 3101978.0, 74198.0, 12712.0, 3359.0, 1135.0, 447.0, 180.0, 98.0, 39.0, 31.0, 22.0, 19.0, 11.0, 10.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58642578125, -0.5669708251953125, -0.547515869140625, -0.5280609130859375, -0.50860595703125, -0.4891510009765625, -0.469696044921875, -0.4502410888671875, -0.4307861328125, -0.4113311767578125, -0.391876220703125, -0.3724212646484375, -0.35296630859375, -0.3335113525390625, -0.314056396484375, -0.2946014404296875, -0.275146484375, -0.2556915283203125, -0.236236572265625, -0.2167816162109375, -0.19732666015625, -0.1778717041015625, -0.158416748046875, -0.1389617919921875, -0.1195068359375, -0.1000518798828125, -0.080596923828125, -0.0611419677734375, -0.04168701171875, -0.0222320556640625, -0.002777099609375, 0.0166778564453125, 0.0361328125, 0.0555877685546875, 0.075042724609375, 0.0944976806640625, 0.11395263671875, 0.1334075927734375, 0.152862548828125, 0.1723175048828125, 0.1917724609375, 0.2112274169921875, 0.230682373046875, 0.2501373291015625, 0.26959228515625, 0.2890472412109375, 0.308502197265625, 0.3279571533203125, 0.347412109375, 0.3668670654296875, 0.386322021484375, 0.4057769775390625, 0.42523193359375, 0.4446868896484375, 0.464141845703125, 0.4835968017578125, 0.5030517578125, 0.5225067138671875, 0.541961669921875, 0.5614166259765625, 0.58087158203125, 0.6003265380859375, 0.619781494140625, 0.6392364501953125, 0.65869140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 9.0, 8.0, 2.0, 8.0, 5.0, 11.0, 21.0, 30.0, 34.0, 45.0, 96.0, 151.0, 319.0, 581.0, 927.0, 798.0, 437.0, 239.0, 105.0, 72.0, 50.0, 31.0, 20.0, 15.0, 7.0, 12.0, 9.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.49755096435546875, -0.4819183349609375, -0.46628570556640625, -0.450653076171875, -0.43502044677734375, -0.4193878173828125, -0.40375518798828125, -0.38812255859375, -0.37248992919921875, -0.3568572998046875, -0.34122467041015625, -0.325592041015625, -0.30995941162109375, -0.2943267822265625, -0.27869415283203125, -0.2630615234375, -0.24742889404296875, -0.2317962646484375, -0.21616363525390625, -0.200531005859375, -0.18489837646484375, -0.1692657470703125, -0.15363311767578125, -0.13800048828125, -0.12236785888671875, -0.1067352294921875, -0.09110260009765625, -0.075469970703125, -0.05983734130859375, -0.0442047119140625, -0.02857208251953125, -0.012939453125, 0.00269317626953125, 0.0183258056640625, 0.03395843505859375, 0.049591064453125, 0.06522369384765625, 0.0808563232421875, 0.09648895263671875, 0.11212158203125, 0.12775421142578125, 0.1433868408203125, 0.15901947021484375, 0.174652099609375, 0.19028472900390625, 0.2059173583984375, 0.22154998779296875, 0.2371826171875, 0.25281524658203125, 0.2684478759765625, 0.28408050537109375, 0.299713134765625, 0.31534576416015625, 0.3309783935546875, 0.34661102294921875, 0.36224365234375, 0.37787628173828125, 0.3935089111328125, 0.40914154052734375, 0.424774169921875, 0.44040679931640625, 0.4560394287109375, 0.47167205810546875, 0.4873046875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 7.0, 19.0, 98.0, 259.0, 360.0, 188.0, 33.0, 11.0, 11.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.754988670349121, -13.475505828857422, -13.196022987365723, -12.916540145874023, -12.637057304382324, -12.357574462890625, -12.078091621398926, -11.798608779907227, -11.519125938415527, -11.239643096923828, -10.960160255432129, -10.68067741394043, -10.40119457244873, -10.121711730957031, -9.842228889465332, -9.562746047973633, -9.283263206481934, -9.003780364990234, -8.724297523498535, -8.444814682006836, -8.165331840515137, -7.8858489990234375, -7.606366157531738, -7.326883316040039, -7.04740047454834, -6.767917633056641, -6.488434791564941, -6.208951950073242, -5.929469108581543, -5.649986267089844, -5.3705034255981445, -5.091020584106445, -4.811538219451904, -4.532055377960205, -4.252572536468506, -3.9730896949768066, -3.6936068534851074, -3.414124011993408, -3.134641170501709, -2.8551583290100098, -2.5756754875183105, -2.2961926460266113, -2.016709804534912, -1.737226963043213, -1.4577441215515137, -1.1782612800598145, -0.8987784385681152, -0.619295597076416, -0.3398127555847168, -0.06032991409301758, 0.21915292739868164, 0.49863576889038086, 0.7781186103820801, 1.0576014518737793, 1.3370842933654785, 1.6165671348571777, 1.896049976348877, 2.175532817840576, 2.4550156593322754, 2.7344985008239746, 3.013981342315674, 3.293464183807373, 3.5729470252990723, 3.8524298667907715, 4.131912708282471]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 10.0, 13.0, 19.0, 24.0, 25.0, 22.0, 26.0, 50.0, 36.0, 43.0, 29.0, 56.0, 61.0, 39.0, 69.0, 59.0, 42.0, 44.0, 43.0, 42.0, 38.0, 43.0, 28.0, 16.0, 26.0, 12.0, 24.0, 16.0, 9.0, 3.0, 7.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.4966812133789062, -2.429938793182373, -2.3631961345672607, -2.2964534759521484, -2.2297110557556152, -2.162968635559082, -2.0962259769439697, -2.0294833183288574, -1.9627408981323242, -1.8959983587265015, -1.8292558193206787, -1.762513279914856, -1.6957707405090332, -1.6290282011032104, -1.5622856616973877, -1.495543122291565, -1.4288005828857422, -1.3620580434799194, -1.2953155040740967, -1.228572964668274, -1.1618304252624512, -1.0950878858566284, -1.0283453464508057, -0.9616028070449829, -0.8948602676391602, -0.8281177282333374, -0.7613751888275146, -0.6946326494216919, -0.6278901100158691, -0.5611475706100464, -0.49440503120422363, -0.4276624917984009, -0.3609200716018677, -0.2941775321960449, -0.22743499279022217, -0.16069245338439941, -0.09394991397857666, -0.027207374572753906, 0.03953516483306885, 0.1062777042388916, 0.17302024364471436, 0.2397627830505371, 0.30650532245635986, 0.3732478618621826, 0.43999040126800537, 0.5067329406738281, 0.5734754800796509, 0.6402180194854736, 0.7069605588912964, 0.7737030982971191, 0.8404456377029419, 0.9071881771087646, 0.9739307165145874, 1.0406732559204102, 1.107415795326233, 1.1741583347320557, 1.2409008741378784, 1.3076434135437012, 1.374385952949524, 1.4411284923553467, 1.5078710317611694, 1.5746135711669922, 1.641356110572815, 1.7080986499786377, 1.7748411893844604]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 7.0, 8.0, 9.0, 16.0, 29.0, 46.0, 75.0, 121.0, 178.0, 290.0, 595.0, 973.0, 1696.0, 2997.0, 5627.0, 10824.0, 21575.0, 43969.0, 92768.0, 193802.0, 297790.0, 193625.0, 92551.0, 44154.0, 21323.0, 10821.0, 5663.0, 3010.0, 1693.0, 978.0, 541.0, 325.0, 170.0, 123.0, 81.0, 38.0, 32.0, 11.0, 10.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1864013671875, -0.17962265014648438, -0.17284393310546875, -0.16606521606445312, -0.1592864990234375, -0.15250778198242188, -0.14572906494140625, -0.13895034790039062, -0.132171630859375, -0.12539291381835938, -0.11861419677734375, -0.11183547973632812, -0.1050567626953125, -0.09827804565429688, -0.09149932861328125, -0.08472061157226562, -0.07794189453125, -0.07116317749023438, -0.06438446044921875, -0.057605743408203125, -0.0508270263671875, -0.044048309326171875, -0.03726959228515625, -0.030490875244140625, -0.023712158203125, -0.016933441162109375, -0.01015472412109375, -0.003376007080078125, 0.0034027099609375, 0.010181427001953125, 0.01696014404296875, 0.023738861083984375, 0.030517578125, 0.037296295166015625, 0.04407501220703125, 0.050853729248046875, 0.0576324462890625, 0.06441116333007812, 0.07118988037109375, 0.07796859741210938, 0.084747314453125, 0.09152603149414062, 0.09830474853515625, 0.10508346557617188, 0.1118621826171875, 0.11864089965820312, 0.12541961669921875, 0.13219833374023438, 0.13897705078125, 0.14575576782226562, 0.15253448486328125, 0.15931320190429688, 0.1660919189453125, 0.17287063598632812, 0.17964935302734375, 0.18642807006835938, 0.193206787109375, 0.19998550415039062, 0.20676422119140625, 0.21354293823242188, 0.2203216552734375, 0.22710037231445312, 0.23387908935546875, 0.24065780639648438, 0.2474365234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 4.0, 8.0, 12.0, 6.0, 5.0, 10.0, 9.0, 13.0, 17.0, 17.0, 22.0, 21.0, 21.0, 26.0, 31.0, 25.0, 33.0, 38.0, 43.0, 30.0, 47.0, 44.0, 50.0, 44.0, 33.0, 42.0, 36.0, 40.0, 29.0, 36.0, 32.0, 17.0, 21.0, 26.0, 17.0, 16.0, 17.0, 10.0, 9.0, 6.0, 6.0, 6.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1455078125, -0.1403064727783203, -0.13510513305664062, -0.12990379333496094, -0.12470245361328125, -0.11950111389160156, -0.11429977416992188, -0.10909843444824219, -0.1038970947265625, -0.09869575500488281, -0.09349441528320312, -0.08829307556152344, -0.08309173583984375, -0.07789039611816406, -0.07268905639648438, -0.06748771667480469, -0.062286376953125, -0.05708503723144531, -0.051883697509765625, -0.04668235778808594, -0.04148101806640625, -0.03627967834472656, -0.031078338623046875, -0.025876998901367188, -0.0206756591796875, -0.015474319458007812, -0.010272979736328125, -0.0050716400146484375, 0.00012969970703125, 0.0053310394287109375, 0.010532379150390625, 0.015733718872070312, 0.02093505859375, 0.026136398315429688, 0.031337738037109375, 0.03653907775878906, 0.04174041748046875, 0.04694175720214844, 0.052143096923828125, 0.05734443664550781, 0.0625457763671875, 0.06774711608886719, 0.07294845581054688, 0.07814979553222656, 0.08335113525390625, 0.08855247497558594, 0.09375381469726562, 0.09895515441894531, 0.104156494140625, 0.10935783386230469, 0.11455917358398438, 0.11976051330566406, 0.12496185302734375, 0.13016319274902344, 0.13536453247070312, 0.1405658721923828, 0.1457672119140625, 0.1509685516357422, 0.15616989135742188, 0.16137123107910156, 0.16657257080078125, 0.17177391052246094, 0.17697525024414062, 0.1821765899658203, 0.1873779296875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 11.0, 10.0, 15.0, 11.0, 19.0, 36.0, 47.0, 78.0, 118.0, 174.0, 295.0, 512.0, 867.0, 1958.0, 5888.0, 37061.0, 649236.0, 321655.0, 22510.0, 4400.0, 1633.0, 835.0, 426.0, 236.0, 158.0, 103.0, 64.0, 50.0, 40.0, 28.0, 19.0, 17.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68994140625, -0.6676025390625, -0.645263671875, -0.6229248046875, -0.6005859375, -0.5782470703125, -0.555908203125, -0.5335693359375, -0.51123046875, -0.4888916015625, -0.466552734375, -0.4442138671875, -0.421875, -0.3995361328125, -0.377197265625, -0.3548583984375, -0.33251953125, -0.3101806640625, -0.287841796875, -0.2655029296875, -0.2431640625, -0.2208251953125, -0.198486328125, -0.1761474609375, -0.15380859375, -0.1314697265625, -0.109130859375, -0.0867919921875, -0.064453125, -0.0421142578125, -0.019775390625, 0.0025634765625, 0.02490234375, 0.0472412109375, 0.069580078125, 0.0919189453125, 0.1142578125, 0.1365966796875, 0.158935546875, 0.1812744140625, 0.20361328125, 0.2259521484375, 0.248291015625, 0.2706298828125, 0.29296875, 0.3153076171875, 0.337646484375, 0.3599853515625, 0.38232421875, 0.4046630859375, 0.427001953125, 0.4493408203125, 0.4716796875, 0.4940185546875, 0.516357421875, 0.5386962890625, 0.56103515625, 0.5833740234375, 0.605712890625, 0.6280517578125, 0.650390625, 0.6727294921875, 0.695068359375, 0.7174072265625, 0.73974609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 11.0, 7.0, 10.0, 10.0, 11.0, 15.0, 17.0, 35.0, 30.0, 24.0, 26.0, 37.0, 46.0, 31.0, 46.0, 46.0, 55.0, 40.0, 57.0, 44.0, 60.0, 48.0, 42.0, 44.0, 34.0, 22.0, 27.0, 21.0, 18.0, 20.0, 12.0, 8.0, 3.0, 3.0, 7.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74169921875, -0.7158966064453125, -0.690093994140625, -0.6642913818359375, -0.63848876953125, -0.6126861572265625, -0.586883544921875, -0.5610809326171875, -0.5352783203125, -0.5094757080078125, -0.483673095703125, -0.4578704833984375, -0.43206787109375, -0.4062652587890625, -0.380462646484375, -0.3546600341796875, -0.328857421875, -0.3030548095703125, -0.277252197265625, -0.2514495849609375, -0.22564697265625, -0.1998443603515625, -0.174041748046875, -0.1482391357421875, -0.1224365234375, -0.0966339111328125, -0.070831298828125, -0.0450286865234375, -0.01922607421875, 0.0065765380859375, 0.032379150390625, 0.0581817626953125, 0.083984375, 0.1097869873046875, 0.135589599609375, 0.1613922119140625, 0.18719482421875, 0.2129974365234375, 0.238800048828125, 0.2646026611328125, 0.2904052734375, 0.3162078857421875, 0.342010498046875, 0.3678131103515625, 0.39361572265625, 0.4194183349609375, 0.445220947265625, 0.4710235595703125, 0.496826171875, 0.5226287841796875, 0.548431396484375, 0.5742340087890625, 0.60003662109375, 0.6258392333984375, 0.651641845703125, 0.6774444580078125, 0.7032470703125, 0.7290496826171875, 0.754852294921875, 0.7806549072265625, 0.80645751953125, 0.8322601318359375, 0.858062744140625, 0.8838653564453125, 0.90966796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 5.0, 8.0, 13.0, 13.0, 23.0, 33.0, 36.0, 59.0, 103.0, 137.0, 277.0, 533.0, 1009.0, 2514.0, 7720.0, 38181.0, 611252.0, 346214.0, 29640.0, 6500.0, 2180.0, 936.0, 491.0, 250.0, 154.0, 84.0, 44.0, 46.0, 23.0, 17.0, 17.0, 6.0, 8.0, 4.0, 3.0, 4.0, 7.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.2577629089355469, -0.24819183349609375, -0.23862075805664062, -0.2290496826171875, -0.21947860717773438, -0.20990753173828125, -0.20033645629882812, -0.190765380859375, -0.18119430541992188, -0.17162322998046875, -0.16205215454101562, -0.1524810791015625, -0.14291000366210938, -0.13333892822265625, -0.12376785278320312, -0.11419677734375, -0.10462570190429688, -0.09505462646484375, -0.08548355102539062, -0.0759124755859375, -0.06634140014648438, -0.05677032470703125, -0.047199249267578125, -0.037628173828125, -0.028057098388671875, -0.01848602294921875, -0.008914947509765625, 0.0006561279296875, 0.010227203369140625, 0.01979827880859375, 0.029369354248046875, 0.0389404296875, 0.048511505126953125, 0.05808258056640625, 0.06765365600585938, 0.0772247314453125, 0.08679580688476562, 0.09636688232421875, 0.10593795776367188, 0.115509033203125, 0.12508010864257812, 0.13465118408203125, 0.14422225952148438, 0.1537933349609375, 0.16336441040039062, 0.17293548583984375, 0.18250656127929688, 0.19207763671875, 0.20164871215820312, 0.21121978759765625, 0.22079086303710938, 0.2303619384765625, 0.23993301391601562, 0.24950408935546875, 0.2590751647949219, 0.268646240234375, 0.2782173156738281, 0.28778839111328125, 0.2973594665527344, 0.3069305419921875, 0.3165016174316406, 0.32607269287109375, 0.3356437683105469, 0.34521484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 5.0, 16.0, 17.0, 15.0, 13.0, 13.0, 36.0, 42.0, 56.0, 80.0, 123.0, 150.0, 112.0, 82.0, 62.0, 33.0, 31.0, 21.0, 14.0, 13.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.192922592163086e-05, -5.974434316158295e-05, -5.7559460401535034e-05, -5.537457764148712e-05, -5.318969488143921e-05, -5.1004812121391296e-05, -4.8819929361343384e-05, -4.663504660129547e-05, -4.445016384124756e-05, -4.2265281081199646e-05, -4.0080398321151733e-05, -3.789551556110382e-05, -3.571063280105591e-05, -3.3525750041007996e-05, -3.134086728096008e-05, -2.915598452091217e-05, -2.6971101760864258e-05, -2.4786219000816345e-05, -2.2601336240768433e-05, -2.041645348072052e-05, -1.8231570720672607e-05, -1.6046687960624695e-05, -1.3861805200576782e-05, -1.167692244052887e-05, -9.492039680480957e-06, -7.3071569204330444e-06, -5.122274160385132e-06, -2.9373914003372192e-06, -7.525086402893066e-07, 1.432374119758606e-06, 3.6172568798065186e-06, 5.802139639854431e-06, 7.987022399902344e-06, 1.0171905159950256e-05, 1.2356787919998169e-05, 1.4541670680046082e-05, 1.6726553440093994e-05, 1.8911436200141907e-05, 2.109631896018982e-05, 2.3281201720237732e-05, 2.5466084480285645e-05, 2.7650967240333557e-05, 2.983585000038147e-05, 3.202073276042938e-05, 3.4205615520477295e-05, 3.639049828052521e-05, 3.857538104057312e-05, 4.076026380062103e-05, 4.2945146560668945e-05, 4.513002932071686e-05, 4.731491208076477e-05, 4.949979484081268e-05, 5.1684677600860596e-05, 5.386956036090851e-05, 5.605444312095642e-05, 5.8239325881004333e-05, 6.0424208641052246e-05, 6.260909140110016e-05, 6.479397416114807e-05, 6.697885692119598e-05, 6.91637396812439e-05, 7.134862244129181e-05, 7.353350520133972e-05, 7.571838796138763e-05, 7.790327072143555e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 7.0, 3.0, 4.0, 7.0, 3.0, 10.0, 8.0, 6.0, 13.0, 29.0, 37.0, 45.0, 80.0, 119.0, 203.0, 349.0, 692.0, 1319.0, 3356.0, 10739.0, 54713.0, 674671.0, 260477.0, 29928.0, 6835.0, 2448.0, 1027.0, 560.0, 344.0, 175.0, 118.0, 59.0, 50.0, 28.0, 26.0, 24.0, 15.0, 5.0, 3.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.36279296875, -0.3520698547363281, -0.34134674072265625, -0.3306236267089844, -0.3199005126953125, -0.3091773986816406, -0.29845428466796875, -0.2877311706542969, -0.277008056640625, -0.2662849426269531, -0.25556182861328125, -0.24483871459960938, -0.2341156005859375, -0.22339248657226562, -0.21266937255859375, -0.20194625854492188, -0.19122314453125, -0.18050003051757812, -0.16977691650390625, -0.15905380249023438, -0.1483306884765625, -0.13760757446289062, -0.12688446044921875, -0.11616134643554688, -0.105438232421875, -0.09471511840820312, -0.08399200439453125, -0.07326889038085938, -0.0625457763671875, -0.051822662353515625, -0.04109954833984375, -0.030376434326171875, -0.0196533203125, -0.008930206298828125, 0.00179290771484375, 0.012516021728515625, 0.0232391357421875, 0.033962249755859375, 0.04468536376953125, 0.055408477783203125, 0.066131591796875, 0.07685470581054688, 0.08757781982421875, 0.09830093383789062, 0.1090240478515625, 0.11974716186523438, 0.13047027587890625, 0.14119338989257812, 0.15191650390625, 0.16263961791992188, 0.17336273193359375, 0.18408584594726562, 0.1948089599609375, 0.20553207397460938, 0.21625518798828125, 0.22697830200195312, 0.237701416015625, 0.24842453002929688, 0.25914764404296875, 0.2698707580566406, 0.2805938720703125, 0.2913169860839844, 0.30204010009765625, 0.3127632141113281, 0.323486328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 4.0, 9.0, 7.0, 8.0, 10.0, 13.0, 12.0, 19.0, 27.0, 39.0, 38.0, 47.0, 60.0, 92.0, 73.0, 88.0, 78.0, 61.0, 65.0, 43.0, 28.0, 34.0, 18.0, 14.0, 21.0, 16.0, 17.0, 9.0, 8.0, 11.0, 4.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.2666015625, -0.25919151306152344, -0.2517814636230469, -0.2443714141845703, -0.23696136474609375, -0.2295513153076172, -0.22214126586914062, -0.21473121643066406, -0.2073211669921875, -0.19991111755371094, -0.19250106811523438, -0.1850910186767578, -0.17768096923828125, -0.1702709197998047, -0.16286087036132812, -0.15545082092285156, -0.148040771484375, -0.14063072204589844, -0.13322067260742188, -0.1258106231689453, -0.11840057373046875, -0.11099052429199219, -0.10358047485351562, -0.09617042541503906, -0.0887603759765625, -0.08135032653808594, -0.07394027709960938, -0.06653022766113281, -0.05912017822265625, -0.05171012878417969, -0.044300079345703125, -0.03689002990722656, -0.02947998046875, -0.022069931030273438, -0.014659881591796875, -0.0072498321533203125, 0.00016021728515625, 0.0075702667236328125, 0.014980316162109375, 0.022390365600585938, 0.0298004150390625, 0.03721046447753906, 0.044620513916015625, 0.05203056335449219, 0.05944061279296875, 0.06685066223144531, 0.07426071166992188, 0.08167076110839844, 0.089080810546875, 0.09649085998535156, 0.10390090942382812, 0.11131095886230469, 0.11872100830078125, 0.1261310577392578, 0.13354110717773438, 0.14095115661621094, 0.1483612060546875, 0.15577125549316406, 0.16318130493164062, 0.1705913543701172, 0.17800140380859375, 0.1854114532470703, 0.19282150268554688, 0.20023155212402344, 0.2076416015625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 9.0, 27.0, 88.0, 179.0, 290.0, 232.0, 93.0, 35.0, 18.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.70357608795166, -10.484077453613281, -10.264578819274902, -10.045080184936523, -9.825581550598145, -9.606082916259766, -9.386584281921387, -9.167085647583008, -8.947586059570312, -8.728087425231934, -8.508588790893555, -8.289090156555176, -8.069591522216797, -7.850092887878418, -7.630593776702881, -7.411095142364502, -7.191596984863281, -6.972098350524902, -6.752599716186523, -6.5331010818481445, -6.313602447509766, -6.094103813171387, -5.87460470199585, -5.655106067657471, -5.435607433319092, -5.216108798980713, -4.996610164642334, -4.777111530303955, -4.557612419128418, -4.338113784790039, -4.11861515045166, -3.8991165161132812, -3.679617404937744, -3.4601187705993652, -3.2406201362609863, -3.0211212635040283, -2.8016226291656494, -2.5821239948272705, -2.3626251220703125, -2.1431264877319336, -1.9236278533935547, -1.7041292190551758, -1.4846304655075073, -1.2651317119598389, -1.04563307762146, -0.826134443283081, -0.6066356897354126, -0.38713693618774414, -0.16763830184936523, 0.05186039209365845, 0.27135908603668213, 0.4908577799797058, 0.7103564739227295, 0.9298551082611084, 1.1493538618087769, 1.3688526153564453, 1.5883512496948242, 1.8078498840332031, 2.027348518371582, 2.24684739112854, 2.466346025466919, 2.685844659805298, 2.905343532562256, 3.1248421669006348, 3.3443408012390137]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 5.0, 7.0, 9.0, 5.0, 16.0, 15.0, 10.0, 14.0, 21.0, 23.0, 29.0, 30.0, 35.0, 31.0, 52.0, 67.0, 39.0, 69.0, 59.0, 39.0, 44.0, 37.0, 50.0, 36.0, 38.0, 31.0, 33.0, 27.0, 23.0, 17.0, 10.0, 16.0, 4.0, 11.0, 12.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.133335590362549, -3.038327217102051, -2.9433186054229736, -2.8483102321624756, -2.7533018589019775, -2.6582932472229004, -2.5632848739624023, -2.4682765007019043, -2.373267889022827, -2.278259515762329, -2.183250904083252, -2.088242530822754, -1.9932340383529663, -1.8982255458831787, -1.8032171726226807, -1.708208680152893, -1.613200306892395, -1.5181918144226074, -1.4231834411621094, -1.3281749486923218, -1.2331664562225342, -1.1381580829620361, -1.0431495904922485, -0.9481410980224609, -0.8531326651573181, -0.7581242322921753, -0.6631157398223877, -0.5681073069572449, -0.47309884428977966, -0.37809038162231445, -0.28308194875717163, -0.18807345628738403, -0.09306502342224121, 0.001943431794643402, 0.09695188701152802, 0.19196033477783203, 0.28696879744529724, 0.38197726011276245, 0.4769856929779053, 0.5719941854476929, 0.6670026183128357, 0.7620110511779785, 0.8570195436477661, 0.9520279765129089, 1.0470364093780518, 1.1420449018478394, 1.237053394317627, 1.332061767578125, 1.4270702600479126, 1.5220787525177002, 1.6170871257781982, 1.7120956182479858, 1.8071041107177734, 1.9021124839782715, 1.997120976448059, 2.0921294689178467, 2.1871378421783447, 2.2821462154388428, 2.37715482711792, 2.472163200378418, 2.567171573638916, 2.662180185317993, 2.757188558578491, 2.8521971702575684, 2.9472055435180664]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 10.0, 17.0, 20.0, 29.0, 35.0, 69.0, 98.0, 159.0, 391.0, 1915.0, 180569.0, 4003924.0, 5831.0, 621.0, 225.0, 123.0, 82.0, 42.0, 40.0, 22.0, 15.0, 11.0, 7.0, 3.0, 7.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.171875, -2.120391845703125, -2.06890869140625, -2.017425537109375, -1.9659423828125, -1.914459228515625, -1.86297607421875, -1.811492919921875, -1.760009765625, -1.708526611328125, -1.65704345703125, -1.605560302734375, -1.5540771484375, -1.502593994140625, -1.45111083984375, -1.399627685546875, -1.34814453125, -1.296661376953125, -1.24517822265625, -1.193695068359375, -1.1422119140625, -1.090728759765625, -1.03924560546875, -0.987762451171875, -0.936279296875, -0.884796142578125, -0.83331298828125, -0.781829833984375, -0.7303466796875, -0.678863525390625, -0.62738037109375, -0.575897216796875, -0.5244140625, -0.472930908203125, -0.42144775390625, -0.369964599609375, -0.3184814453125, -0.266998291015625, -0.21551513671875, -0.164031982421875, -0.112548828125, -0.061065673828125, -0.00958251953125, 0.041900634765625, 0.0933837890625, 0.144866943359375, 0.19635009765625, 0.247833251953125, 0.29931640625, 0.350799560546875, 0.40228271484375, 0.453765869140625, 0.5052490234375, 0.556732177734375, 0.60821533203125, 0.659698486328125, 0.711181640625, 0.762664794921875, 0.81414794921875, 0.865631103515625, 0.9171142578125, 0.968597412109375, 1.02008056640625, 1.071563720703125, 1.123046875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 7.0, 4.0, 7.0, 10.0, 20.0, 29.0, 17.0, 29.0, 43.0, 41.0, 62.0, 70.0, 74.0, 88.0, 80.0, 71.0, 51.0, 73.0, 55.0, 55.0, 45.0, 22.0, 13.0, 14.0, 4.0, 6.0, 10.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22900390625, -0.21949386596679688, -0.20998382568359375, -0.20047378540039062, -0.1909637451171875, -0.18145370483398438, -0.17194366455078125, -0.16243362426757812, -0.152923583984375, -0.14341354370117188, -0.13390350341796875, -0.12439346313476562, -0.1148834228515625, -0.10537338256835938, -0.09586334228515625, -0.08635330200195312, -0.07684326171875, -0.06733322143554688, -0.05782318115234375, -0.048313140869140625, -0.0388031005859375, -0.029293060302734375, -0.01978302001953125, -0.010272979736328125, -0.000762939453125, 0.008747100830078125, 0.01825714111328125, 0.027767181396484375, 0.0372772216796875, 0.046787261962890625, 0.05629730224609375, 0.06580734252929688, 0.0753173828125, 0.08482742309570312, 0.09433746337890625, 0.10384750366210938, 0.1133575439453125, 0.12286758422851562, 0.13237762451171875, 0.14188766479492188, 0.151397705078125, 0.16090774536132812, 0.17041778564453125, 0.17992782592773438, 0.1894378662109375, 0.19894790649414062, 0.20845794677734375, 0.21796798706054688, 0.22747802734375, 0.23698806762695312, 0.24649810791015625, 0.2560081481933594, 0.2655181884765625, 0.2750282287597656, 0.28453826904296875, 0.2940483093261719, 0.303558349609375, 0.3130683898925781, 0.32257843017578125, 0.3320884704589844, 0.3415985107421875, 0.3511085510253906, 0.36061859130859375, 0.3701286315917969, 0.379638671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 10.0, 15.0, 37.0, 47.0, 85.0, 195.0, 398.0, 861.0, 2178.0, 5719.0, 19369.0, 116851.0, 3031928.0, 944002.0, 53124.0, 12358.0, 4152.0, 1602.0, 674.0, 348.0, 157.0, 69.0, 41.0, 30.0, 14.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5107421875, -0.49517822265625, -0.4796142578125, -0.46405029296875, -0.448486328125, -0.43292236328125, -0.4173583984375, -0.40179443359375, -0.38623046875, -0.37066650390625, -0.3551025390625, -0.33953857421875, -0.323974609375, -0.30841064453125, -0.2928466796875, -0.27728271484375, -0.26171875, -0.24615478515625, -0.2305908203125, -0.21502685546875, -0.199462890625, -0.18389892578125, -0.1683349609375, -0.15277099609375, -0.13720703125, -0.12164306640625, -0.1060791015625, -0.09051513671875, -0.074951171875, -0.05938720703125, -0.0438232421875, -0.02825927734375, -0.0126953125, 0.00286865234375, 0.0184326171875, 0.03399658203125, 0.049560546875, 0.06512451171875, 0.0806884765625, 0.09625244140625, 0.11181640625, 0.12738037109375, 0.1429443359375, 0.15850830078125, 0.174072265625, 0.18963623046875, 0.2052001953125, 0.22076416015625, 0.236328125, 0.25189208984375, 0.2674560546875, 0.28302001953125, 0.298583984375, 0.31414794921875, 0.3297119140625, 0.34527587890625, 0.36083984375, 0.37640380859375, 0.3919677734375, 0.40753173828125, 0.423095703125, 0.43865966796875, 0.4542236328125, 0.46978759765625, 0.4853515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 9.0, 4.0, 7.0, 13.0, 13.0, 8.0, 25.0, 39.0, 70.0, 106.0, 157.0, 273.0, 499.0, 774.0, 818.0, 506.0, 300.0, 171.0, 73.0, 53.0, 25.0, 24.0, 17.0, 15.0, 14.0, 6.0, 9.0, 8.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.35759735107421875, -0.3448333740234375, -0.33206939697265625, -0.319305419921875, -0.30654144287109375, -0.2937774658203125, -0.28101348876953125, -0.26824951171875, -0.25548553466796875, -0.2427215576171875, -0.22995758056640625, -0.217193603515625, -0.20442962646484375, -0.1916656494140625, -0.17890167236328125, -0.1661376953125, -0.15337371826171875, -0.1406097412109375, -0.12784576416015625, -0.115081787109375, -0.10231781005859375, -0.0895538330078125, -0.07678985595703125, -0.06402587890625, -0.05126190185546875, -0.0384979248046875, -0.02573394775390625, -0.012969970703125, -0.00020599365234375, 0.0125579833984375, 0.02532196044921875, 0.0380859375, 0.05084991455078125, 0.0636138916015625, 0.07637786865234375, 0.089141845703125, 0.10190582275390625, 0.1146697998046875, 0.12743377685546875, 0.14019775390625, 0.15296173095703125, 0.1657257080078125, 0.17848968505859375, 0.191253662109375, 0.20401763916015625, 0.2167816162109375, 0.22954559326171875, 0.2423095703125, 0.25507354736328125, 0.2678375244140625, 0.28060150146484375, 0.293365478515625, 0.30612945556640625, 0.3188934326171875, 0.33165740966796875, 0.34442138671875, 0.35718536376953125, 0.3699493408203125, 0.38271331787109375, 0.395477294921875, 0.40824127197265625, 0.4210052490234375, 0.43376922607421875, 0.446533203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 7.0, 4.0, 5.0, 11.0, 28.0, 82.0, 150.0, 221.0, 240.0, 132.0, 63.0, 22.0, 13.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6484222412109375, -5.500408172607422, -5.352394104003906, -5.204380035400391, -5.056365966796875, -4.908351898193359, -4.760337829589844, -4.612323760986328, -4.4643096923828125, -4.316295623779297, -4.168281555175781, -4.020267486572266, -3.87225341796875, -3.7242393493652344, -3.576225519180298, -3.4282114505767822, -3.2801976203918457, -3.13218355178833, -2.9841694831848145, -2.836155414581299, -2.688141345977783, -2.5401272773742676, -2.392113447189331, -2.2440993785858154, -2.0960853099823, -1.9480712413787842, -1.8000571727752686, -1.6520432233810425, -1.5040291547775269, -1.3560150861740112, -1.2080011367797852, -1.0599870681762695, -0.9119727611541748, -0.7639586925506592, -0.6159446835517883, -0.4679306447505951, -0.31991660594940186, -0.17190253734588623, -0.02388852834701538, 0.12412548065185547, 0.2721395492553711, 0.42015358805656433, 0.5681676268577576, 0.7161816358566284, 0.864195704460144, 1.0122097730636597, 1.1602237224578857, 1.3082377910614014, 1.456251859664917, 1.6042659282684326, 1.7522799968719482, 1.9002939462661743, 2.0483078956604004, 2.196321964263916, 2.3443360328674316, 2.4923501014709473, 2.640364170074463, 2.7883782386779785, 2.936392307281494, 3.0844063758850098, 3.2324204444885254, 3.380434513092041, 3.5284483432769775, 3.676462411880493, 3.824476480484009]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 9.0, 8.0, 14.0, 14.0, 22.0, 26.0, 25.0, 34.0, 26.0, 30.0, 41.0, 41.0, 49.0, 52.0, 47.0, 64.0, 44.0, 67.0, 56.0, 53.0, 48.0, 33.0, 35.0, 22.0, 21.0, 28.0, 13.0, 21.0, 10.0, 5.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.9786235094070435, -1.9200031757354736, -1.8613827228546143, -1.8027623891830444, -1.744141936302185, -1.6855216026306152, -1.6269011497497559, -1.568280816078186, -1.5096604824066162, -1.4510401487350464, -1.392419695854187, -1.3337993621826172, -1.2751789093017578, -1.216558575630188, -1.1579382419586182, -1.0993177890777588, -1.0406973361968994, -0.9820769429206848, -0.9234565496444702, -0.8648362159729004, -0.806215763092041, -0.7475954294204712, -0.6889750361442566, -0.630354642868042, -0.5717342495918274, -0.5131138563156128, -0.4544934630393982, -0.395873099565506, -0.3372527062892914, -0.2786323130130768, -0.22001194953918457, -0.16139155626296997, -0.10277104377746582, -0.04415065795183182, 0.014469727873802185, 0.07309010624885559, 0.1317104995250702, 0.1903308928012848, 0.248951256275177, 0.3075716495513916, 0.3661920428276062, 0.4248124361038208, 0.4834328293800354, 0.54205322265625, 0.6006735563278198, 0.6592940092086792, 0.717914342880249, 0.7765347361564636, 0.8351551294326782, 0.8937755227088928, 0.9523959159851074, 1.0110162496566772, 1.0696367025375366, 1.1282570362091064, 1.1868774890899658, 1.2454978227615356, 1.3041181564331055, 1.3627384901046753, 1.4213589429855347, 1.4799792766571045, 1.5385997295379639, 1.5972200632095337, 1.6558403968811035, 1.714460849761963, 1.7730813026428223]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 10.0, 6.0, 16.0, 27.0, 26.0, 47.0, 55.0, 121.0, 202.0, 422.0, 723.0, 1551.0, 3588.0, 8730.0, 23930.0, 74516.0, 271267.0, 455625.0, 141302.0, 41583.0, 14602.0, 5407.0, 2433.0, 1082.0, 571.0, 297.0, 166.0, 92.0, 64.0, 35.0, 27.0, 10.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.347900390625, -0.33676910400390625, -0.3256378173828125, -0.31450653076171875, -0.303375244140625, -0.29224395751953125, -0.2811126708984375, -0.26998138427734375, -0.25885009765625, -0.24771881103515625, -0.2365875244140625, -0.22545623779296875, -0.214324951171875, -0.20319366455078125, -0.1920623779296875, -0.18093109130859375, -0.1697998046875, -0.15866851806640625, -0.1475372314453125, -0.13640594482421875, -0.125274658203125, -0.11414337158203125, -0.1030120849609375, -0.09188079833984375, -0.08074951171875, -0.06961822509765625, -0.0584869384765625, -0.04735565185546875, -0.036224365234375, -0.02509307861328125, -0.0139617919921875, -0.00283050537109375, 0.00830078125, 0.01943206787109375, 0.0305633544921875, 0.04169464111328125, 0.052825927734375, 0.06395721435546875, 0.0750885009765625, 0.08621978759765625, 0.09735107421875, 0.10848236083984375, 0.1196136474609375, 0.13074493408203125, 0.141876220703125, 0.15300750732421875, 0.1641387939453125, 0.17527008056640625, 0.1864013671875, 0.19753265380859375, 0.2086639404296875, 0.21979522705078125, 0.230926513671875, 0.24205780029296875, 0.2531890869140625, 0.26432037353515625, 0.27545166015625, 0.28658294677734375, 0.2977142333984375, 0.30884552001953125, 0.319976806640625, 0.33110809326171875, 0.3422393798828125, 0.35337066650390625, 0.364501953125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 4.0, 16.0, 10.0, 16.0, 15.0, 28.0, 19.0, 35.0, 34.0, 32.0, 43.0, 38.0, 51.0, 41.0, 51.0, 60.0, 46.0, 62.0, 44.0, 43.0, 43.0, 29.0, 41.0, 26.0, 30.0, 17.0, 20.0, 27.0, 19.0, 9.0, 10.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1829833984375, -0.17661285400390625, -0.1702423095703125, -0.16387176513671875, -0.157501220703125, -0.15113067626953125, -0.1447601318359375, -0.13838958740234375, -0.13201904296875, -0.12564849853515625, -0.1192779541015625, -0.11290740966796875, -0.106536865234375, -0.10016632080078125, -0.0937957763671875, -0.08742523193359375, -0.0810546875, -0.07468414306640625, -0.0683135986328125, -0.06194305419921875, -0.055572509765625, -0.04920196533203125, -0.0428314208984375, -0.03646087646484375, -0.03009033203125, -0.02371978759765625, -0.0173492431640625, -0.01097869873046875, -0.004608154296875, 0.00176239013671875, 0.0081329345703125, 0.01450347900390625, 0.0208740234375, 0.02724456787109375, 0.0336151123046875, 0.03998565673828125, 0.046356201171875, 0.05272674560546875, 0.0590972900390625, 0.06546783447265625, 0.07183837890625, 0.07820892333984375, 0.0845794677734375, 0.09095001220703125, 0.097320556640625, 0.10369110107421875, 0.1100616455078125, 0.11643218994140625, 0.122802734375, 0.12917327880859375, 0.1355438232421875, 0.14191436767578125, 0.148284912109375, 0.15465545654296875, 0.1610260009765625, 0.16739654541015625, 0.17376708984375, 0.18013763427734375, 0.1865081787109375, 0.19287872314453125, 0.199249267578125, 0.20561981201171875, 0.2119903564453125, 0.21836090087890625, 0.2247314453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 11.0, 13.0, 15.0, 26.0, 29.0, 62.0, 69.0, 133.0, 246.0, 482.0, 995.0, 2384.0, 9345.0, 62159.0, 696414.0, 242732.0, 25353.0, 4847.0, 1639.0, 723.0, 329.0, 197.0, 108.0, 88.0, 32.0, 25.0, 22.0, 13.0, 7.0, 11.0, 4.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.77685546875, -0.7562942504882812, -0.7357330322265625, -0.7151718139648438, -0.694610595703125, -0.6740493774414062, -0.6534881591796875, -0.6329269409179688, -0.61236572265625, -0.5918045043945312, -0.5712432861328125, -0.5506820678710938, -0.530120849609375, -0.5095596313476562, -0.4889984130859375, -0.46843719482421875, -0.4478759765625, -0.42731475830078125, -0.4067535400390625, -0.38619232177734375, -0.365631103515625, -0.34506988525390625, -0.3245086669921875, -0.30394744873046875, -0.28338623046875, -0.26282501220703125, -0.2422637939453125, -0.22170257568359375, -0.201141357421875, -0.18058013916015625, -0.1600189208984375, -0.13945770263671875, -0.118896484375, -0.09833526611328125, -0.0777740478515625, -0.05721282958984375, -0.036651611328125, -0.01609039306640625, 0.0044708251953125, 0.02503204345703125, 0.04559326171875, 0.06615447998046875, 0.0867156982421875, 0.10727691650390625, 0.127838134765625, 0.14839935302734375, 0.1689605712890625, 0.18952178955078125, 0.2100830078125, 0.23064422607421875, 0.2512054443359375, 0.27176666259765625, 0.292327880859375, 0.31288909912109375, 0.3334503173828125, 0.35401153564453125, 0.37457275390625, 0.39513397216796875, 0.4156951904296875, 0.43625640869140625, 0.456817626953125, 0.47737884521484375, 0.4979400634765625, 0.5185012817382812, 0.5390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 2.0, 9.0, 11.0, 8.0, 9.0, 15.0, 16.0, 14.0, 17.0, 19.0, 22.0, 21.0, 24.0, 26.0, 31.0, 31.0, 37.0, 36.0, 46.0, 36.0, 40.0, 50.0, 40.0, 42.0, 35.0, 31.0, 39.0, 35.0, 39.0, 41.0, 27.0, 23.0, 22.0, 14.0, 15.0, 9.0, 12.0, 11.0, 9.0, 5.0, 12.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.7177734375, -0.6971664428710938, -0.6765594482421875, -0.6559524536132812, -0.635345458984375, -0.6147384643554688, -0.5941314697265625, -0.5735244750976562, -0.55291748046875, -0.5323104858398438, -0.5117034912109375, -0.49109649658203125, -0.470489501953125, -0.44988250732421875, -0.4292755126953125, -0.40866851806640625, -0.3880615234375, -0.36745452880859375, -0.3468475341796875, -0.32624053955078125, -0.305633544921875, -0.28502655029296875, -0.2644195556640625, -0.24381256103515625, -0.22320556640625, -0.20259857177734375, -0.1819915771484375, -0.16138458251953125, -0.140777587890625, -0.12017059326171875, -0.0995635986328125, -0.07895660400390625, -0.058349609375, -0.03774261474609375, -0.0171356201171875, 0.00347137451171875, 0.024078369140625, 0.04468536376953125, 0.0652923583984375, 0.08589935302734375, 0.10650634765625, 0.12711334228515625, 0.1477203369140625, 0.16832733154296875, 0.188934326171875, 0.20954132080078125, 0.2301483154296875, 0.25075531005859375, 0.2713623046875, 0.29196929931640625, 0.3125762939453125, 0.33318328857421875, 0.353790283203125, 0.37439727783203125, 0.3950042724609375, 0.41561126708984375, 0.43621826171875, 0.45682525634765625, 0.4774322509765625, 0.49803924560546875, 0.518646240234375, 0.5392532348632812, 0.5598602294921875, 0.5804672241210938, 0.60107421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 6.0, 7.0, 18.0, 34.0, 54.0, 86.0, 139.0, 417.0, 1063.0, 3897.0, 24610.0, 709874.0, 287834.0, 15996.0, 2943.0, 838.0, 337.0, 162.0, 82.0, 39.0, 30.0, 21.0, 20.0, 8.0, 7.0, 7.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.53125, -0.5160293579101562, -0.5008087158203125, -0.48558807373046875, -0.470367431640625, -0.45514678955078125, -0.4399261474609375, -0.42470550537109375, -0.40948486328125, -0.39426422119140625, -0.3790435791015625, -0.36382293701171875, -0.348602294921875, -0.33338165283203125, -0.3181610107421875, -0.30294036865234375, -0.2877197265625, -0.27249908447265625, -0.2572784423828125, -0.24205780029296875, -0.226837158203125, -0.21161651611328125, -0.1963958740234375, -0.18117523193359375, -0.16595458984375, -0.15073394775390625, -0.1355133056640625, -0.12029266357421875, -0.105072021484375, -0.08985137939453125, -0.0746307373046875, -0.05941009521484375, -0.044189453125, -0.02896881103515625, -0.0137481689453125, 0.00147247314453125, 0.016693115234375, 0.03191375732421875, 0.0471343994140625, 0.06235504150390625, 0.07757568359375, 0.09279632568359375, 0.1080169677734375, 0.12323760986328125, 0.138458251953125, 0.15367889404296875, 0.1688995361328125, 0.18412017822265625, 0.1993408203125, 0.21456146240234375, 0.2297821044921875, 0.24500274658203125, 0.260223388671875, 0.27544403076171875, 0.2906646728515625, 0.30588531494140625, 0.32110595703125, 0.33632659912109375, 0.3515472412109375, 0.36676788330078125, 0.381988525390625, 0.39720916748046875, 0.4124298095703125, 0.42765045166015625, 0.44287109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 12.0, 19.0, 24.0, 32.0, 57.0, 83.0, 183.0, 173.0, 140.0, 88.0, 53.0, 34.0, 16.0, 18.0, 9.0, 10.0, 8.0, 10.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594989776611328e-05, -8.281227201223373e-05, -7.967464625835419e-05, -7.653702050447464e-05, -7.339939475059509e-05, -7.026176899671555e-05, -6.7124143242836e-05, -6.398651748895645e-05, -6.0848891735076904e-05, -5.771126598119736e-05, -5.457364022731781e-05, -5.143601447343826e-05, -4.8298388719558716e-05, -4.516076296567917e-05, -4.202313721179962e-05, -3.8885511457920074e-05, -3.574788570404053e-05, -3.261025995016098e-05, -2.9472634196281433e-05, -2.6335008442401886e-05, -2.319738268852234e-05, -2.0059756934642792e-05, -1.6922131180763245e-05, -1.3784505426883698e-05, -1.064687967300415e-05, -7.509253919124603e-06, -4.371628165245056e-06, -1.234002411365509e-06, 1.903623342514038e-06, 5.041249096393585e-06, 8.178874850273132e-06, 1.131650060415268e-05, 1.4454126358032227e-05, 1.7591752111911774e-05, 2.072937786579132e-05, 2.3867003619670868e-05, 2.7004629373550415e-05, 3.0142255127429962e-05, 3.327988088130951e-05, 3.6417506635189056e-05, 3.9555132389068604e-05, 4.269275814294815e-05, 4.58303838968277e-05, 4.8968009650707245e-05, 5.210563540458679e-05, 5.524326115846634e-05, 5.8380886912345886e-05, 6.151851266622543e-05, 6.465613842010498e-05, 6.779376417398453e-05, 7.093138992786407e-05, 7.406901568174362e-05, 7.720664143562317e-05, 8.034426718950272e-05, 8.348189294338226e-05, 8.661951869726181e-05, 8.975714445114136e-05, 9.28947702050209e-05, 9.603239595890045e-05, 9.917002171278e-05, 0.00010230764746665955, 0.00010544527322053909, 0.00010858289897441864, 0.00011172052472829819, 0.00011485815048217773]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 13.0, 8.0, 7.0, 12.0, 28.0, 37.0, 56.0, 108.0, 156.0, 332.0, 726.0, 1681.0, 4960.0, 21746.0, 238194.0, 724500.0, 43832.0, 7871.0, 2379.0, 929.0, 436.0, 210.0, 107.0, 70.0, 45.0, 33.0, 14.0, 17.0, 12.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.412353515625, -0.39992523193359375, -0.3874969482421875, -0.37506866455078125, -0.362640380859375, -0.35021209716796875, -0.3377838134765625, -0.32535552978515625, -0.31292724609375, -0.30049896240234375, -0.2880706787109375, -0.27564239501953125, -0.263214111328125, -0.25078582763671875, -0.2383575439453125, -0.22592926025390625, -0.2135009765625, -0.20107269287109375, -0.1886444091796875, -0.17621612548828125, -0.163787841796875, -0.15135955810546875, -0.1389312744140625, -0.12650299072265625, -0.11407470703125, -0.10164642333984375, -0.0892181396484375, -0.07678985595703125, -0.064361572265625, -0.05193328857421875, -0.0395050048828125, -0.02707672119140625, -0.0146484375, -0.00222015380859375, 0.0102081298828125, 0.02263641357421875, 0.035064697265625, 0.04749298095703125, 0.0599212646484375, 0.07234954833984375, 0.08477783203125, 0.09720611572265625, 0.1096343994140625, 0.12206268310546875, 0.134490966796875, 0.14691925048828125, 0.1593475341796875, 0.17177581787109375, 0.1842041015625, 0.19663238525390625, 0.2090606689453125, 0.22148895263671875, 0.233917236328125, 0.24634552001953125, 0.2587738037109375, 0.27120208740234375, 0.28363037109375, 0.29605865478515625, 0.3084869384765625, 0.32091522216796875, 0.333343505859375, 0.34577178955078125, 0.3582000732421875, 0.37062835693359375, 0.383056640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 4.0, 11.0, 3.0, 8.0, 15.0, 16.0, 26.0, 32.0, 62.0, 78.0, 118.0, 149.0, 130.0, 117.0, 74.0, 45.0, 34.0, 22.0, 9.0, 13.0, 7.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272216796875, -0.26125335693359375, -0.2502899169921875, -0.23932647705078125, -0.228363037109375, -0.21739959716796875, -0.2064361572265625, -0.19547271728515625, -0.18450927734375, -0.17354583740234375, -0.1625823974609375, -0.15161895751953125, -0.140655517578125, -0.12969207763671875, -0.1187286376953125, -0.10776519775390625, -0.0968017578125, -0.08583831787109375, -0.0748748779296875, -0.06391143798828125, -0.052947998046875, -0.04198455810546875, -0.0310211181640625, -0.02005767822265625, -0.00909423828125, 0.00186920166015625, 0.0128326416015625, 0.02379608154296875, 0.034759521484375, 0.04572296142578125, 0.0566864013671875, 0.06764984130859375, 0.07861328125, 0.08957672119140625, 0.1005401611328125, 0.11150360107421875, 0.122467041015625, 0.13343048095703125, 0.1443939208984375, 0.15535736083984375, 0.16632080078125, 0.17728424072265625, 0.1882476806640625, 0.19921112060546875, 0.210174560546875, 0.22113800048828125, 0.2321014404296875, 0.24306488037109375, 0.2540283203125, 0.26499176025390625, 0.2759552001953125, 0.28691864013671875, 0.297882080078125, 0.30884552001953125, 0.3198089599609375, 0.33077239990234375, 0.34173583984375, 0.35269927978515625, 0.3636627197265625, 0.37462615966796875, 0.385589599609375, 0.39655303955078125, 0.4075164794921875, 0.41847991943359375, 0.429443359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 7.0, 7.0, 12.0, 11.0, 31.0, 47.0, 130.0, 173.0, 234.0, 174.0, 85.0, 48.0, 18.0, 11.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3663740158081055, -4.20626163482666, -4.046149730682373, -3.8860373497009277, -3.7259252071380615, -3.5658130645751953, -3.40570068359375, -3.245588541030884, -3.0854763984680176, -2.9253642559051514, -2.765252113342285, -2.60513973236084, -2.4450275897979736, -2.2849154472351074, -2.124803066253662, -1.964690923690796, -1.8045787811279297, -1.6444666385650635, -1.4843543767929077, -1.324242115020752, -1.1641299724578857, -1.0040178298950195, -0.8439055681228638, -0.683793306350708, -0.5236811637878418, -0.3635689616203308, -0.20345675945281982, -0.04334455728530884, 0.11676764488220215, 0.27687984704971313, 0.4369920492172241, 0.5971043109893799, 0.7572159767150879, 0.9173281788825989, 1.0774403810501099, 1.2375526428222656, 1.3976647853851318, 1.557776927947998, 1.7178891897201538, 1.8780014514923096, 2.038113594055176, 2.198225736618042, 2.358337879180908, 2.5184502601623535, 2.6785624027252197, 2.838674545288086, 2.9987869262695312, 3.1588990688323975, 3.3190112113952637, 3.47912335395813, 3.639235496520996, 3.7993478775024414, 3.9594600200653076, 4.119572162628174, 4.279684543609619, 4.439796447753906, 4.599908828735352, 4.760021209716797, 4.920133113861084, 5.080245494842529, 5.240357398986816, 5.400469779968262, 5.560582160949707, 5.720694541931152, 5.8808064460754395]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 15.0, 12.0, 17.0, 19.0, 30.0, 35.0, 42.0, 47.0, 50.0, 79.0, 90.0, 84.0, 86.0, 56.0, 55.0, 77.0, 46.0, 36.0, 26.0, 27.0, 16.0, 18.0, 11.0, 6.0, 7.0, 4.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0773141384124756, -2.92854380607605, -2.779773473739624, -2.6310031414031982, -2.4822328090667725, -2.3334624767303467, -2.184692144393921, -2.035921812057495, -1.8871514797210693, -1.7383811473846436, -1.5896108150482178, -1.440840482711792, -1.2920701503753662, -1.1432998180389404, -0.9945294857025146, -0.8457591533660889, -0.6969888210296631, -0.5482184886932373, -0.3994481563568115, -0.25067782402038574, -0.10190749168395996, 0.04686284065246582, 0.1956331729888916, 0.3444035053253174, 0.49317383766174316, 0.641944169998169, 0.7907145023345947, 0.9394848346710205, 1.0882551670074463, 1.237025499343872, 1.3857958316802979, 1.5345661640167236, 1.6833362579345703, 1.832106590270996, 1.9808769226074219, 2.1296472549438477, 2.2784175872802734, 2.427187919616699, 2.575958251953125, 2.724728584289551, 2.8734989166259766, 3.0222692489624023, 3.171039581298828, 3.319809913635254, 3.4685802459716797, 3.6173505783081055, 3.7661209106445312, 3.914891242980957, 4.063661575317383, 4.212431907653809, 4.361202239990234, 4.50997257232666, 4.658742904663086, 4.807513236999512, 4.9562835693359375, 5.105053901672363, 5.253824234008789, 5.402594566345215, 5.551364898681641, 5.700135231018066, 5.848905563354492, 5.997675895690918, 6.146446228027344, 6.2952165603637695, 6.443986892700195]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 8.0, 16.0, 16.0, 24.0, 41.0, 65.0, 106.0, 184.0, 401.0, 910.0, 2078.0, 4655.0, 12570.0, 56795.0, 819648.0, 3017606.0, 241315.0, 26130.0, 6839.0, 2523.0, 1079.0, 525.0, 299.0, 151.0, 103.0, 62.0, 42.0, 17.0, 16.0, 10.0, 14.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2733001708984375, -0.260467529296875, -0.2476348876953125, -0.23480224609375, -0.2219696044921875, -0.209136962890625, -0.1963043212890625, -0.1834716796875, -0.1706390380859375, -0.157806396484375, -0.1449737548828125, -0.13214111328125, -0.1193084716796875, -0.106475830078125, -0.0936431884765625, -0.080810546875, -0.0679779052734375, -0.055145263671875, -0.0423126220703125, -0.02947998046875, -0.0166473388671875, -0.003814697265625, 0.0090179443359375, 0.0218505859375, 0.0346832275390625, 0.047515869140625, 0.0603485107421875, 0.07318115234375, 0.0860137939453125, 0.098846435546875, 0.1116790771484375, 0.12451171875, 0.1373443603515625, 0.150177001953125, 0.1630096435546875, 0.17584228515625, 0.1886749267578125, 0.201507568359375, 0.2143402099609375, 0.2271728515625, 0.2400054931640625, 0.252838134765625, 0.2656707763671875, 0.27850341796875, 0.2913360595703125, 0.304168701171875, 0.3170013427734375, 0.329833984375, 0.3426666259765625, 0.355499267578125, 0.3683319091796875, 0.38116455078125, 0.3939971923828125, 0.406829833984375, 0.4196624755859375, 0.4324951171875, 0.4453277587890625, 0.458160400390625, 0.4709930419921875, 0.48382568359375, 0.4966583251953125, 0.509490966796875, 0.5223236083984375, 0.53515625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 7.0, 4.0, 13.0, 29.0, 33.0, 53.0, 81.0, 94.0, 98.0, 128.0, 131.0, 94.0, 90.0, 68.0, 32.0, 35.0, 13.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1827392578125, -0.1683788299560547, -0.15401840209960938, -0.13965797424316406, -0.12529754638671875, -0.11093711853027344, -0.09657669067382812, -0.08221626281738281, -0.0678558349609375, -0.05349540710449219, -0.039134979248046875, -0.024774551391601562, -0.01041412353515625, 0.0039463043212890625, 0.018306732177734375, 0.03266716003417969, 0.047027587890625, 0.06138801574707031, 0.07574844360351562, 0.09010887145996094, 0.10446929931640625, 0.11882972717285156, 0.13319015502929688, 0.1475505828857422, 0.1619110107421875, 0.1762714385986328, 0.19063186645507812, 0.20499229431152344, 0.21935272216796875, 0.23371315002441406, 0.24807357788085938, 0.2624340057373047, 0.27679443359375, 0.2911548614501953, 0.3055152893066406, 0.31987571716308594, 0.33423614501953125, 0.34859657287597656, 0.3629570007324219, 0.3773174285888672, 0.3916778564453125, 0.4060382843017578, 0.4203987121582031, 0.43475914001464844, 0.44911956787109375, 0.46347999572753906, 0.4778404235839844, 0.4922008514404297, 0.506561279296875, 0.5209217071533203, 0.5352821350097656, 0.5496425628662109, 0.5640029907226562, 0.5783634185791016, 0.5927238464355469, 0.6070842742919922, 0.6214447021484375, 0.6358051300048828, 0.6501655578613281, 0.6645259857177734, 0.6788864135742188, 0.6932468414306641, 0.7076072692871094, 0.7219676971435547, 0.736328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 3.0, 10.0, 8.0, 17.0, 19.0, 23.0, 33.0, 63.0, 117.0, 161.0, 267.0, 483.0, 828.0, 1686.0, 3631.0, 8526.0, 24040.0, 89949.0, 791543.0, 2914278.0, 278718.0, 51885.0, 15847.0, 6214.0, 2750.0, 1347.0, 732.0, 409.0, 245.0, 160.0, 94.0, 57.0, 35.0, 26.0, 21.0, 13.0, 11.0, 10.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.360595703125, -0.3490753173828125, -0.337554931640625, -0.3260345458984375, -0.31451416015625, -0.3029937744140625, -0.291473388671875, -0.2799530029296875, -0.2684326171875, -0.2569122314453125, -0.245391845703125, -0.2338714599609375, -0.22235107421875, -0.2108306884765625, -0.199310302734375, -0.1877899169921875, -0.17626953125, -0.1647491455078125, -0.153228759765625, -0.1417083740234375, -0.13018798828125, -0.1186676025390625, -0.107147216796875, -0.0956268310546875, -0.0841064453125, -0.0725860595703125, -0.061065673828125, -0.0495452880859375, -0.03802490234375, -0.0265045166015625, -0.014984130859375, -0.0034637451171875, 0.008056640625, 0.0195770263671875, 0.031097412109375, 0.0426177978515625, 0.05413818359375, 0.0656585693359375, 0.077178955078125, 0.0886993408203125, 0.1002197265625, 0.1117401123046875, 0.123260498046875, 0.1347808837890625, 0.14630126953125, 0.1578216552734375, 0.169342041015625, 0.1808624267578125, 0.1923828125, 0.2039031982421875, 0.215423583984375, 0.2269439697265625, 0.23846435546875, 0.2499847412109375, 0.261505126953125, 0.2730255126953125, 0.2845458984375, 0.2960662841796875, 0.307586669921875, 0.3191070556640625, 0.33062744140625, 0.3421478271484375, 0.353668212890625, 0.3651885986328125, 0.376708984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 5.0, 8.0, 7.0, 4.0, 15.0, 15.0, 16.0, 19.0, 26.0, 27.0, 36.0, 71.0, 85.0, 135.0, 231.0, 426.0, 593.0, 706.0, 533.0, 352.0, 259.0, 140.0, 106.0, 57.0, 40.0, 38.0, 20.0, 22.0, 15.0, 12.0, 10.0, 11.0, 8.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4453125, -0.43160247802734375, -0.4178924560546875, -0.40418243408203125, -0.390472412109375, -0.37676239013671875, -0.3630523681640625, -0.34934234619140625, -0.33563232421875, -0.32192230224609375, -0.3082122802734375, -0.29450225830078125, -0.280792236328125, -0.26708221435546875, -0.2533721923828125, -0.23966217041015625, -0.2259521484375, -0.21224212646484375, -0.1985321044921875, -0.18482208251953125, -0.171112060546875, -0.15740203857421875, -0.1436920166015625, -0.12998199462890625, -0.11627197265625, -0.10256195068359375, -0.0888519287109375, -0.07514190673828125, -0.061431884765625, -0.04772186279296875, -0.0340118408203125, -0.02030181884765625, -0.006591796875, 0.00711822509765625, 0.0208282470703125, 0.03453826904296875, 0.048248291015625, 0.06195831298828125, 0.0756683349609375, 0.08937835693359375, 0.10308837890625, 0.11679840087890625, 0.1305084228515625, 0.14421844482421875, 0.157928466796875, 0.17163848876953125, 0.1853485107421875, 0.19905853271484375, 0.2127685546875, 0.22647857666015625, 0.2401885986328125, 0.25389862060546875, 0.267608642578125, 0.28131866455078125, 0.2950286865234375, 0.30873870849609375, 0.32244873046875, 0.33615875244140625, 0.3498687744140625, 0.36357879638671875, 0.377288818359375, 0.39099884033203125, 0.4047088623046875, 0.41841888427734375, 0.43212890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 13.0, 36.0, 75.0, 175.0, 255.0, 200.0, 147.0, 44.0, 20.0, 11.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.917888164520264, -7.71876859664917, -7.519649028778076, -7.320529460906982, -7.121409893035889, -6.922290325164795, -6.723170757293701, -6.524051189422607, -6.324931621551514, -6.12581205368042, -5.926692485809326, -5.727572917938232, -5.528453350067139, -5.329333782196045, -5.130214214324951, -4.931094646453857, -4.731975078582764, -4.53285551071167, -4.333735942840576, -4.134616374969482, -3.9354968070983887, -3.736377239227295, -3.537257671356201, -3.3381381034851074, -3.1390185356140137, -2.93989896774292, -2.740779399871826, -2.5416598320007324, -2.3425402641296387, -2.143420696258545, -1.9443011283874512, -1.7451815605163574, -1.5460615158081055, -1.3469419479370117, -1.147822380065918, -0.9487028121948242, -0.7495832443237305, -0.5504636764526367, -0.35134410858154297, -0.15222454071044922, 0.04689502716064453, 0.24601459503173828, 0.44513416290283203, 0.6442537307739258, 0.8433732986450195, 1.0424928665161133, 1.241612434387207, 1.4407320022583008, 1.6398515701293945, 1.8389711380004883, 2.038090705871582, 2.237210273742676, 2.4363298416137695, 2.6354494094848633, 2.834568977355957, 3.033688545227051, 3.2328081130981445, 3.4319276809692383, 3.631047248840332, 3.830166816711426, 4.0292863845825195, 4.228405952453613, 4.427525520324707, 4.626645088195801, 4.8257646560668945]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 5.0, 13.0, 19.0, 27.0, 41.0, 48.0, 47.0, 58.0, 63.0, 72.0, 88.0, 83.0, 76.0, 56.0, 70.0, 62.0, 38.0, 28.0, 32.0, 29.0, 16.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.794748783111572, -5.671706676483154, -5.548664093017578, -5.42562198638916, -5.302579879760742, -5.179537296295166, -5.056495189666748, -4.93345308303833, -4.810410499572754, -4.687368392944336, -4.56432580947876, -4.441283702850342, -4.318241596221924, -4.195199012756348, -4.07215690612793, -3.9491145610809326, -3.8260724544525146, -3.7030301094055176, -3.5799880027770996, -3.4569456577301025, -3.3339033126831055, -3.2108612060546875, -3.0878188610076904, -2.9647765159606934, -2.8417344093322754, -2.7186920642852783, -2.5956499576568604, -2.4726076126098633, -2.349565267562866, -2.226522922515869, -2.103480815887451, -1.980438470840454, -1.857396125793457, -1.7343538999557495, -1.6113115549087524, -1.488269329071045, -1.3652269840240479, -1.2421847581863403, -1.1191425323486328, -0.9961002469062805, -0.8730579614639282, -0.7500156760215759, -0.6269733905792236, -0.5039311647415161, -0.3808888792991638, -0.2578465938568115, -0.134804368019104, -0.011762082576751709, 0.11128020286560059, 0.2343224734067917, 0.3573647439479828, 0.4804069995880127, 0.603449285030365, 0.7264915704727173, 0.8495337963104248, 0.9725760817527771, 1.0956183671951294, 1.218660593032837, 1.341702938079834, 1.4647451639175415, 1.587787389755249, 1.710829734802246, 1.8338719606399536, 1.9569141864776611, 2.079956531524658]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 7.0, 2.0, 9.0, 15.0, 29.0, 27.0, 43.0, 86.0, 116.0, 253.0, 445.0, 887.0, 1848.0, 4329.0, 11021.0, 29106.0, 79720.0, 220329.0, 388394.0, 197557.0, 70960.0, 26049.0, 9787.0, 4044.0, 1713.0, 806.0, 413.0, 213.0, 136.0, 93.0, 47.0, 28.0, 22.0, 9.0, 6.0, 4.0, 0.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.345947265625, -0.33670806884765625, -0.3274688720703125, -0.31822967529296875, -0.308990478515625, -0.29975128173828125, -0.2905120849609375, -0.28127288818359375, -0.27203369140625, -0.26279449462890625, -0.2535552978515625, -0.24431610107421875, -0.235076904296875, -0.22583770751953125, -0.2165985107421875, -0.20735931396484375, -0.1981201171875, -0.18888092041015625, -0.1796417236328125, -0.17040252685546875, -0.161163330078125, -0.15192413330078125, -0.1426849365234375, -0.13344573974609375, -0.12420654296875, -0.11496734619140625, -0.1057281494140625, -0.09648895263671875, -0.087249755859375, -0.07801055908203125, -0.0687713623046875, -0.05953216552734375, -0.05029296875, -0.04105377197265625, -0.0318145751953125, -0.02257537841796875, -0.013336181640625, -0.00409698486328125, 0.0051422119140625, 0.01438140869140625, 0.02362060546875, 0.03285980224609375, 0.0420989990234375, 0.05133819580078125, 0.060577392578125, 0.06981658935546875, 0.0790557861328125, 0.08829498291015625, 0.0975341796875, 0.10677337646484375, 0.1160125732421875, 0.12525177001953125, 0.134490966796875, 0.14373016357421875, 0.1529693603515625, 0.16220855712890625, 0.17144775390625, 0.18068695068359375, 0.1899261474609375, 0.19916534423828125, 0.208404541015625, 0.21764373779296875, 0.2268829345703125, 0.23612213134765625, 0.245361328125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 3.0, 12.0, 16.0, 9.0, 18.0, 16.0, 25.0, 36.0, 31.0, 40.0, 45.0, 51.0, 52.0, 62.0, 49.0, 56.0, 44.0, 49.0, 44.0, 56.0, 43.0, 43.0, 31.0, 28.0, 26.0, 19.0, 14.0, 15.0, 16.0, 13.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.15703773498535156, -0.15062332153320312, -0.1442089080810547, -0.13779449462890625, -0.1313800811767578, -0.12496566772460938, -0.11855125427246094, -0.1121368408203125, -0.10572242736816406, -0.09930801391601562, -0.09289360046386719, -0.08647918701171875, -0.08006477355957031, -0.07365036010742188, -0.06723594665527344, -0.060821533203125, -0.05440711975097656, -0.047992706298828125, -0.04157829284667969, -0.03516387939453125, -0.028749465942382812, -0.022335052490234375, -0.015920639038085938, -0.0095062255859375, -0.0030918121337890625, 0.003322601318359375, 0.009737014770507812, 0.01615142822265625, 0.022565841674804688, 0.028980255126953125, 0.03539466857910156, 0.04180908203125, 0.04822349548339844, 0.054637908935546875, 0.06105232238769531, 0.06746673583984375, 0.07388114929199219, 0.08029556274414062, 0.08670997619628906, 0.0931243896484375, 0.09953880310058594, 0.10595321655273438, 0.11236763000488281, 0.11878204345703125, 0.1251964569091797, 0.13161087036132812, 0.13802528381347656, 0.144439697265625, 0.15085411071777344, 0.15726852416992188, 0.1636829376220703, 0.17009735107421875, 0.1765117645263672, 0.18292617797851562, 0.18934059143066406, 0.1957550048828125, 0.20216941833496094, 0.20858383178710938, 0.2149982452392578, 0.22141265869140625, 0.2278270721435547, 0.23424148559570312, 0.24065589904785156, 0.2470703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 16.0, 18.0, 23.0, 35.0, 37.0, 67.0, 111.0, 158.0, 204.0, 296.0, 464.0, 829.0, 1508.0, 3784.0, 16036.0, 167405.0, 775045.0, 67802.0, 8891.0, 2624.0, 1296.0, 656.0, 384.0, 284.0, 178.0, 124.0, 73.0, 67.0, 35.0, 32.0, 21.0, 13.0, 12.0, 4.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7275390625, -0.704315185546875, -0.68109130859375, -0.657867431640625, -0.6346435546875, -0.611419677734375, -0.58819580078125, -0.564971923828125, -0.541748046875, -0.518524169921875, -0.49530029296875, -0.472076416015625, -0.4488525390625, -0.425628662109375, -0.40240478515625, -0.379180908203125, -0.35595703125, -0.332733154296875, -0.30950927734375, -0.286285400390625, -0.2630615234375, -0.239837646484375, -0.21661376953125, -0.193389892578125, -0.170166015625, -0.146942138671875, -0.12371826171875, -0.100494384765625, -0.0772705078125, -0.054046630859375, -0.03082275390625, -0.007598876953125, 0.015625, 0.038848876953125, 0.06207275390625, 0.085296630859375, 0.1085205078125, 0.131744384765625, 0.15496826171875, 0.178192138671875, 0.201416015625, 0.224639892578125, 0.24786376953125, 0.271087646484375, 0.2943115234375, 0.317535400390625, 0.34075927734375, 0.363983154296875, 0.38720703125, 0.410430908203125, 0.43365478515625, 0.456878662109375, 0.4801025390625, 0.503326416015625, 0.52655029296875, 0.549774169921875, 0.572998046875, 0.596221923828125, 0.61944580078125, 0.642669677734375, 0.6658935546875, 0.689117431640625, 0.71234130859375, 0.735565185546875, 0.7587890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 4.0, 9.0, 4.0, 10.0, 6.0, 4.0, 11.0, 14.0, 14.0, 23.0, 23.0, 22.0, 30.0, 36.0, 42.0, 36.0, 39.0, 37.0, 36.0, 55.0, 34.0, 49.0, 50.0, 36.0, 47.0, 31.0, 37.0, 25.0, 25.0, 32.0, 18.0, 19.0, 23.0, 16.0, 17.0, 12.0, 14.0, 10.0, 9.0, 8.0, 10.0, 6.0, 4.0, 6.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7158203125, -0.6929092407226562, -0.6699981689453125, -0.6470870971679688, -0.624176025390625, -0.6012649536132812, -0.5783538818359375, -0.5554428100585938, -0.53253173828125, -0.5096206665039062, -0.4867095947265625, -0.46379852294921875, -0.440887451171875, -0.41797637939453125, -0.3950653076171875, -0.37215423583984375, -0.3492431640625, -0.32633209228515625, -0.3034210205078125, -0.28050994873046875, -0.257598876953125, -0.23468780517578125, -0.2117767333984375, -0.18886566162109375, -0.16595458984375, -0.14304351806640625, -0.1201324462890625, -0.09722137451171875, -0.074310302734375, -0.05139923095703125, -0.0284881591796875, -0.00557708740234375, 0.017333984375, 0.04024505615234375, 0.0631561279296875, 0.08606719970703125, 0.108978271484375, 0.13188934326171875, 0.1548004150390625, 0.17771148681640625, 0.20062255859375, 0.22353363037109375, 0.2464447021484375, 0.26935577392578125, 0.292266845703125, 0.31517791748046875, 0.3380889892578125, 0.36100006103515625, 0.3839111328125, 0.40682220458984375, 0.4297332763671875, 0.45264434814453125, 0.475555419921875, 0.49846649169921875, 0.5213775634765625, 0.5442886352539062, 0.56719970703125, 0.5901107788085938, 0.6130218505859375, 0.6359329223632812, 0.658843994140625, 0.6817550659179688, 0.7046661376953125, 0.7275772094726562, 0.75048828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 11.0, 13.0, 26.0, 23.0, 51.0, 87.0, 120.0, 199.0, 305.0, 475.0, 816.0, 1657.0, 3545.0, 9640.0, 32063.0, 146696.0, 688900.0, 121038.0, 27557.0, 8473.0, 3286.0, 1521.0, 841.0, 453.0, 246.0, 182.0, 100.0, 73.0, 47.0, 31.0, 32.0, 16.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2239990234375, -0.2161235809326172, -0.20824813842773438, -0.20037269592285156, -0.19249725341796875, -0.18462181091308594, -0.17674636840820312, -0.1688709259033203, -0.1609954833984375, -0.1531200408935547, -0.14524459838867188, -0.13736915588378906, -0.12949371337890625, -0.12161827087402344, -0.11374282836914062, -0.10586738586425781, -0.097991943359375, -0.09011650085449219, -0.08224105834960938, -0.07436561584472656, -0.06649017333984375, -0.05861473083496094, -0.050739288330078125, -0.04286384582519531, -0.0349884033203125, -0.027112960815429688, -0.019237518310546875, -0.011362075805664062, -0.00348663330078125, 0.0043888092041015625, 0.012264251708984375, 0.020139694213867188, 0.02801513671875, 0.03589057922363281, 0.043766021728515625, 0.05164146423339844, 0.05951690673828125, 0.06739234924316406, 0.07526779174804688, 0.08314323425292969, 0.0910186767578125, 0.09889411926269531, 0.10676956176757812, 0.11464500427246094, 0.12252044677734375, 0.13039588928222656, 0.13827133178710938, 0.1461467742919922, 0.154022216796875, 0.1618976593017578, 0.16977310180664062, 0.17764854431152344, 0.18552398681640625, 0.19339942932128906, 0.20127487182617188, 0.2091503143310547, 0.2170257568359375, 0.2249011993408203, 0.23277664184570312, 0.24065208435058594, 0.24852752685546875, 0.25640296936035156, 0.2642784118652344, 0.2721538543701172, 0.280029296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 0.0, 2.0, 7.0, 2.0, 9.0, 11.0, 5.0, 8.0, 11.0, 8.0, 15.0, 18.0, 24.0, 29.0, 31.0, 33.0, 50.0, 63.0, 75.0, 79.0, 70.0, 105.0, 64.0, 56.0, 40.0, 31.0, 27.0, 23.0, 19.0, 19.0, 5.0, 13.0, 9.0, 10.0, 5.0, 4.0, 3.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.717443466186523e-05, -6.520934402942657e-05, -6.324425339698792e-05, -6.127916276454926e-05, -5.9314072132110596e-05, -5.7348981499671936e-05, -5.5383890867233276e-05, -5.341880023479462e-05, -5.145370960235596e-05, -4.94886189699173e-05, -4.752352833747864e-05, -4.555843770503998e-05, -4.359334707260132e-05, -4.162825644016266e-05, -3.9663165807724e-05, -3.769807517528534e-05, -3.573298454284668e-05, -3.376789391040802e-05, -3.180280327796936e-05, -2.98377126455307e-05, -2.787262201309204e-05, -2.590753138065338e-05, -2.394244074821472e-05, -2.1977350115776062e-05, -2.0012259483337402e-05, -1.8047168850898743e-05, -1.6082078218460083e-05, -1.4116987586021423e-05, -1.2151896953582764e-05, -1.0186806321144104e-05, -8.221715688705444e-06, -6.256625056266785e-06, -4.291534423828125e-06, -2.3264437913894653e-06, -3.6135315895080566e-07, 1.603737473487854e-06, 3.5688281059265137e-06, 5.533918738365173e-06, 7.499009370803833e-06, 9.464100003242493e-06, 1.1429190635681152e-05, 1.3394281268119812e-05, 1.535937190055847e-05, 1.732446253299713e-05, 1.928955316543579e-05, 2.125464379787445e-05, 2.321973443031311e-05, 2.518482506275177e-05, 2.714991569519043e-05, 2.911500632762909e-05, 3.108009696006775e-05, 3.304518759250641e-05, 3.501027822494507e-05, 3.697536885738373e-05, 3.894045948982239e-05, 4.090555012226105e-05, 4.287064075469971e-05, 4.483573138713837e-05, 4.6800822019577026e-05, 4.8765912652015686e-05, 5.0731003284454346e-05, 5.2696093916893005e-05, 5.4661184549331665e-05, 5.6626275181770325e-05, 5.8591365814208984e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 5.0, 6.0, 16.0, 23.0, 42.0, 47.0, 72.0, 103.0, 186.0, 263.0, 440.0, 801.0, 1730.0, 4087.0, 12358.0, 51673.0, 521423.0, 387331.0, 48578.0, 11806.0, 3902.0, 1624.0, 779.0, 438.0, 289.0, 171.0, 116.0, 80.0, 52.0, 47.0, 26.0, 12.0, 11.0, 12.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.369384765625, -0.3591194152832031, -0.34885406494140625, -0.3385887145996094, -0.3283233642578125, -0.3180580139160156, -0.30779266357421875, -0.2975273132324219, -0.287261962890625, -0.2769966125488281, -0.26673126220703125, -0.2564659118652344, -0.2462005615234375, -0.23593521118164062, -0.22566986083984375, -0.21540451049804688, -0.20513916015625, -0.19487380981445312, -0.18460845947265625, -0.17434310913085938, -0.1640777587890625, -0.15381240844726562, -0.14354705810546875, -0.13328170776367188, -0.123016357421875, -0.11275100708007812, -0.10248565673828125, -0.09222030639648438, -0.0819549560546875, -0.07168960571289062, -0.06142425537109375, -0.051158905029296875, -0.0408935546875, -0.030628204345703125, -0.02036285400390625, -0.010097503662109375, 0.0001678466796875, 0.010433197021484375, 0.02069854736328125, 0.030963897705078125, 0.041229248046875, 0.051494598388671875, 0.06175994873046875, 0.07202529907226562, 0.0822906494140625, 0.09255599975585938, 0.10282135009765625, 0.11308670043945312, 0.12335205078125, 0.13361740112304688, 0.14388275146484375, 0.15414810180664062, 0.1644134521484375, 0.17467880249023438, 0.18494415283203125, 0.19520950317382812, 0.205474853515625, 0.21574020385742188, 0.22600555419921875, 0.23627090454101562, 0.2465362548828125, 0.2568016052246094, 0.26706695556640625, 0.2773323059082031, 0.28759765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 5.0, 6.0, 12.0, 9.0, 14.0, 15.0, 17.0, 20.0, 25.0, 26.0, 40.0, 38.0, 64.0, 55.0, 74.0, 105.0, 80.0, 79.0, 63.0, 54.0, 35.0, 29.0, 28.0, 25.0, 18.0, 17.0, 9.0, 9.0, 5.0, 5.0, 4.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232666015625, -0.22510528564453125, -0.2175445556640625, -0.20998382568359375, -0.202423095703125, -0.19486236572265625, -0.1873016357421875, -0.17974090576171875, -0.17218017578125, -0.16461944580078125, -0.1570587158203125, -0.14949798583984375, -0.141937255859375, -0.13437652587890625, -0.1268157958984375, -0.11925506591796875, -0.1116943359375, -0.10413360595703125, -0.0965728759765625, -0.08901214599609375, -0.081451416015625, -0.07389068603515625, -0.0663299560546875, -0.05876922607421875, -0.05120849609375, -0.04364776611328125, -0.0360870361328125, -0.02852630615234375, -0.020965576171875, -0.01340484619140625, -0.0058441162109375, 0.00171661376953125, 0.00927734375, 0.01683807373046875, 0.0243988037109375, 0.03195953369140625, 0.039520263671875, 0.04708099365234375, 0.0546417236328125, 0.06220245361328125, 0.06976318359375, 0.07732391357421875, 0.0848846435546875, 0.09244537353515625, 0.100006103515625, 0.10756683349609375, 0.1151275634765625, 0.12268829345703125, 0.1302490234375, 0.13780975341796875, 0.1453704833984375, 0.15293121337890625, 0.160491943359375, 0.16805267333984375, 0.1756134033203125, 0.18317413330078125, 0.19073486328125, 0.19829559326171875, 0.2058563232421875, 0.21341705322265625, 0.220977783203125, 0.22853851318359375, 0.2360992431640625, 0.24365997314453125, 0.251220703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 3.0, 2.0, 1.0, 4.0, 5.0, 11.0, 14.0, 34.0, 88.0, 182.0, 356.0, 173.0, 81.0, 31.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1904296875, -8.952518463134766, -8.714607238769531, -8.476696014404297, -8.238784790039062, -8.000873565673828, -7.762962341308594, -7.525051116943359, -7.287139892578125, -7.049228668212891, -6.811317443847656, -6.573406219482422, -6.3354949951171875, -6.097583770751953, -5.859672546386719, -5.621761322021484, -5.38385009765625, -5.145938873291016, -4.908027648925781, -4.670116424560547, -4.4322052001953125, -4.194293975830078, -3.9563827514648438, -3.7184715270996094, -3.480559825897217, -3.2426486015319824, -3.004737377166748, -2.7668261528015137, -2.5289149284362793, -2.291003704071045, -2.0530924797058105, -1.8151811361312866, -1.5772700309753418, -1.3393588066101074, -1.101447582244873, -0.8635362982749939, -0.6256250739097595, -0.38771378993988037, -0.149802565574646, 0.08810865879058838, 0.32601988315582275, 0.5639311075210571, 0.8018423318862915, 1.0397536754608154, 1.2776648998260498, 1.5155761241912842, 1.7534873485565186, 1.991398572921753, 2.2293097972869873, 2.4672210216522217, 2.705132246017456, 2.9430434703826904, 3.180954694747925, 3.4188661575317383, 3.6567773818969727, 3.894688606262207, 4.132599830627441, 4.370511054992676, 4.60842227935791, 4.8463335037231445, 5.084244728088379, 5.322155952453613, 5.560067176818848, 5.797978401184082, 6.035889625549316]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 8.0, 6.0, 11.0, 10.0, 18.0, 18.0, 20.0, 19.0, 27.0, 33.0, 34.0, 31.0, 39.0, 45.0, 45.0, 54.0, 63.0, 70.0, 62.0, 42.0, 47.0, 41.0, 30.0, 29.0, 33.0, 24.0, 24.0, 15.0, 16.0, 15.0, 16.0, 7.0, 7.0, 5.0, 10.0, 9.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8518059253692627, -2.7538490295410156, -2.6558923721313477, -2.5579354763031006, -2.4599785804748535, -2.3620219230651855, -2.2640650272369385, -2.1661081314086914, -2.0681514739990234, -1.970194697380066, -1.8722378015518188, -1.7742810249328613, -1.6763241291046143, -1.5783673524856567, -1.4804105758666992, -1.3824536800384521, -1.284496784210205, -1.1865400075912476, -1.0885831117630005, -0.990626335144043, -0.8926694989204407, -0.7947126626968384, -0.6967558860778809, -0.5987990498542786, -0.5008422136306763, -0.402885377407074, -0.30492857098579407, -0.20697176456451416, -0.10901492834091187, -0.01105809211730957, 0.08689868450164795, 0.18485552072525024, 0.28281211853027344, 0.38076895475387573, 0.47872576117515564, 0.5766825675964355, 0.6746394038200378, 0.7725962400436401, 0.8705530166625977, 0.9685098528862, 1.0664666891098022, 1.1644234657287598, 1.2623803615570068, 1.3603371381759644, 1.4582939147949219, 1.556250810623169, 1.6542075872421265, 1.752164363861084, 1.850121259689331, 1.9480780363082886, 2.046034812927246, 2.143991708755493, 2.2419486045837402, 2.339905261993408, 2.4378621578216553, 2.5358190536499023, 2.6337757110595703, 2.7317326068878174, 2.8296892642974854, 2.9276461601257324, 3.0256030559539795, 3.1235599517822266, 3.2215166091918945, 3.3194735050201416, 3.4174304008483887]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 1.0, 6.0, 5.0, 8.0, 6.0, 12.0, 9.0, 11.0, 13.0, 21.0, 24.0, 37.0, 39.0, 64.0, 87.0, 123.0, 163.0, 265.0, 398.0, 667.0, 1180.0, 2229.0, 4833.0, 12445.0, 46322.0, 321404.0, 2423853.0, 1218586.0, 121526.0, 24413.0, 7915.0, 3413.0, 1703.0, 959.0, 542.0, 343.0, 225.0, 138.0, 94.0, 56.0, 44.0, 26.0, 19.0, 16.0, 7.0, 4.0, 6.0, 4.0, 7.0, 5.0, 6.0, 4.0, 0.0, 1.0], "bins": [-0.3701171875, -0.36005401611328125, -0.3499908447265625, -0.33992767333984375, -0.329864501953125, -0.31980133056640625, -0.3097381591796875, -0.29967498779296875, -0.28961181640625, -0.27954864501953125, -0.2694854736328125, -0.25942230224609375, -0.249359130859375, -0.23929595947265625, -0.2292327880859375, -0.21916961669921875, -0.2091064453125, -0.19904327392578125, -0.1889801025390625, -0.17891693115234375, -0.168853759765625, -0.15879058837890625, -0.1487274169921875, -0.13866424560546875, -0.12860107421875, -0.11853790283203125, -0.1084747314453125, -0.09841156005859375, -0.088348388671875, -0.07828521728515625, -0.0682220458984375, -0.05815887451171875, -0.048095703125, -0.03803253173828125, -0.0279693603515625, -0.01790618896484375, -0.007843017578125, 0.00222015380859375, 0.0122833251953125, 0.02234649658203125, 0.03240966796875, 0.04247283935546875, 0.0525360107421875, 0.06259918212890625, 0.072662353515625, 0.08272552490234375, 0.0927886962890625, 0.10285186767578125, 0.1129150390625, 0.12297821044921875, 0.1330413818359375, 0.14310455322265625, 0.153167724609375, 0.16323089599609375, 0.1732940673828125, 0.18335723876953125, 0.19342041015625, 0.20348358154296875, 0.2135467529296875, 0.22360992431640625, 0.233673095703125, 0.24373626708984375, 0.2537994384765625, 0.26386260986328125, 0.27392578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 13.0, 12.0, 10.0, 21.0, 24.0, 25.0, 51.0, 34.0, 44.0, 59.0, 48.0, 64.0, 53.0, 55.0, 52.0, 50.0, 41.0, 54.0, 53.0, 39.0, 37.0, 23.0, 19.0, 28.0, 22.0, 16.0, 7.0, 9.0, 5.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.233154296875, -0.22641563415527344, -0.21967697143554688, -0.2129383087158203, -0.20619964599609375, -0.1994609832763672, -0.19272232055664062, -0.18598365783691406, -0.1792449951171875, -0.17250633239746094, -0.16576766967773438, -0.1590290069580078, -0.15229034423828125, -0.1455516815185547, -0.13881301879882812, -0.13207435607910156, -0.125335693359375, -0.11859703063964844, -0.11185836791992188, -0.10511970520019531, -0.09838104248046875, -0.09164237976074219, -0.08490371704101562, -0.07816505432128906, -0.0714263916015625, -0.06468772888183594, -0.057949066162109375, -0.05121040344238281, -0.04447174072265625, -0.03773307800292969, -0.030994415283203125, -0.024255752563476562, -0.01751708984375, -0.010778427124023438, -0.004039764404296875, 0.0026988983154296875, 0.00943756103515625, 0.016176223754882812, 0.022914886474609375, 0.029653549194335938, 0.0363922119140625, 0.04313087463378906, 0.049869537353515625, 0.05660820007324219, 0.06334686279296875, 0.07008552551269531, 0.07682418823242188, 0.08356285095214844, 0.090301513671875, 0.09704017639160156, 0.10377883911132812, 0.11051750183105469, 0.11725616455078125, 0.12399482727050781, 0.13073348999023438, 0.13747215270996094, 0.1442108154296875, 0.15094947814941406, 0.15768814086914062, 0.1644268035888672, 0.17116546630859375, 0.1779041290283203, 0.18464279174804688, 0.19138145446777344, 0.1981201171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 22.0, 32.0, 78.0, 120.0, 253.0, 542.0, 1216.0, 3685.0, 12380.0, 65399.0, 1348196.0, 2629915.0, 106610.0, 17584.0, 4930.0, 1693.0, 744.0, 390.0, 216.0, 106.0, 60.0, 36.0, 25.0, 13.0, 8.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.408203125, -0.39194488525390625, -0.3756866455078125, -0.35942840576171875, -0.343170166015625, -0.32691192626953125, -0.3106536865234375, -0.29439544677734375, -0.27813720703125, -0.26187896728515625, -0.2456207275390625, -0.22936248779296875, -0.213104248046875, -0.19684600830078125, -0.1805877685546875, -0.16432952880859375, -0.1480712890625, -0.13181304931640625, -0.1155548095703125, -0.09929656982421875, -0.083038330078125, -0.06678009033203125, -0.0505218505859375, -0.03426361083984375, -0.01800537109375, -0.00174713134765625, 0.0145111083984375, 0.03076934814453125, 0.047027587890625, 0.06328582763671875, 0.0795440673828125, 0.09580230712890625, 0.112060546875, 0.12831878662109375, 0.1445770263671875, 0.16083526611328125, 0.177093505859375, 0.19335174560546875, 0.2096099853515625, 0.22586822509765625, 0.24212646484375, 0.25838470458984375, 0.2746429443359375, 0.29090118408203125, 0.307159423828125, 0.32341766357421875, 0.3396759033203125, 0.35593414306640625, 0.3721923828125, 0.38845062255859375, 0.4047088623046875, 0.42096710205078125, 0.437225341796875, 0.45348358154296875, 0.4697418212890625, 0.48600006103515625, 0.50225830078125, 0.5185165405273438, 0.5347747802734375, 0.5510330200195312, 0.567291259765625, 0.5835494995117188, 0.5998077392578125, 0.6160659790039062, 0.63232421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 7.0, 12.0, 11.0, 18.0, 26.0, 55.0, 89.0, 127.0, 259.0, 458.0, 694.0, 761.0, 622.0, 376.0, 199.0, 119.0, 68.0, 50.0, 32.0, 16.0, 14.0, 14.0, 16.0, 5.0, 5.0, 3.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45458984375, -0.437957763671875, -0.42132568359375, -0.404693603515625, -0.3880615234375, -0.371429443359375, -0.35479736328125, -0.338165283203125, -0.321533203125, -0.304901123046875, -0.28826904296875, -0.271636962890625, -0.2550048828125, -0.238372802734375, -0.22174072265625, -0.205108642578125, -0.1884765625, -0.171844482421875, -0.15521240234375, -0.138580322265625, -0.1219482421875, -0.105316162109375, -0.08868408203125, -0.072052001953125, -0.055419921875, -0.038787841796875, -0.02215576171875, -0.005523681640625, 0.0111083984375, 0.027740478515625, 0.04437255859375, 0.061004638671875, 0.07763671875, 0.094268798828125, 0.11090087890625, 0.127532958984375, 0.1441650390625, 0.160797119140625, 0.17742919921875, 0.194061279296875, 0.210693359375, 0.227325439453125, 0.24395751953125, 0.260589599609375, 0.2772216796875, 0.293853759765625, 0.31048583984375, 0.327117919921875, 0.34375, 0.360382080078125, 0.37701416015625, 0.393646240234375, 0.4102783203125, 0.426910400390625, 0.44354248046875, 0.460174560546875, 0.476806640625, 0.493438720703125, 0.51007080078125, 0.526702880859375, 0.5433349609375, 0.559967041015625, 0.57659912109375, 0.593231201171875, 0.60986328125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 9.0, 26.0, 67.0, 166.0, 303.0, 248.0, 113.0, 31.0, 13.0, 15.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.12754487991333, -2.899425983428955, -2.671307325363159, -2.4431886672973633, -2.2150697708129883, -1.9869509935379028, -1.7588322162628174, -1.530713438987732, -1.3025946617126465, -1.074475884437561, -0.8463571071624756, -0.6182383298873901, -0.3901195526123047, -0.16200077533721924, 0.06611800193786621, 0.29423677921295166, 0.5223555564880371, 0.7504743337631226, 0.978593111038208, 1.2067118883132935, 1.434830665588379, 1.6629494428634644, 1.8910682201385498, 2.1191868782043457, 2.3473057746887207, 2.5754246711730957, 2.8035433292388916, 3.0316619873046875, 3.2597808837890625, 3.4878997802734375, 3.7160184383392334, 3.9441370964050293, 4.1722564697265625, 4.4003753662109375, 4.6284942626953125, 4.856612682342529, 5.084731578826904, 5.312850475311279, 5.540968894958496, 5.769087791442871, 5.997206687927246, 6.225325584411621, 6.453444480895996, 6.681562900543213, 6.909681797027588, 7.137800693511963, 7.36591911315918, 7.594038009643555, 7.82215690612793, 8.050275802612305, 8.27839469909668, 8.506513595581055, 8.73463249206543, 8.962750434875488, 9.190869331359863, 9.418988227844238, 9.647107124328613, 9.875226020812988, 10.103344917297363, 10.331463813781738, 10.559581756591797, 10.787700653076172, 11.015819549560547, 11.243938446044922, 11.472057342529297]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 11.0, 4.0, 6.0, 9.0, 7.0, 9.0, 16.0, 14.0, 24.0, 15.0, 33.0, 27.0, 33.0, 40.0, 40.0, 50.0, 52.0, 48.0, 59.0, 51.0, 58.0, 53.0, 41.0, 45.0, 42.0, 30.0, 39.0, 29.0, 31.0, 14.0, 13.0, 10.0, 16.0, 7.0, 9.0, 7.0, 0.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0], "bins": [-2.778782844543457, -2.709764242172241, -2.6407454013824463, -2.5717267990112305, -2.5027081966400146, -2.433689594268799, -2.364670753479004, -2.295652151107788, -2.2266335487365723, -2.1576149463653564, -2.0885961055755615, -2.0195775032043457, -1.9505589008331299, -1.8815401792526245, -1.8125214576721191, -1.7435028553009033, -1.6744840145111084, -1.605465292930603, -1.5364466905593872, -1.4674279689788818, -1.398409366607666, -1.3293906450271606, -1.2603719234466553, -1.1913533210754395, -1.122334599494934, -1.0533158779144287, -0.9842972755432129, -0.9152785539627075, -0.8462598919868469, -0.7772412300109863, -0.708222508430481, -0.6392038464546204, -0.5701851844787598, -0.5011665225028992, -0.4321478307247162, -0.3631291389465332, -0.2941104769706726, -0.225091814994812, -0.15607312321662903, -0.08705443143844604, -0.01803576946258545, 0.05098290741443634, 0.12000158429145813, 0.18902026116847992, 0.2580389380455017, 0.3270576000213623, 0.3960762917995453, 0.46509498357772827, 0.5341136455535889, 0.6031323075294495, 0.6721509695053101, 0.7411696910858154, 0.810188353061676, 0.8792070150375366, 0.948225736618042, 1.0172443389892578, 1.0862630605697632, 1.1552817821502686, 1.2243003845214844, 1.2933191061019897, 1.3623378276824951, 1.431356430053711, 1.5003751516342163, 1.5693938732147217, 1.6384124755859375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 14.0, 13.0, 20.0, 26.0, 35.0, 42.0, 86.0, 105.0, 178.0, 333.0, 681.0, 1454.0, 3528.0, 9504.0, 31508.0, 119577.0, 464211.0, 313287.0, 72180.0, 20083.0, 6610.0, 2671.0, 1091.0, 510.0, 305.0, 165.0, 106.0, 59.0, 55.0, 31.0, 23.0, 15.0, 7.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.5126953125, -0.49877166748046875, -0.4848480224609375, -0.47092437744140625, -0.457000732421875, -0.44307708740234375, -0.4291534423828125, -0.41522979736328125, -0.40130615234375, -0.38738250732421875, -0.3734588623046875, -0.35953521728515625, -0.345611572265625, -0.33168792724609375, -0.3177642822265625, -0.30384063720703125, -0.2899169921875, -0.27599334716796875, -0.2620697021484375, -0.24814605712890625, -0.234222412109375, -0.22029876708984375, -0.2063751220703125, -0.19245147705078125, -0.17852783203125, -0.16460418701171875, -0.1506805419921875, -0.13675689697265625, -0.122833251953125, -0.10890960693359375, -0.0949859619140625, -0.08106231689453125, -0.067138671875, -0.05321502685546875, -0.0392913818359375, -0.02536773681640625, -0.011444091796875, 0.00247955322265625, 0.0164031982421875, 0.03032684326171875, 0.04425048828125, 0.05817413330078125, 0.0720977783203125, 0.08602142333984375, 0.099945068359375, 0.11386871337890625, 0.1277923583984375, 0.14171600341796875, 0.1556396484375, 0.16956329345703125, 0.1834869384765625, 0.19741058349609375, 0.211334228515625, 0.22525787353515625, 0.2391815185546875, 0.25310516357421875, 0.26702880859375, 0.28095245361328125, 0.2948760986328125, 0.30879974365234375, 0.322723388671875, 0.33664703369140625, 0.3505706787109375, 0.36449432373046875, 0.37841796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 4.0, 7.0, 9.0, 10.0, 14.0, 20.0, 15.0, 10.0, 23.0, 20.0, 27.0, 30.0, 40.0, 42.0, 35.0, 38.0, 50.0, 39.0, 54.0, 45.0, 43.0, 46.0, 41.0, 49.0, 36.0, 28.0, 34.0, 33.0, 39.0, 16.0, 19.0, 17.0, 9.0, 11.0, 10.0, 8.0, 3.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1634521484375, -0.15784263610839844, -0.15223312377929688, -0.1466236114501953, -0.14101409912109375, -0.1354045867919922, -0.12979507446289062, -0.12418556213378906, -0.1185760498046875, -0.11296653747558594, -0.10735702514648438, -0.10174751281738281, -0.09613800048828125, -0.09052848815917969, -0.08491897583007812, -0.07930946350097656, -0.073699951171875, -0.06809043884277344, -0.062480926513671875, -0.05687141418457031, -0.05126190185546875, -0.04565238952636719, -0.040042877197265625, -0.03443336486816406, -0.0288238525390625, -0.023214340209960938, -0.017604827880859375, -0.011995315551757812, -0.00638580322265625, -0.0007762908935546875, 0.004833221435546875, 0.010442733764648438, 0.01605224609375, 0.021661758422851562, 0.027271270751953125, 0.03288078308105469, 0.03849029541015625, 0.04409980773925781, 0.049709320068359375, 0.05531883239746094, 0.0609283447265625, 0.06653785705566406, 0.07214736938476562, 0.07775688171386719, 0.08336639404296875, 0.08897590637207031, 0.09458541870117188, 0.10019493103027344, 0.105804443359375, 0.11141395568847656, 0.11702346801757812, 0.12263298034667969, 0.12824249267578125, 0.1338520050048828, 0.13946151733398438, 0.14507102966308594, 0.1506805419921875, 0.15629005432128906, 0.16189956665039062, 0.1675090789794922, 0.17311859130859375, 0.1787281036376953, 0.18433761596679688, 0.18994712829589844, 0.195556640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 6.0, 4.0, 7.0, 11.0, 11.0, 24.0, 37.0, 35.0, 55.0, 87.0, 172.0, 288.0, 410.0, 812.0, 1636.0, 4379.0, 20389.0, 295978.0, 683105.0, 31358.0, 5534.0, 1947.0, 972.0, 477.0, 287.0, 189.0, 97.0, 80.0, 39.0, 36.0, 22.0, 19.0, 16.0, 5.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.0615234375, -1.0321197509765625, -1.002716064453125, -0.9733123779296875, -0.94390869140625, -0.9145050048828125, -0.885101318359375, -0.8556976318359375, -0.8262939453125, -0.7968902587890625, -0.767486572265625, -0.7380828857421875, -0.70867919921875, -0.6792755126953125, -0.649871826171875, -0.6204681396484375, -0.591064453125, -0.5616607666015625, -0.532257080078125, -0.5028533935546875, -0.47344970703125, -0.4440460205078125, -0.414642333984375, -0.3852386474609375, -0.3558349609375, -0.3264312744140625, -0.297027587890625, -0.2676239013671875, -0.23822021484375, -0.2088165283203125, -0.179412841796875, -0.1500091552734375, -0.12060546875, -0.0912017822265625, -0.061798095703125, -0.0323944091796875, -0.00299072265625, 0.0264129638671875, 0.055816650390625, 0.0852203369140625, 0.1146240234375, 0.1440277099609375, 0.173431396484375, 0.2028350830078125, 0.23223876953125, 0.2616424560546875, 0.291046142578125, 0.3204498291015625, 0.349853515625, 0.3792572021484375, 0.408660888671875, 0.4380645751953125, 0.46746826171875, 0.4968719482421875, 0.526275634765625, 0.5556793212890625, 0.5850830078125, 0.6144866943359375, 0.643890380859375, 0.6732940673828125, 0.70269775390625, 0.7321014404296875, 0.761505126953125, 0.7909088134765625, 0.8203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 0.0, 8.0, 8.0, 9.0, 16.0, 12.0, 21.0, 17.0, 30.0, 17.0, 34.0, 36.0, 26.0, 41.0, 42.0, 39.0, 50.0, 44.0, 69.0, 46.0, 50.0, 41.0, 38.0, 42.0, 32.0, 40.0, 34.0, 31.0, 21.0, 17.0, 14.0, 20.0, 11.0, 12.0, 2.0, 1.0, 12.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.689453125, -0.6655426025390625, -0.641632080078125, -0.6177215576171875, -0.59381103515625, -0.5699005126953125, -0.545989990234375, -0.5220794677734375, -0.4981689453125, -0.4742584228515625, -0.450347900390625, -0.4264373779296875, -0.40252685546875, -0.3786163330078125, -0.354705810546875, -0.3307952880859375, -0.306884765625, -0.2829742431640625, -0.259063720703125, -0.2351531982421875, -0.21124267578125, -0.1873321533203125, -0.163421630859375, -0.1395111083984375, -0.1156005859375, -0.0916900634765625, -0.067779541015625, -0.0438690185546875, -0.01995849609375, 0.0039520263671875, 0.027862548828125, 0.0517730712890625, 0.07568359375, 0.0995941162109375, 0.123504638671875, 0.1474151611328125, 0.17132568359375, 0.1952362060546875, 0.219146728515625, 0.2430572509765625, 0.2669677734375, 0.2908782958984375, 0.314788818359375, 0.3386993408203125, 0.36260986328125, 0.3865203857421875, 0.410430908203125, 0.4343414306640625, 0.458251953125, 0.4821624755859375, 0.506072998046875, 0.5299835205078125, 0.55389404296875, 0.5778045654296875, 0.601715087890625, 0.6256256103515625, 0.6495361328125, 0.6734466552734375, 0.697357177734375, 0.7212677001953125, 0.74517822265625, 0.7690887451171875, 0.792999267578125, 0.8169097900390625, 0.8408203125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 7.0, 4.0, 5.0, 9.0, 17.0, 21.0, 34.0, 35.0, 54.0, 92.0, 175.0, 293.0, 552.0, 1450.0, 5232.0, 32998.0, 770572.0, 214686.0, 16867.0, 3274.0, 1096.0, 477.0, 224.0, 121.0, 76.0, 42.0, 35.0, 24.0, 18.0, 12.0, 10.0, 12.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302734375, -0.5146026611328125, -0.498931884765625, -0.4832611083984375, -0.46759033203125, -0.4519195556640625, -0.436248779296875, -0.4205780029296875, -0.4049072265625, -0.3892364501953125, -0.373565673828125, -0.3578948974609375, -0.34222412109375, -0.3265533447265625, -0.310882568359375, -0.2952117919921875, -0.279541015625, -0.2638702392578125, -0.248199462890625, -0.2325286865234375, -0.21685791015625, -0.2011871337890625, -0.185516357421875, -0.1698455810546875, -0.1541748046875, -0.1385040283203125, -0.122833251953125, -0.1071624755859375, -0.09149169921875, -0.0758209228515625, -0.060150146484375, -0.0444793701171875, -0.02880859375, -0.0131378173828125, 0.002532958984375, 0.0182037353515625, 0.03387451171875, 0.0495452880859375, 0.065216064453125, 0.0808868408203125, 0.0965576171875, 0.1122283935546875, 0.127899169921875, 0.1435699462890625, 0.15924072265625, 0.1749114990234375, 0.190582275390625, 0.2062530517578125, 0.221923828125, 0.2375946044921875, 0.253265380859375, 0.2689361572265625, 0.28460693359375, 0.3002777099609375, 0.315948486328125, 0.3316192626953125, 0.3472900390625, 0.3629608154296875, 0.378631591796875, 0.3943023681640625, 0.40997314453125, 0.4256439208984375, 0.441314697265625, 0.4569854736328125, 0.47265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 5.0, 9.0, 12.0, 26.0, 25.0, 44.0, 94.0, 145.0, 213.0, 166.0, 88.0, 43.0, 27.0, 28.0, 9.0, 19.0, 7.0, 5.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00018095970153808594, -0.0001763841137290001, -0.00017180852591991425, -0.0001672329381108284, -0.00016265735030174255, -0.0001580817624926567, -0.00015350617468357086, -0.00014893058687448502, -0.00014435499906539917, -0.00013977941125631332, -0.00013520382344722748, -0.00013062823563814163, -0.00012605264782905579, -0.00012147706001996994, -0.0001169014722108841, -0.00011232588440179825, -0.0001077502965927124, -0.00010317470878362656, -9.859912097454071e-05, -9.402353316545486e-05, -8.944794535636902e-05, -8.487235754728317e-05, -8.029676973819733e-05, -7.572118192911148e-05, -7.114559412002563e-05, -6.657000631093979e-05, -6.199441850185394e-05, -5.74188306927681e-05, -5.284324288368225e-05, -4.8267655074596405e-05, -4.369206726551056e-05, -3.911647945642471e-05, -3.454089164733887e-05, -2.996530383825302e-05, -2.5389716029167175e-05, -2.081412822008133e-05, -1.6238540410995483e-05, -1.1662952601909637e-05, -7.0873647928237915e-06, -2.5117769837379456e-06, 2.0638108253479004e-06, 6.639398634433746e-06, 1.1214986443519592e-05, 1.5790574252605438e-05, 2.0366162061691284e-05, 2.494174987077713e-05, 2.9517337679862976e-05, 3.409292548894882e-05, 3.866851329803467e-05, 4.3244101107120514e-05, 4.781968891620636e-05, 5.2395276725292206e-05, 5.697086453437805e-05, 6.15464523434639e-05, 6.612204015254974e-05, 7.069762796163559e-05, 7.527321577072144e-05, 7.984880357980728e-05, 8.442439138889313e-05, 8.899997919797897e-05, 9.357556700706482e-05, 9.815115481615067e-05, 0.00010272674262523651, 0.00010730233043432236, 0.0001118779182434082]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 7.0, 6.0, 15.0, 16.0, 12.0, 26.0, 32.0, 56.0, 87.0, 109.0, 161.0, 254.0, 425.0, 647.0, 1119.0, 2075.0, 4292.0, 10875.0, 41094.0, 364753.0, 556660.0, 44491.0, 11852.0, 4378.0, 2146.0, 1072.0, 626.0, 408.0, 259.0, 172.0, 123.0, 88.0, 47.0, 32.0, 35.0, 23.0, 25.0, 16.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.353515625, -0.34281158447265625, -0.3321075439453125, -0.32140350341796875, -0.310699462890625, -0.29999542236328125, -0.2892913818359375, -0.27858734130859375, -0.26788330078125, -0.25717926025390625, -0.2464752197265625, -0.23577117919921875, -0.225067138671875, -0.21436309814453125, -0.2036590576171875, -0.19295501708984375, -0.1822509765625, -0.17154693603515625, -0.1608428955078125, -0.15013885498046875, -0.139434814453125, -0.12873077392578125, -0.1180267333984375, -0.10732269287109375, -0.09661865234375, -0.08591461181640625, -0.0752105712890625, -0.06450653076171875, -0.053802490234375, -0.04309844970703125, -0.0323944091796875, -0.02169036865234375, -0.010986328125, -0.00028228759765625, 0.0104217529296875, 0.02112579345703125, 0.031829833984375, 0.04253387451171875, 0.0532379150390625, 0.06394195556640625, 0.07464599609375, 0.08535003662109375, 0.0960540771484375, 0.10675811767578125, 0.117462158203125, 0.12816619873046875, 0.1388702392578125, 0.14957427978515625, 0.1602783203125, 0.17098236083984375, 0.1816864013671875, 0.19239044189453125, 0.203094482421875, 0.21379852294921875, 0.2245025634765625, 0.23520660400390625, 0.24591064453125, 0.25661468505859375, 0.2673187255859375, 0.27802276611328125, 0.288726806640625, 0.29943084716796875, 0.3101348876953125, 0.32083892822265625, 0.33154296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 15.0, 8.0, 19.0, 18.0, 17.0, 33.0, 43.0, 103.0, 148.0, 162.0, 140.0, 91.0, 51.0, 30.0, 31.0, 17.0, 10.0, 8.0, 6.0, 9.0, 2.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.37744140625, -0.36582183837890625, -0.3542022705078125, -0.34258270263671875, -0.330963134765625, -0.31934356689453125, -0.3077239990234375, -0.29610443115234375, -0.28448486328125, -0.27286529541015625, -0.2612457275390625, -0.24962615966796875, -0.238006591796875, -0.22638702392578125, -0.2147674560546875, -0.20314788818359375, -0.1915283203125, -0.17990875244140625, -0.1682891845703125, -0.15666961669921875, -0.145050048828125, -0.13343048095703125, -0.1218109130859375, -0.11019134521484375, -0.09857177734375, -0.08695220947265625, -0.0753326416015625, -0.06371307373046875, -0.052093505859375, -0.04047393798828125, -0.0288543701171875, -0.01723480224609375, -0.005615234375, 0.00600433349609375, 0.0176239013671875, 0.02924346923828125, 0.040863037109375, 0.05248260498046875, 0.0641021728515625, 0.07572174072265625, 0.08734130859375, 0.09896087646484375, 0.1105804443359375, 0.12220001220703125, 0.133819580078125, 0.14543914794921875, 0.1570587158203125, 0.16867828369140625, 0.1802978515625, 0.19191741943359375, 0.2035369873046875, 0.21515655517578125, 0.226776123046875, 0.23839569091796875, 0.2500152587890625, 0.26163482666015625, 0.27325439453125, 0.28487396240234375, 0.2964935302734375, 0.30811309814453125, 0.319732666015625, 0.33135223388671875, 0.3429718017578125, 0.35459136962890625, 0.3662109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 16.0, 27.0, 115.0, 452.0, 266.0, 71.0, 21.0, 9.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.24772834777832, -9.903389930725098, -9.559051513671875, -9.214713096618652, -8.87037467956543, -8.526037216186523, -8.1816987991333, -7.837360382080078, -7.4930219650268555, -7.148683547973633, -6.80434513092041, -6.460007190704346, -6.115668773651123, -5.7713303565979, -5.426992416381836, -5.082653999328613, -4.738315582275391, -4.393977165222168, -4.049638748168945, -3.705300807952881, -3.360962390899658, -3.0166239738464355, -2.672285795211792, -2.3279476165771484, -1.9836091995239258, -1.6392709016799927, -1.2949326038360596, -0.9505943059921265, -0.6062560081481934, -0.26191771030426025, 0.08242058753967285, 0.4267587661743164, 0.7710971832275391, 1.1154354810714722, 1.4597737789154053, 1.8041120767593384, 2.1484503746032715, 2.492788791656494, 2.8371269702911377, 3.1814651489257812, 3.525803565979004, 3.8701419830322266, 4.214480400085449, 4.558818340301514, 4.903156757354736, 5.247495174407959, 5.591833114624023, 5.936171531677246, 6.280509948730469, 6.624848365783691, 6.969186782836914, 7.3135247230529785, 7.657863140106201, 8.002201080322266, 8.346539497375488, 8.690877914428711, 9.035216331481934, 9.379554748535156, 9.723893165588379, 10.068231582641602, 10.412569046020508, 10.75690746307373, 11.101245880126953, 11.445584297180176, 11.789922714233398]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 9.0, 4.0, 7.0, 12.0, 18.0, 13.0, 25.0, 26.0, 29.0, 27.0, 38.0, 43.0, 60.0, 62.0, 94.0, 88.0, 80.0, 49.0, 57.0, 53.0, 37.0, 31.0, 28.0, 23.0, 17.0, 26.0, 8.0, 12.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.993409633636475, -4.8741559982299805, -4.754902362823486, -4.635648727416992, -4.51639461517334, -4.397140979766846, -4.277887344360352, -4.158633708953857, -4.039380073547363, -3.920126438140869, -3.800872564315796, -3.6816189289093018, -3.5623652935028076, -3.4431114196777344, -3.3238577842712402, -3.204604148864746, -3.0853500366210938, -2.9660964012145996, -2.8468425273895264, -2.7275888919830322, -2.608335256576538, -2.489081382751465, -2.3698277473449707, -2.2505741119384766, -2.1313204765319824, -2.0120668411254883, -1.8928130865097046, -1.773559331893921, -1.6543055772781372, -1.5350518226623535, -1.4157981872558594, -1.2965444326400757, -1.177290678024292, -1.0580369234085083, -0.9387832283973694, -0.8195295333862305, -0.7002757787704468, -0.5810220837593079, -0.46176838874816895, -0.34251463413238525, -0.22326093912124634, -0.10400722175836563, 0.015246495604515076, 0.13450020551681519, 0.2537539303302765, 0.3730076551437378, 0.4922613501548767, 0.6115151047706604, 0.7307687997817993, 0.8500224947929382, 0.9692762494087219, 1.0885299444198608, 1.2077836990356445, 1.3270373344421387, 1.4462910890579224, 1.565544843673706, 1.6847984790802002, 1.8040522336959839, 1.923305869102478, 2.0425596237182617, 2.161813259124756, 2.281067132949829, 2.4003207683563232, 2.5195746421813965, 2.6388282775878906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 11.0, 18.0, 17.0, 25.0, 40.0, 54.0, 92.0, 152.0, 184.0, 322.0, 626.0, 1037.0, 2478.0, 6043.0, 23071.0, 234077.0, 3238777.0, 634763.0, 38289.0, 8469.0, 2892.0, 1335.0, 628.0, 326.0, 178.0, 116.0, 83.0, 43.0, 29.0, 31.0, 13.0, 14.0, 6.0, 3.0, 6.0, 4.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.480712890625, -0.46552276611328125, -0.4503326416015625, -0.43514251708984375, -0.419952392578125, -0.40476226806640625, -0.3895721435546875, -0.37438201904296875, -0.35919189453125, -0.34400177001953125, -0.3288116455078125, -0.31362152099609375, -0.298431396484375, -0.28324127197265625, -0.2680511474609375, -0.25286102294921875, -0.2376708984375, -0.22248077392578125, -0.2072906494140625, -0.19210052490234375, -0.176910400390625, -0.16172027587890625, -0.1465301513671875, -0.13134002685546875, -0.11614990234375, -0.10095977783203125, -0.0857696533203125, -0.07057952880859375, -0.055389404296875, -0.04019927978515625, -0.0250091552734375, -0.00981903076171875, 0.00537109375, 0.02056121826171875, 0.0357513427734375, 0.05094146728515625, 0.066131591796875, 0.08132171630859375, 0.0965118408203125, 0.11170196533203125, 0.12689208984375, 0.14208221435546875, 0.1572723388671875, 0.17246246337890625, 0.187652587890625, 0.20284271240234375, 0.2180328369140625, 0.23322296142578125, 0.2484130859375, 0.26360321044921875, 0.2787933349609375, 0.29398345947265625, 0.309173583984375, 0.32436370849609375, 0.3395538330078125, 0.35474395751953125, 0.36993408203125, 0.38512420654296875, 0.4003143310546875, 0.41550445556640625, 0.430694580078125, 0.44588470458984375, 0.4610748291015625, 0.47626495361328125, 0.491455078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 12.0, 20.0, 22.0, 22.0, 25.0, 31.0, 57.0, 56.0, 57.0, 61.0, 74.0, 76.0, 68.0, 73.0, 65.0, 58.0, 53.0, 37.0, 30.0, 34.0, 17.0, 13.0, 8.0, 12.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2320556640625, -0.2233104705810547, -0.21456527709960938, -0.20582008361816406, -0.19707489013671875, -0.18832969665527344, -0.17958450317382812, -0.1708393096923828, -0.1620941162109375, -0.1533489227294922, -0.14460372924804688, -0.13585853576660156, -0.12711334228515625, -0.11836814880371094, -0.10962295532226562, -0.10087776184082031, -0.092132568359375, -0.08338737487792969, -0.07464218139648438, -0.06589698791503906, -0.05715179443359375, -0.04840660095214844, -0.039661407470703125, -0.030916213989257812, -0.0221710205078125, -0.013425827026367188, -0.004680633544921875, 0.0040645599365234375, 0.01280975341796875, 0.021554946899414062, 0.030300140380859375, 0.03904533386230469, 0.04779052734375, 0.05653572082519531, 0.06528091430664062, 0.07402610778808594, 0.08277130126953125, 0.09151649475097656, 0.10026168823242188, 0.10900688171386719, 0.1177520751953125, 0.1264972686767578, 0.13524246215820312, 0.14398765563964844, 0.15273284912109375, 0.16147804260253906, 0.17022323608398438, 0.1789684295654297, 0.187713623046875, 0.1964588165283203, 0.20520401000976562, 0.21394920349121094, 0.22269439697265625, 0.23143959045410156, 0.24018478393554688, 0.2489299774169922, 0.2576751708984375, 0.2664203643798828, 0.2751655578613281, 0.28391075134277344, 0.29265594482421875, 0.30140113830566406, 0.3101463317871094, 0.3188915252685547, 0.32763671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 9.0, 2.0, 3.0, 3.0, 4.0, 12.0, 15.0, 21.0, 39.0, 47.0, 79.0, 155.0, 248.0, 418.0, 834.0, 1707.0, 4246.0, 13775.0, 102342.0, 3543644.0, 488196.0, 27176.0, 6530.0, 2530.0, 1088.0, 510.0, 262.0, 163.0, 88.0, 32.0, 34.0, 21.0, 23.0, 8.0, 5.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.574676513671875, -0.55316162109375, -0.531646728515625, -0.5101318359375, -0.488616943359375, -0.46710205078125, -0.445587158203125, -0.424072265625, -0.402557373046875, -0.38104248046875, -0.359527587890625, -0.3380126953125, -0.316497802734375, -0.29498291015625, -0.273468017578125, -0.251953125, -0.230438232421875, -0.20892333984375, -0.187408447265625, -0.1658935546875, -0.144378662109375, -0.12286376953125, -0.101348876953125, -0.079833984375, -0.058319091796875, -0.03680419921875, -0.015289306640625, 0.0062255859375, 0.027740478515625, 0.04925537109375, 0.070770263671875, 0.09228515625, 0.113800048828125, 0.13531494140625, 0.156829833984375, 0.1783447265625, 0.199859619140625, 0.22137451171875, 0.242889404296875, 0.264404296875, 0.285919189453125, 0.30743408203125, 0.328948974609375, 0.3504638671875, 0.371978759765625, 0.39349365234375, 0.415008544921875, 0.4365234375, 0.458038330078125, 0.47955322265625, 0.501068115234375, 0.5225830078125, 0.544097900390625, 0.56561279296875, 0.587127685546875, 0.608642578125, 0.630157470703125, 0.65167236328125, 0.673187255859375, 0.6947021484375, 0.716217041015625, 0.73773193359375, 0.759246826171875, 0.78076171875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 4.0, 5.0, 5.0, 4.0, 10.0, 13.0, 18.0, 39.0, 56.0, 72.0, 102.0, 224.0, 376.0, 603.0, 772.0, 677.0, 465.0, 242.0, 140.0, 80.0, 44.0, 32.0, 21.0, 14.0, 10.0, 11.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50341796875, -0.48697662353515625, -0.4705352783203125, -0.45409393310546875, -0.437652587890625, -0.42121124267578125, -0.4047698974609375, -0.38832855224609375, -0.37188720703125, -0.35544586181640625, -0.3390045166015625, -0.32256317138671875, -0.306121826171875, -0.28968048095703125, -0.2732391357421875, -0.25679779052734375, -0.2403564453125, -0.22391510009765625, -0.2074737548828125, -0.19103240966796875, -0.174591064453125, -0.15814971923828125, -0.1417083740234375, -0.12526702880859375, -0.10882568359375, -0.09238433837890625, -0.0759429931640625, -0.05950164794921875, -0.043060302734375, -0.02661895751953125, -0.0101776123046875, 0.00626373291015625, 0.022705078125, 0.03914642333984375, 0.0555877685546875, 0.07202911376953125, 0.088470458984375, 0.10491180419921875, 0.1213531494140625, 0.13779449462890625, 0.15423583984375, 0.17067718505859375, 0.1871185302734375, 0.20355987548828125, 0.220001220703125, 0.23644256591796875, 0.2528839111328125, 0.26932525634765625, 0.2857666015625, 0.30220794677734375, 0.3186492919921875, 0.33509063720703125, 0.351531982421875, 0.36797332763671875, 0.3844146728515625, 0.40085601806640625, 0.41729736328125, 0.43373870849609375, 0.4501800537109375, 0.46662139892578125, 0.483062744140625, 0.49950408935546875, 0.5159454345703125, 0.5323867797851562, 0.548828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 3.0, 8.0, 26.0, 72.0, 197.0, 333.0, 231.0, 78.0, 30.0, 10.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7305350303649902, -3.4562556743621826, -3.181976318359375, -2.9076967239379883, -2.6334176063537598, -2.359138011932373, -2.0848586559295654, -1.8105792999267578, -1.5362999439239502, -1.2620205879211426, -0.9877411723136902, -0.7134617567062378, -0.4391824007034302, -0.16490304470062256, 0.10937643051147461, 0.3836557865142822, 0.6579351425170898, 0.9322144985198975, 1.206493854522705, 1.4807733297348022, 1.7550526857376099, 2.029332160949707, 2.3036115169525146, 2.5778908729553223, 2.85217022895813, 3.1264495849609375, 3.400728940963745, 3.6750082969665527, 3.9492878913879395, 4.223567008972168, 4.497846603393555, 4.772126197814941, 5.046405792236328, 5.320685386657715, 5.594964504241943, 5.86924409866333, 6.143523216247559, 6.417802810668945, 6.692082405090332, 6.9663615226745605, 7.240640640258789, 7.514920234680176, 7.789199352264404, 8.063478469848633, 8.33775806427002, 8.612037658691406, 8.886317253112793, 9.16059684753418, 9.43487548828125, 9.709155082702637, 9.983434677124023, 10.257713317871094, 10.53199291229248, 10.806272506713867, 11.080552101135254, 11.35483169555664, 11.629111289978027, 11.903390884399414, 12.1776704788208, 12.451949119567871, 12.726228713989258, 13.000508308410645, 13.274787902832031, 13.549066543579102, 13.823346138000488]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 9.0, 9.0, 17.0, 20.0, 33.0, 37.0, 30.0, 44.0, 59.0, 65.0, 67.0, 81.0, 57.0, 66.0, 67.0, 50.0, 52.0, 54.0, 54.0, 34.0, 17.0, 22.0, 23.0, 12.0, 8.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.321829319000244, -3.2249057292938232, -3.1279819011688232, -3.0310583114624023, -2.9341347217559814, -2.8372111320495605, -2.7402873039245605, -2.6433637142181396, -2.5464401245117188, -2.449516534805298, -2.352592706680298, -2.255669116973877, -2.158745527267456, -2.061821937561035, -1.9648981094360352, -1.8679745197296143, -1.7710508108139038, -1.6741271018981934, -1.5772035121917725, -1.480279803276062, -1.3833562135696411, -1.2864325046539307, -1.1895089149475098, -1.0925852060317993, -0.9956615567207336, -0.898737907409668, -0.8018142580986023, -0.7048906087875366, -0.6079668998718262, -0.5110433101654053, -0.4141196012496948, -0.31719595193862915, -0.22027230262756348, -0.1233486458659172, -0.026424989104270935, 0.07049867510795593, 0.1674223244190216, 0.2643459737300873, 0.36126965284347534, 0.458193302154541, 0.5551169514656067, 0.6520406007766724, 0.748964250087738, 0.8458878993988037, 0.9428116083145142, 1.039735198020935, 1.1366589069366455, 1.2335824966430664, 1.3305062055587769, 1.4274299144744873, 1.5243535041809082, 1.6212772130966187, 1.7182008028030396, 1.81512451171875, 1.912048101425171, 2.008971691131592, 2.105895519256592, 2.2028191089630127, 2.2997429370880127, 2.3966665267944336, 2.4935901165008545, 2.5905137062072754, 2.6874375343322754, 2.7843611240386963, 2.881284713745117]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 8.0, 12.0, 16.0, 15.0, 26.0, 48.0, 63.0, 98.0, 181.0, 281.0, 572.0, 1260.0, 3285.0, 10430.0, 47085.0, 313141.0, 545058.0, 100018.0, 18348.0, 5104.0, 1800.0, 762.0, 382.0, 197.0, 110.0, 73.0, 42.0, 37.0, 21.0, 14.0, 14.0, 11.0, 9.0, 10.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.462158203125, -0.4468574523925781, -0.43155670166015625, -0.4162559509277344, -0.4009552001953125, -0.3856544494628906, -0.37035369873046875, -0.3550529479980469, -0.339752197265625, -0.3244514465332031, -0.30915069580078125, -0.2938499450683594, -0.2785491943359375, -0.2632484436035156, -0.24794769287109375, -0.23264694213867188, -0.21734619140625, -0.20204544067382812, -0.18674468994140625, -0.17144393920898438, -0.1561431884765625, -0.14084243774414062, -0.12554168701171875, -0.11024093627929688, -0.094940185546875, -0.07963943481445312, -0.06433868408203125, -0.049037933349609375, -0.0337371826171875, -0.018436431884765625, -0.00313568115234375, 0.012165069580078125, 0.0274658203125, 0.042766571044921875, 0.05806732177734375, 0.07336807250976562, 0.0886688232421875, 0.10396957397460938, 0.11927032470703125, 0.13457107543945312, 0.149871826171875, 0.16517257690429688, 0.18047332763671875, 0.19577407836914062, 0.2110748291015625, 0.22637557983398438, 0.24167633056640625, 0.2569770812988281, 0.27227783203125, 0.2875785827636719, 0.30287933349609375, 0.3181800842285156, 0.3334808349609375, 0.3487815856933594, 0.36408233642578125, 0.3793830871582031, 0.394683837890625, 0.4099845886230469, 0.42528533935546875, 0.4405860900878906, 0.4558868408203125, 0.4711875915527344, 0.48648834228515625, 0.5017890930175781, 0.51708984375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 12.0, 12.0, 17.0, 14.0, 19.0, 28.0, 44.0, 34.0, 38.0, 65.0, 52.0, 60.0, 65.0, 65.0, 62.0, 60.0, 45.0, 50.0, 42.0, 37.0, 31.0, 36.0, 33.0, 15.0, 12.0, 9.0, 8.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2322998046875, -0.22443199157714844, -0.21656417846679688, -0.2086963653564453, -0.20082855224609375, -0.1929607391357422, -0.18509292602539062, -0.17722511291503906, -0.1693572998046875, -0.16148948669433594, -0.15362167358398438, -0.1457538604736328, -0.13788604736328125, -0.1300182342529297, -0.12215042114257812, -0.11428260803222656, -0.106414794921875, -0.09854698181152344, -0.09067916870117188, -0.08281135559082031, -0.07494354248046875, -0.06707572937011719, -0.059207916259765625, -0.05134010314941406, -0.0434722900390625, -0.03560447692871094, -0.027736663818359375, -0.019868850708007812, -0.01200103759765625, -0.0041332244873046875, 0.003734588623046875, 0.011602401733398438, 0.01947021484375, 0.027338027954101562, 0.035205841064453125, 0.04307365417480469, 0.05094146728515625, 0.05880928039550781, 0.06667709350585938, 0.07454490661621094, 0.0824127197265625, 0.09028053283691406, 0.09814834594726562, 0.10601615905761719, 0.11388397216796875, 0.12175178527832031, 0.12961959838867188, 0.13748741149902344, 0.145355224609375, 0.15322303771972656, 0.16109085083007812, 0.1689586639404297, 0.17682647705078125, 0.1846942901611328, 0.19256210327148438, 0.20042991638183594, 0.2082977294921875, 0.21616554260253906, 0.22403335571289062, 0.2319011688232422, 0.23976898193359375, 0.2476367950439453, 0.2555046081542969, 0.26337242126464844, 0.271240234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 8.0, 3.0, 0.0, 5.0, 10.0, 7.0, 15.0, 11.0, 16.0, 25.0, 28.0, 26.0, 50.0, 48.0, 79.0, 119.0, 190.0, 305.0, 502.0, 994.0, 2101.0, 5221.0, 17605.0, 79401.0, 551313.0, 309822.0, 58675.0, 13677.0, 4419.0, 1734.0, 808.0, 437.0, 292.0, 175.0, 120.0, 72.0, 65.0, 45.0, 37.0, 27.0, 17.0, 20.0, 10.0, 9.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.39404296875, -0.38129425048828125, -0.3685455322265625, -0.35579681396484375, -0.343048095703125, -0.33029937744140625, -0.3175506591796875, -0.30480194091796875, -0.29205322265625, -0.27930450439453125, -0.2665557861328125, -0.25380706787109375, -0.241058349609375, -0.22830963134765625, -0.2155609130859375, -0.20281219482421875, -0.1900634765625, -0.17731475830078125, -0.1645660400390625, -0.15181732177734375, -0.139068603515625, -0.12631988525390625, -0.1135711669921875, -0.10082244873046875, -0.08807373046875, -0.07532501220703125, -0.0625762939453125, -0.04982757568359375, -0.037078857421875, -0.02433013916015625, -0.0115814208984375, 0.00116729736328125, 0.013916015625, 0.02666473388671875, 0.0394134521484375, 0.05216217041015625, 0.064910888671875, 0.07765960693359375, 0.0904083251953125, 0.10315704345703125, 0.11590576171875, 0.12865447998046875, 0.1414031982421875, 0.15415191650390625, 0.166900634765625, 0.17964935302734375, 0.1923980712890625, 0.20514678955078125, 0.2178955078125, 0.23064422607421875, 0.2433929443359375, 0.25614166259765625, 0.268890380859375, 0.28163909912109375, 0.2943878173828125, 0.30713653564453125, 0.31988525390625, 0.33263397216796875, 0.3453826904296875, 0.35813140869140625, 0.370880126953125, 0.38362884521484375, 0.3963775634765625, 0.40912628173828125, 0.421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 9.0, 5.0, 9.0, 9.0, 11.0, 13.0, 30.0, 20.0, 34.0, 36.0, 40.0, 46.0, 60.0, 56.0, 58.0, 63.0, 67.0, 58.0, 44.0, 42.0, 49.0, 32.0, 32.0, 33.0, 34.0, 24.0, 22.0, 14.0, 12.0, 16.0, 4.0, 8.0, 4.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84716796875, -0.821563720703125, -0.79595947265625, -0.770355224609375, -0.7447509765625, -0.719146728515625, -0.69354248046875, -0.667938232421875, -0.642333984375, -0.616729736328125, -0.59112548828125, -0.565521240234375, -0.5399169921875, -0.514312744140625, -0.48870849609375, -0.463104248046875, -0.4375, -0.411895751953125, -0.38629150390625, -0.360687255859375, -0.3350830078125, -0.309478759765625, -0.28387451171875, -0.258270263671875, -0.232666015625, -0.207061767578125, -0.18145751953125, -0.155853271484375, -0.1302490234375, -0.104644775390625, -0.07904052734375, -0.053436279296875, -0.02783203125, -0.002227783203125, 0.02337646484375, 0.048980712890625, 0.0745849609375, 0.100189208984375, 0.12579345703125, 0.151397705078125, 0.177001953125, 0.202606201171875, 0.22821044921875, 0.253814697265625, 0.2794189453125, 0.305023193359375, 0.33062744140625, 0.356231689453125, 0.3818359375, 0.407440185546875, 0.43304443359375, 0.458648681640625, 0.4842529296875, 0.509857177734375, 0.53546142578125, 0.561065673828125, 0.586669921875, 0.612274169921875, 0.63787841796875, 0.663482666015625, 0.6890869140625, 0.714691162109375, 0.74029541015625, 0.765899658203125, 0.79150390625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 7.0, 5.0, 12.0, 24.0, 23.0, 50.0, 50.0, 96.0, 139.0, 221.0, 330.0, 571.0, 982.0, 1616.0, 3326.0, 7542.0, 22444.0, 91526.0, 609471.0, 237703.0, 48086.0, 13581.0, 5194.0, 2442.0, 1221.0, 713.0, 430.0, 258.0, 169.0, 98.0, 76.0, 34.0, 23.0, 26.0, 17.0, 8.0, 13.0, 3.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.216796875, -0.21090316772460938, -0.20500946044921875, -0.19911575317382812, -0.1932220458984375, -0.18732833862304688, -0.18143463134765625, -0.17554092407226562, -0.169647216796875, -0.16375350952148438, -0.15785980224609375, -0.15196609497070312, -0.1460723876953125, -0.14017868041992188, -0.13428497314453125, -0.12839126586914062, -0.12249755859375, -0.11660385131835938, -0.11071014404296875, -0.10481643676757812, -0.0989227294921875, -0.09302902221679688, -0.08713531494140625, -0.08124160766601562, -0.075347900390625, -0.06945419311523438, -0.06356048583984375, -0.057666778564453125, -0.0517730712890625, -0.045879364013671875, -0.03998565673828125, -0.034091949462890625, -0.0281982421875, -0.022304534912109375, -0.01641082763671875, -0.010517120361328125, -0.0046234130859375, 0.001270294189453125, 0.00716400146484375, 0.013057708740234375, 0.018951416015625, 0.024845123291015625, 0.03073883056640625, 0.036632537841796875, 0.0425262451171875, 0.048419952392578125, 0.05431365966796875, 0.060207366943359375, 0.06610107421875, 0.07199478149414062, 0.07788848876953125, 0.08378219604492188, 0.0896759033203125, 0.09556961059570312, 0.10146331787109375, 0.10735702514648438, 0.113250732421875, 0.11914443969726562, 0.12503814697265625, 0.13093185424804688, 0.1368255615234375, 0.14271926879882812, 0.14861297607421875, 0.15450668334960938, 0.160400390625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 3.0, 10.0, 6.0, 13.0, 29.0, 41.0, 58.0, 99.0, 160.0, 203.0, 133.0, 82.0, 54.0, 36.0, 23.0, 16.0, 12.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55055046081543e-05, -6.242562085390091e-05, -5.934573709964752e-05, -5.6265853345394135e-05, -5.318596959114075e-05, -5.010608583688736e-05, -4.702620208263397e-05, -4.3946318328380585e-05, -4.08664345741272e-05, -3.778655081987381e-05, -3.470666706562042e-05, -3.1626783311367035e-05, -2.8546899557113647e-05, -2.546701580286026e-05, -2.2387132048606873e-05, -1.9307248294353485e-05, -1.6227364540100098e-05, -1.314748078584671e-05, -1.0067597031593323e-05, -6.987713277339935e-06, -3.907829523086548e-06, -8.279457688331604e-07, 2.251937985420227e-06, 5.3318217396736145e-06, 8.411705493927002e-06, 1.149158924818039e-05, 1.4571473002433777e-05, 1.7651356756687164e-05, 2.0731240510940552e-05, 2.381112426519394e-05, 2.6891008019447327e-05, 2.9970891773700714e-05, 3.30507755279541e-05, 3.613065928220749e-05, 3.9210543036460876e-05, 4.2290426790714264e-05, 4.537031054496765e-05, 4.845019429922104e-05, 5.1530078053474426e-05, 5.4609961807727814e-05, 5.76898455619812e-05, 6.076972931623459e-05, 6.384961307048798e-05, 6.692949682474136e-05, 7.000938057899475e-05, 7.308926433324814e-05, 7.616914808750153e-05, 7.924903184175491e-05, 8.23289155960083e-05, 8.540879935026169e-05, 8.848868310451508e-05, 9.156856685876846e-05, 9.464845061302185e-05, 9.772833436727524e-05, 0.00010080821812152863, 0.00010388810187578201, 0.0001069679856300354, 0.00011004786938428879, 0.00011312775313854218, 0.00011620763689279556, 0.00011928752064704895, 0.00012236740440130234, 0.00012544728815555573, 0.0001285271719098091, 0.0001316070556640625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 10.0, 16.0, 25.0, 53.0, 52.0, 76.0, 133.0, 205.0, 299.0, 545.0, 928.0, 1743.0, 3413.0, 7121.0, 16353.0, 43543.0, 139881.0, 554117.0, 186986.0, 55548.0, 20241.0, 8456.0, 4061.0, 2025.0, 1095.0, 629.0, 361.0, 215.0, 151.0, 80.0, 59.0, 39.0, 24.0, 14.0, 12.0, 11.0, 10.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1287841796875, -0.12412071228027344, -0.11945724487304688, -0.11479377746582031, -0.11013031005859375, -0.10546684265136719, -0.10080337524414062, -0.09613990783691406, -0.0914764404296875, -0.08681297302246094, -0.08214950561523438, -0.07748603820800781, -0.07282257080078125, -0.06815910339355469, -0.06349563598632812, -0.05883216857910156, -0.054168701171875, -0.04950523376464844, -0.044841766357421875, -0.04017829895019531, -0.03551483154296875, -0.030851364135742188, -0.026187896728515625, -0.021524429321289062, -0.0168609619140625, -0.012197494506835938, -0.007534027099609375, -0.0028705596923828125, 0.00179290771484375, 0.0064563751220703125, 0.011119842529296875, 0.015783309936523438, 0.02044677734375, 0.025110244750976562, 0.029773712158203125, 0.03443717956542969, 0.03910064697265625, 0.04376411437988281, 0.048427581787109375, 0.05309104919433594, 0.0577545166015625, 0.06241798400878906, 0.06708145141601562, 0.07174491882324219, 0.07640838623046875, 0.08107185363769531, 0.08573532104492188, 0.09039878845214844, 0.095062255859375, 0.09972572326660156, 0.10438919067382812, 0.10905265808105469, 0.11371612548828125, 0.11837959289550781, 0.12304306030273438, 0.12770652770996094, 0.1323699951171875, 0.13703346252441406, 0.14169692993164062, 0.1463603973388672, 0.15102386474609375, 0.1556873321533203, 0.16035079956054688, 0.16501426696777344, 0.169677734375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 1.0, 4.0, 13.0, 5.0, 11.0, 16.0, 17.0, 22.0, 28.0, 54.0, 64.0, 58.0, 73.0, 93.0, 108.0, 93.0, 76.0, 66.0, 40.0, 33.0, 26.0, 19.0, 18.0, 12.0, 11.0, 9.0, 7.0, 0.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1983642578125, -0.1925525665283203, -0.18674087524414062, -0.18092918395996094, -0.17511749267578125, -0.16930580139160156, -0.16349411010742188, -0.1576824188232422, -0.1518707275390625, -0.1460590362548828, -0.14024734497070312, -0.13443565368652344, -0.12862396240234375, -0.12281227111816406, -0.11700057983398438, -0.11118888854980469, -0.105377197265625, -0.09956550598144531, -0.09375381469726562, -0.08794212341308594, -0.08213043212890625, -0.07631874084472656, -0.07050704956054688, -0.06469535827636719, -0.0588836669921875, -0.05307197570800781, -0.047260284423828125, -0.04144859313964844, -0.03563690185546875, -0.029825210571289062, -0.024013519287109375, -0.018201828002929688, -0.01239013671875, -0.0065784454345703125, -0.000766754150390625, 0.0050449371337890625, 0.01085662841796875, 0.016668319702148438, 0.022480010986328125, 0.028291702270507812, 0.0341033935546875, 0.03991508483886719, 0.045726776123046875, 0.05153846740722656, 0.05735015869140625, 0.06316184997558594, 0.06897354125976562, 0.07478523254394531, 0.080596923828125, 0.08640861511230469, 0.09222030639648438, 0.09803199768066406, 0.10384368896484375, 0.10965538024902344, 0.11546707153320312, 0.12127876281738281, 0.1270904541015625, 0.1329021453857422, 0.13871383666992188, 0.14452552795410156, 0.15033721923828125, 0.15614891052246094, 0.16196060180664062, 0.1677722930908203, 0.173583984375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 6.0, 13.0, 14.0, 42.0, 69.0, 123.0, 249.0, 212.0, 112.0, 66.0, 36.0, 21.0, 11.0, 3.0, 4.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0836119651794434, -2.9430084228515625, -2.8024048805236816, -2.661801338195801, -2.52119779586792, -2.380594253540039, -2.2399909496307373, -2.0993874073028564, -1.9587838649749756, -1.8181803226470947, -1.6775767803192139, -1.5369733572006226, -1.3963698148727417, -1.2557662725448608, -1.1151628494262695, -0.9745593070983887, -0.8339557647705078, -0.693352222442627, -0.5527487397193909, -0.4121452271938324, -0.2715417146682739, -0.13093817234039307, 0.009665310382843018, 0.1502687931060791, 0.29087233543395996, 0.43147584795951843, 0.5720793604850769, 0.712682843208313, 0.8532863855361938, 0.9938899278640747, 1.134493350982666, 1.2750968933105469, 1.415700912475586, 1.5563044548034668, 1.6969079971313477, 1.837511420249939, 1.9781149625778198, 2.1187186241149902, 2.259321928024292, 2.399925470352173, 2.5405290126800537, 2.6811325550079346, 2.8217360973358154, 2.9623396396636963, 3.102942943572998, 3.243546485900879, 3.3841500282287598, 3.5247535705566406, 3.6653571128845215, 3.8059606552124023, 3.946564197540283, 4.087167739868164, 4.227771282196045, 4.368374824523926, 4.508978366851807, 4.6495819091796875, 4.79018497467041, 4.930788516998291, 5.071392059326172, 5.211995601654053, 5.352599143981934, 5.4932026863098145, 5.633806228637695, 5.774409294128418, 5.915013313293457]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 8.0, 11.0, 10.0, 15.0, 19.0, 28.0, 39.0, 26.0, 26.0, 35.0, 50.0, 85.0, 117.0, 104.0, 91.0, 55.0, 62.0, 45.0, 33.0, 27.0, 30.0, 18.0, 10.0, 11.0, 14.0, 6.0, 11.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7150139808654785, -2.5972235202789307, -2.479433059692383, -2.361642837524414, -2.243852376937866, -2.1260619163513184, -2.0082714557647705, -1.8904811143875122, -1.772690773010254, -1.654900312423706, -1.5371099710464478, -1.4193195104599, -1.3015291690826416, -1.1837387084960938, -1.065948247909546, -0.9481579065322876, -0.8303674459457397, -0.7125770449638367, -0.5947866439819336, -0.47699621319770813, -0.35920581221580505, -0.2414153814315796, -0.12362498044967651, -0.0058345794677734375, 0.11195582151412964, 0.22974622249603271, 0.3475366234779358, 0.46532705426216125, 0.5831174850463867, 0.7009078860282898, 0.8186982870101929, 0.936488687992096, 1.054279088973999, 1.1720695495605469, 1.2898598909378052, 1.407650351524353, 1.5254406929016113, 1.6432311534881592, 1.761021614074707, 1.8788119554519653, 1.9966022968292236, 2.1143927574157715, 2.2321832180023193, 2.349973440170288, 2.467763900756836, 2.585554361343384, 2.7033448219299316, 2.8211350440979004, 2.9389257431030273, 3.056716203689575, 3.174506664276123, 3.292296886444092, 3.4100873470306396, 3.5278778076171875, 3.6456682682037354, 3.763458728790283, 3.881248950958252, 3.9990394115448, 4.116829872131348, 4.234620094299316, 4.352410793304443, 4.470201015472412, 4.587991237640381, 4.705781936645508, 4.823572158813477]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 10.0, 9.0, 15.0, 11.0, 27.0, 38.0, 48.0, 97.0, 149.0, 367.0, 805.0, 2545.0, 12215.0, 241450.0, 3712282.0, 208886.0, 11417.0, 2494.0, 808.0, 331.0, 133.0, 57.0, 33.0, 21.0, 9.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-0.97021484375, -0.948883056640625, -0.92755126953125, -0.906219482421875, -0.8848876953125, -0.863555908203125, -0.84222412109375, -0.820892333984375, -0.799560546875, -0.778228759765625, -0.75689697265625, -0.735565185546875, -0.7142333984375, -0.692901611328125, -0.67156982421875, -0.650238037109375, -0.62890625, -0.607574462890625, -0.58624267578125, -0.564910888671875, -0.5435791015625, -0.522247314453125, -0.50091552734375, -0.479583740234375, -0.458251953125, -0.436920166015625, -0.41558837890625, -0.394256591796875, -0.3729248046875, -0.351593017578125, -0.33026123046875, -0.308929443359375, -0.28759765625, -0.266265869140625, -0.24493408203125, -0.223602294921875, -0.2022705078125, -0.180938720703125, -0.15960693359375, -0.138275146484375, -0.116943359375, -0.095611572265625, -0.07427978515625, -0.052947998046875, -0.0316162109375, -0.010284423828125, 0.01104736328125, 0.032379150390625, 0.0537109375, 0.075042724609375, 0.09637451171875, 0.117706298828125, 0.1390380859375, 0.160369873046875, 0.18170166015625, 0.203033447265625, 0.224365234375, 0.245697021484375, 0.26702880859375, 0.288360595703125, 0.3096923828125, 0.331024169921875, 0.35235595703125, 0.373687744140625, 0.39501953125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 9.0, 16.0, 13.0, 20.0, 27.0, 32.0, 32.0, 43.0, 59.0, 50.0, 63.0, 49.0, 65.0, 58.0, 59.0, 44.0, 51.0, 46.0, 42.0, 50.0, 40.0, 31.0, 20.0, 26.0, 12.0, 6.0, 4.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257080078125, -0.249298095703125, -0.24151611328125, -0.233734130859375, -0.2259521484375, -0.218170166015625, -0.21038818359375, -0.202606201171875, -0.19482421875, -0.187042236328125, -0.17926025390625, -0.171478271484375, -0.1636962890625, -0.155914306640625, -0.14813232421875, -0.140350341796875, -0.132568359375, -0.124786376953125, -0.11700439453125, -0.109222412109375, -0.1014404296875, -0.093658447265625, -0.08587646484375, -0.078094482421875, -0.0703125, -0.062530517578125, -0.05474853515625, -0.046966552734375, -0.0391845703125, -0.031402587890625, -0.02362060546875, -0.015838623046875, -0.008056640625, -0.000274658203125, 0.00750732421875, 0.015289306640625, 0.0230712890625, 0.030853271484375, 0.03863525390625, 0.046417236328125, 0.05419921875, 0.061981201171875, 0.06976318359375, 0.077545166015625, 0.0853271484375, 0.093109130859375, 0.10089111328125, 0.108673095703125, 0.116455078125, 0.124237060546875, 0.13201904296875, 0.139801025390625, 0.1475830078125, 0.155364990234375, 0.16314697265625, 0.170928955078125, 0.1787109375, 0.186492919921875, 0.19427490234375, 0.202056884765625, 0.2098388671875, 0.217620849609375, 0.22540283203125, 0.233184814453125, 0.240966796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 6.0, 5.0, 13.0, 23.0, 22.0, 41.0, 87.0, 122.0, 191.0, 399.0, 758.0, 1929.0, 6044.0, 41018.0, 2519324.0, 1583916.0, 31612.0, 5395.0, 1712.0, 743.0, 392.0, 184.0, 125.0, 82.0, 53.0, 30.0, 22.0, 14.0, 3.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8046875, -0.7809829711914062, -0.7572784423828125, -0.7335739135742188, -0.709869384765625, -0.6861648559570312, -0.6624603271484375, -0.6387557983398438, -0.61505126953125, -0.5913467407226562, -0.5676422119140625, -0.5439376831054688, -0.520233154296875, -0.49652862548828125, -0.4728240966796875, -0.44911956787109375, -0.4254150390625, -0.40171051025390625, -0.3780059814453125, -0.35430145263671875, -0.330596923828125, -0.30689239501953125, -0.2831878662109375, -0.25948333740234375, -0.23577880859375, -0.21207427978515625, -0.1883697509765625, -0.16466522216796875, -0.140960693359375, -0.11725616455078125, -0.0935516357421875, -0.06984710693359375, -0.046142578125, -0.02243804931640625, 0.0012664794921875, 0.02497100830078125, 0.048675537109375, 0.07238006591796875, 0.0960845947265625, 0.11978912353515625, 0.14349365234375, 0.16719818115234375, 0.1909027099609375, 0.21460723876953125, 0.238311767578125, 0.26201629638671875, 0.2857208251953125, 0.30942535400390625, 0.3331298828125, 0.35683441162109375, 0.3805389404296875, 0.40424346923828125, 0.427947998046875, 0.45165252685546875, 0.4753570556640625, 0.49906158447265625, 0.52276611328125, 0.5464706420898438, 0.5701751708984375, 0.5938796997070312, 0.617584228515625, 0.6412887573242188, 0.6649932861328125, 0.6886978149414062, 0.71240234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 9.0, 19.0, 24.0, 41.0, 45.0, 72.0, 136.0, 283.0, 436.0, 648.0, 769.0, 608.0, 390.0, 245.0, 122.0, 67.0, 45.0, 32.0, 17.0, 15.0, 12.0, 6.0, 8.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.6318359375, -0.6149444580078125, -0.598052978515625, -0.5811614990234375, -0.56427001953125, -0.5473785400390625, -0.530487060546875, -0.5135955810546875, -0.4967041015625, -0.4798126220703125, -0.462921142578125, -0.4460296630859375, -0.42913818359375, -0.4122467041015625, -0.395355224609375, -0.3784637451171875, -0.361572265625, -0.3446807861328125, -0.327789306640625, -0.3108978271484375, -0.29400634765625, -0.2771148681640625, -0.260223388671875, -0.2433319091796875, -0.2264404296875, -0.2095489501953125, -0.192657470703125, -0.1757659912109375, -0.15887451171875, -0.1419830322265625, -0.125091552734375, -0.1082000732421875, -0.09130859375, -0.0744171142578125, -0.057525634765625, -0.0406341552734375, -0.02374267578125, -0.0068511962890625, 0.010040283203125, 0.0269317626953125, 0.0438232421875, 0.0607147216796875, 0.077606201171875, 0.0944976806640625, 0.11138916015625, 0.1282806396484375, 0.145172119140625, 0.1620635986328125, 0.178955078125, 0.1958465576171875, 0.212738037109375, 0.2296295166015625, 0.24652099609375, 0.2634124755859375, 0.280303955078125, 0.2971954345703125, 0.3140869140625, 0.3309783935546875, 0.347869873046875, 0.3647613525390625, 0.38165283203125, 0.3985443115234375, 0.415435791015625, 0.4323272705078125, 0.44921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 14.0, 29.0, 85.0, 165.0, 266.0, 233.0, 120.0, 48.0, 14.0, 11.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.062931060791016, -4.849284648895264, -4.635638236999512, -4.42199182510376, -4.208345413208008, -3.994699239730835, -3.781053066253662, -3.56740665435791, -3.353760242462158, -3.1401138305664062, -2.9264674186706543, -2.7128212451934814, -2.4991748332977295, -2.2855284214019775, -2.0718822479248047, -1.8582358360290527, -1.6445894241333008, -1.4309430122375488, -1.2172967195510864, -1.003650426864624, -0.7900040149688721, -0.5763576030731201, -0.3627113103866577, -0.1490650177001953, 0.06458139419555664, 0.2782277464866638, 0.491874098777771, 0.7055204510688782, 0.9191668033599854, 1.1328132152557373, 1.3464595079421997, 1.560105800628662, 1.773752212524414, 1.987398624420166, 2.201045036315918, 2.414691209793091, 2.6283376216888428, 2.8419840335845947, 3.0556302070617676, 3.2692766189575195, 3.4829230308532715, 3.6965694427490234, 3.9102158546447754, 4.123862266540527, 4.337508201599121, 4.551155090332031, 4.764801025390625, 4.978447437286377, 5.192093849182129, 5.405740261077881, 5.619386672973633, 5.833033084869385, 6.046679496765137, 6.2603254318237305, 6.473971843719482, 6.687618255615234, 6.901264667510986, 7.114911079406738, 7.32855749130249, 7.542203903198242, 7.755849838256836, 7.969496726989746, 8.18314266204834, 8.39678955078125, 8.610435485839844]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 6.0, 12.0, 8.0, 18.0, 19.0, 19.0, 24.0, 33.0, 35.0, 39.0, 41.0, 43.0, 50.0, 56.0, 71.0, 78.0, 47.0, 57.0, 41.0, 49.0, 39.0, 36.0, 36.0, 29.0, 16.0, 21.0, 22.0, 9.0, 9.0, 12.0, 5.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7593796253204346, -1.687211513519287, -1.61504328250885, -1.5428751707077026, -1.4707069396972656, -1.3985388278961182, -1.3263707160949707, -1.2542026042938232, -1.1820343732833862, -1.1098662614822388, -1.0376980304718018, -0.9655299186706543, -0.8933617472648621, -0.8211935758590698, -0.7490254640579224, -0.6768572926521301, -0.6046891212463379, -0.5325209498405457, -0.4603528082370758, -0.38818466663360596, -0.3160164952278137, -0.24384832382202148, -0.17168018221855164, -0.09951204061508179, -0.02734386920928955, 0.04482428729534149, 0.11699244379997253, 0.18916060030460358, 0.2613287568092346, 0.33349692821502686, 0.4056650698184967, 0.47783321142196655, 0.5500011444091797, 0.6221693158149719, 0.6943374872207642, 0.7665055990219116, 0.8386737704277039, 0.9108419418334961, 0.9830100536346436, 1.055178165435791, 1.127346396446228, 1.1995145082473755, 1.2716827392578125, 1.34385085105896, 1.4160189628601074, 1.4881871938705444, 1.560355305671692, 1.632523536682129, 1.7046916484832764, 1.7768597602844238, 1.8490279912948608, 1.9211961030960083, 1.9933643341064453, 2.0655324459075928, 2.1377005577087402, 2.2098686695098877, 2.282036781311035, 2.3542048931121826, 2.42637300491333, 2.4985413551330566, 2.570709466934204, 2.6428775787353516, 2.715045690536499, 2.7872138023376465, 2.859382152557373]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 12.0, 8.0, 10.0, 23.0, 28.0, 53.0, 82.0, 134.0, 269.0, 485.0, 1079.0, 2669.0, 7353.0, 25499.0, 126005.0, 601766.0, 226641.0, 39564.0, 10467.0, 3589.0, 1406.0, 595.0, 323.0, 188.0, 90.0, 66.0, 40.0, 21.0, 25.0, 12.0, 11.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.51904296875, -0.5036201477050781, -0.48819732666015625, -0.4727745056152344, -0.4573516845703125, -0.4419288635253906, -0.42650604248046875, -0.4110832214355469, -0.395660400390625, -0.3802375793457031, -0.36481475830078125, -0.3493919372558594, -0.3339691162109375, -0.3185462951660156, -0.30312347412109375, -0.2877006530761719, -0.27227783203125, -0.2568550109863281, -0.24143218994140625, -0.22600936889648438, -0.2105865478515625, -0.19516372680664062, -0.17974090576171875, -0.16431808471679688, -0.148895263671875, -0.13347244262695312, -0.11804962158203125, -0.10262680053710938, -0.0872039794921875, -0.07178115844726562, -0.05635833740234375, -0.040935516357421875, -0.0255126953125, -0.010089874267578125, 0.00533294677734375, 0.020755767822265625, 0.0361785888671875, 0.051601409912109375, 0.06702423095703125, 0.08244705200195312, 0.097869873046875, 0.11329269409179688, 0.12871551513671875, 0.14413833618164062, 0.1595611572265625, 0.17498397827148438, 0.19040679931640625, 0.20582962036132812, 0.22125244140625, 0.23667526245117188, 0.25209808349609375, 0.2675209045410156, 0.2829437255859375, 0.2983665466308594, 0.31378936767578125, 0.3292121887207031, 0.344635009765625, 0.3600578308105469, 0.37548065185546875, 0.3909034729003906, 0.4063262939453125, 0.4217491149902344, 0.43717193603515625, 0.4525947570800781, 0.468017578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 9.0, 6.0, 16.0, 17.0, 25.0, 29.0, 38.0, 32.0, 38.0, 41.0, 55.0, 66.0, 62.0, 61.0, 75.0, 67.0, 61.0, 50.0, 53.0, 38.0, 45.0, 33.0, 23.0, 22.0, 14.0, 10.0, 11.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307861328125, -0.2985038757324219, -0.28914642333984375, -0.2797889709472656, -0.2704315185546875, -0.2610740661621094, -0.25171661376953125, -0.24235916137695312, -0.233001708984375, -0.22364425659179688, -0.21428680419921875, -0.20492935180664062, -0.1955718994140625, -0.18621444702148438, -0.17685699462890625, -0.16749954223632812, -0.15814208984375, -0.14878463745117188, -0.13942718505859375, -0.13006973266601562, -0.1207122802734375, -0.11135482788085938, -0.10199737548828125, -0.09263992309570312, -0.083282470703125, -0.07392501831054688, -0.06456756591796875, -0.055210113525390625, -0.0458526611328125, -0.036495208740234375, -0.02713775634765625, -0.017780303955078125, -0.0084228515625, 0.000934600830078125, 0.01029205322265625, 0.019649505615234375, 0.0290069580078125, 0.038364410400390625, 0.04772186279296875, 0.057079315185546875, 0.066436767578125, 0.07579421997070312, 0.08515167236328125, 0.09450912475585938, 0.1038665771484375, 0.11322402954101562, 0.12258148193359375, 0.13193893432617188, 0.14129638671875, 0.15065383911132812, 0.16001129150390625, 0.16936874389648438, 0.1787261962890625, 0.18808364868164062, 0.19744110107421875, 0.20679855346679688, 0.216156005859375, 0.22551345825195312, 0.23487091064453125, 0.24422836303710938, 0.2535858154296875, 0.2629432678222656, 0.27230072021484375, 0.2816581726074219, 0.291015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 10.0, 3.0, 11.0, 8.0, 11.0, 15.0, 25.0, 33.0, 37.0, 49.0, 66.0, 145.0, 181.0, 246.0, 369.0, 754.0, 1379.0, 3575.0, 11707.0, 59832.0, 743980.0, 191472.0, 23858.0, 5977.0, 2252.0, 1044.0, 509.0, 347.0, 201.0, 121.0, 91.0, 67.0, 39.0, 36.0, 19.0, 29.0, 15.0, 13.0, 9.0, 8.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.701171875, -0.6815567016601562, -0.6619415283203125, -0.6423263549804688, -0.622711181640625, -0.6030960083007812, -0.5834808349609375, -0.5638656616210938, -0.54425048828125, -0.5246353149414062, -0.5050201416015625, -0.48540496826171875, -0.465789794921875, -0.44617462158203125, -0.4265594482421875, -0.40694427490234375, -0.3873291015625, -0.36771392822265625, -0.3480987548828125, -0.32848358154296875, -0.308868408203125, -0.28925323486328125, -0.2696380615234375, -0.25002288818359375, -0.23040771484375, -0.21079254150390625, -0.1911773681640625, -0.17156219482421875, -0.151947021484375, -0.13233184814453125, -0.1127166748046875, -0.09310150146484375, -0.073486328125, -0.05387115478515625, -0.0342559814453125, -0.01464080810546875, 0.004974365234375, 0.02458953857421875, 0.0442047119140625, 0.06381988525390625, 0.08343505859375, 0.10305023193359375, 0.1226654052734375, 0.14228057861328125, 0.161895751953125, 0.18151092529296875, 0.2011260986328125, 0.22074127197265625, 0.2403564453125, 0.25997161865234375, 0.2795867919921875, 0.29920196533203125, 0.318817138671875, 0.33843231201171875, 0.3580474853515625, 0.37766265869140625, 0.39727783203125, 0.41689300537109375, 0.4365081787109375, 0.45612335205078125, 0.475738525390625, 0.49535369873046875, 0.5149688720703125, 0.5345840454101562, 0.55419921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 11.0, 4.0, 8.0, 7.0, 10.0, 12.0, 19.0, 20.0, 26.0, 35.0, 29.0, 41.0, 57.0, 59.0, 63.0, 70.0, 71.0, 58.0, 43.0, 48.0, 57.0, 33.0, 35.0, 32.0, 26.0, 17.0, 23.0, 14.0, 18.0, 6.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83642578125, -0.8070144653320312, -0.7776031494140625, -0.7481918334960938, -0.718780517578125, -0.6893692016601562, -0.6599578857421875, -0.6305465698242188, -0.60113525390625, -0.5717239379882812, -0.5423126220703125, -0.5129013061523438, -0.483489990234375, -0.45407867431640625, -0.4246673583984375, -0.39525604248046875, -0.3658447265625, -0.33643341064453125, -0.3070220947265625, -0.27761077880859375, -0.248199462890625, -0.21878814697265625, -0.1893768310546875, -0.15996551513671875, -0.13055419921875, -0.10114288330078125, -0.0717315673828125, -0.04232025146484375, -0.012908935546875, 0.01650238037109375, 0.0459136962890625, 0.07532501220703125, 0.104736328125, 0.13414764404296875, 0.1635589599609375, 0.19297027587890625, 0.222381591796875, 0.25179290771484375, 0.2812042236328125, 0.31061553955078125, 0.34002685546875, 0.36943817138671875, 0.3988494873046875, 0.42826080322265625, 0.457672119140625, 0.48708343505859375, 0.5164947509765625, 0.5459060668945312, 0.5753173828125, 0.6047286987304688, 0.6341400146484375, 0.6635513305664062, 0.692962646484375, 0.7223739624023438, 0.7517852783203125, 0.7811965942382812, 0.81060791015625, 0.8400192260742188, 0.8694305419921875, 0.8988418579101562, 0.928253173828125, 0.9576644897460938, 0.9870758056640625, 1.0164871215820312, 1.0458984375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 10.0, 17.0, 38.0, 49.0, 114.0, 188.0, 340.0, 674.0, 1866.0, 5081.0, 17478.0, 80395.0, 780646.0, 126938.0, 24023.0, 6594.0, 2238.0, 916.0, 423.0, 224.0, 111.0, 68.0, 34.0, 24.0, 20.0, 13.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238525390625, -0.229888916015625, -0.22125244140625, -0.212615966796875, -0.2039794921875, -0.195343017578125, -0.18670654296875, -0.178070068359375, -0.16943359375, -0.160797119140625, -0.15216064453125, -0.143524169921875, -0.1348876953125, -0.126251220703125, -0.11761474609375, -0.108978271484375, -0.100341796875, -0.091705322265625, -0.08306884765625, -0.074432373046875, -0.0657958984375, -0.057159423828125, -0.04852294921875, -0.039886474609375, -0.03125, -0.022613525390625, -0.01397705078125, -0.005340576171875, 0.0032958984375, 0.011932373046875, 0.02056884765625, 0.029205322265625, 0.037841796875, 0.046478271484375, 0.05511474609375, 0.063751220703125, 0.0723876953125, 0.081024169921875, 0.08966064453125, 0.098297119140625, 0.10693359375, 0.115570068359375, 0.12420654296875, 0.132843017578125, 0.1414794921875, 0.150115966796875, 0.15875244140625, 0.167388916015625, 0.176025390625, 0.184661865234375, 0.19329833984375, 0.201934814453125, 0.2105712890625, 0.219207763671875, 0.22784423828125, 0.236480712890625, 0.2451171875, 0.253753662109375, 0.26239013671875, 0.271026611328125, 0.2796630859375, 0.288299560546875, 0.29693603515625, 0.305572509765625, 0.314208984375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 4.0, 2.0, 10.0, 6.0, 7.0, 8.0, 17.0, 9.0, 12.0, 25.0, 41.0, 34.0, 60.0, 91.0, 118.0, 129.0, 118.0, 72.0, 50.0, 42.0, 26.0, 27.0, 15.0, 10.0, 15.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0439109802246094e-05, -5.844142287969589e-05, -5.644373595714569e-05, -5.444604903459549e-05, -5.244836211204529e-05, -5.045067518949509e-05, -4.8452988266944885e-05, -4.6455301344394684e-05, -4.445761442184448e-05, -4.245992749929428e-05, -4.046224057674408e-05, -3.846455365419388e-05, -3.646686673164368e-05, -3.4469179809093475e-05, -3.2471492886543274e-05, -3.0473805963993073e-05, -2.847611904144287e-05, -2.647843211889267e-05, -2.4480745196342468e-05, -2.2483058273792267e-05, -2.0485371351242065e-05, -1.8487684428691864e-05, -1.6489997506141663e-05, -1.4492310583591461e-05, -1.249462366104126e-05, -1.0496936738491058e-05, -8.499249815940857e-06, -6.5015628933906555e-06, -4.503875970840454e-06, -2.5061890482902527e-06, -5.085021257400513e-07, 1.4891847968101501e-06, 3.4868717193603516e-06, 5.484558641910553e-06, 7.482245564460754e-06, 9.479932487010956e-06, 1.1477619409561157e-05, 1.3475306332111359e-05, 1.547299325466156e-05, 1.747068017721176e-05, 1.9468367099761963e-05, 2.1466054022312164e-05, 2.3463740944862366e-05, 2.5461427867412567e-05, 2.745911478996277e-05, 2.945680171251297e-05, 3.145448863506317e-05, 3.345217555761337e-05, 3.5449862480163574e-05, 3.7447549402713776e-05, 3.944523632526398e-05, 4.144292324781418e-05, 4.344061017036438e-05, 4.543829709291458e-05, 4.743598401546478e-05, 4.9433670938014984e-05, 5.1431357860565186e-05, 5.342904478311539e-05, 5.542673170566559e-05, 5.742441862821579e-05, 5.942210555076599e-05, 6.141979247331619e-05, 6.34174793958664e-05, 6.54151663184166e-05, 6.74128532409668e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 6.0, 14.0, 13.0, 22.0, 35.0, 55.0, 99.0, 166.0, 286.0, 560.0, 1118.0, 2498.0, 6366.0, 19333.0, 79158.0, 728112.0, 162589.0, 31993.0, 9606.0, 3431.0, 1439.0, 723.0, 372.0, 206.0, 124.0, 91.0, 49.0, 22.0, 16.0, 18.0, 5.0, 7.0, 8.0, 5.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.265625, -0.2579689025878906, -0.25031280517578125, -0.24265670776367188, -0.2350006103515625, -0.22734451293945312, -0.21968841552734375, -0.21203231811523438, -0.204376220703125, -0.19672012329101562, -0.18906402587890625, -0.18140792846679688, -0.1737518310546875, -0.16609573364257812, -0.15843963623046875, -0.15078353881835938, -0.14312744140625, -0.13547134399414062, -0.12781524658203125, -0.12015914916992188, -0.1125030517578125, -0.10484695434570312, -0.09719085693359375, -0.08953475952148438, -0.081878662109375, -0.07422256469726562, -0.06656646728515625, -0.058910369873046875, -0.0512542724609375, -0.043598175048828125, -0.03594207763671875, -0.028285980224609375, -0.0206298828125, -0.012973785400390625, -0.00531768798828125, 0.002338409423828125, 0.0099945068359375, 0.017650604248046875, 0.02530670166015625, 0.032962799072265625, 0.040618896484375, 0.048274993896484375, 0.05593109130859375, 0.06358718872070312, 0.0712432861328125, 0.07889938354492188, 0.08655548095703125, 0.09421157836914062, 0.10186767578125, 0.10952377319335938, 0.11717987060546875, 0.12483596801757812, 0.1324920654296875, 0.14014816284179688, 0.14780426025390625, 0.15546035766601562, 0.163116455078125, 0.17077255249023438, 0.17842864990234375, 0.18608474731445312, 0.1937408447265625, 0.20139694213867188, 0.20905303955078125, 0.21670913696289062, 0.224365234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 2.0, 3.0, 7.0, 11.0, 2.0, 15.0, 11.0, 19.0, 25.0, 34.0, 21.0, 38.0, 49.0, 76.0, 118.0, 118.0, 95.0, 76.0, 55.0, 41.0, 31.0, 31.0, 19.0, 13.0, 17.0, 17.0, 9.0, 9.0, 7.0, 2.0, 4.0, 8.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14453125, -0.1386089324951172, -0.13268661499023438, -0.12676429748535156, -0.12084197998046875, -0.11491966247558594, -0.10899734497070312, -0.10307502746582031, -0.0971527099609375, -0.09123039245605469, -0.08530807495117188, -0.07938575744628906, -0.07346343994140625, -0.06754112243652344, -0.061618804931640625, -0.05569648742675781, -0.049774169921875, -0.04385185241699219, -0.037929534912109375, -0.03200721740722656, -0.02608489990234375, -0.020162582397460938, -0.014240264892578125, -0.008317947387695312, -0.0023956298828125, 0.0035266876220703125, 0.009449005126953125, 0.015371322631835938, 0.02129364013671875, 0.027215957641601562, 0.033138275146484375, 0.03906059265136719, 0.04498291015625, 0.05090522766113281, 0.056827545166015625, 0.06274986267089844, 0.06867218017578125, 0.07459449768066406, 0.08051681518554688, 0.08643913269042969, 0.0923614501953125, 0.09828376770019531, 0.10420608520507812, 0.11012840270996094, 0.11605072021484375, 0.12197303771972656, 0.12789535522460938, 0.1338176727294922, 0.139739990234375, 0.1456623077392578, 0.15158462524414062, 0.15750694274902344, 0.16342926025390625, 0.16935157775878906, 0.17527389526367188, 0.1811962127685547, 0.1871185302734375, 0.1930408477783203, 0.19896316528320312, 0.20488548278808594, 0.21080780029296875, 0.21673011779785156, 0.22265243530273438, 0.2285747528076172, 0.2344970703125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 12.0, 13.0, 45.0, 76.0, 146.0, 314.0, 141.0, 107.0, 56.0, 29.0, 17.0, 10.0, 5.0, 8.0, 3.0, 5.0, 1.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.1587564945220947, -3.0032198429107666, -2.8476834297180176, -2.6921467781066895, -2.5366103649139404, -2.3810737133026123, -2.2255373001098633, -2.070000648498535, -1.9144641160964966, -1.758927583694458, -1.6033910512924194, -1.4478545188903809, -1.2923178672790527, -1.1367814540863037, -0.9812448024749756, -0.825708270072937, -0.6701717376708984, -0.5146352052688599, -0.3590986430644989, -0.20356208086013794, -0.048025548458099365, 0.10751098394393921, 0.26304757595062256, 0.41858410835266113, 0.5741206407546997, 0.7296571731567383, 0.8851937055587769, 1.0407302379608154, 1.1962668895721436, 1.3518033027648926, 1.5073399543762207, 1.6628764867782593, 1.8184127807617188, 1.9739493131637573, 2.129485845565796, 2.285022497177124, 2.440558910369873, 2.596095561981201, 2.7516322135925293, 2.9071686267852783, 3.0627050399780273, 3.2182416915893555, 3.3737781047821045, 3.5293147563934326, 3.6848511695861816, 3.8403878211975098, 3.995924472808838, 4.151460647583008, 4.306997299194336, 4.462533950805664, 4.618070602416992, 4.773606777191162, 4.92914342880249, 5.084680080413818, 5.2402167320251465, 5.395752906799316, 5.551290035247803, 5.706826686859131, 5.862363338470459, 6.017899513244629, 6.173436164855957, 6.328972816467285, 6.484509468078613, 6.640046119689941, 6.795582294464111]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 2.0, 6.0, 5.0, 7.0, 13.0, 14.0, 17.0, 26.0, 22.0, 17.0, 38.0, 35.0, 41.0, 55.0, 38.0, 101.0, 120.0, 94.0, 52.0, 49.0, 45.0, 38.0, 31.0, 19.0, 17.0, 22.0, 13.0, 10.0, 12.0, 16.0, 6.0, 6.0, 7.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.068901062011719, -3.94315767288208, -3.8174142837524414, -3.6916708946228027, -3.565927505493164, -3.4401841163635254, -3.3144407272338867, -3.188697338104248, -3.0629539489746094, -2.9372105598449707, -2.811467170715332, -2.6857237815856934, -2.5599803924560547, -2.434237003326416, -2.3084936141967773, -2.1827502250671387, -2.057007074356079, -1.9312636852264404, -1.8055202960968018, -1.679776906967163, -1.5540335178375244, -1.4282901287078857, -1.3025468587875366, -1.176803469657898, -1.0510600805282593, -0.9253166913986206, -0.7995733022689819, -0.673829972743988, -0.5480865836143494, -0.4223431944847107, -0.2965998649597168, -0.17085647583007812, -0.045113325119018555, 0.08063004910945892, 0.2063734233379364, 0.3321167826652527, 0.45786017179489136, 0.58360356092453, 0.7093468904495239, 0.8350902795791626, 0.9608336687088013, 1.08657705783844, 1.2123204469680786, 1.3380637168884277, 1.4638071060180664, 1.589550495147705, 1.7152938842773438, 1.8410372734069824, 1.966780662536621, 2.0925240516662598, 2.2182674407958984, 2.344010829925537, 2.469754219055176, 2.5954976081848145, 2.721240997314453, 2.846984386444092, 2.9727277755737305, 3.098471164703369, 3.224214553833008, 3.3499579429626465, 3.475701332092285, 3.601444721221924, 3.7271881103515625, 3.852931499481201, 3.9786746501922607]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 4.0, 8.0, 10.0, 12.0, 15.0, 21.0, 23.0, 31.0, 53.0, 89.0, 133.0, 222.0, 465.0, 995.0, 2513.0, 9906.0, 191950.0, 3766183.0, 205591.0, 11411.0, 2775.0, 950.0, 448.0, 228.0, 108.0, 55.0, 26.0, 9.0, 10.0, 4.0, 10.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.1005859375, -1.0758590698242188, -1.0511322021484375, -1.0264053344726562, -1.001678466796875, -0.9769515991210938, -0.9522247314453125, -0.9274978637695312, -0.90277099609375, -0.8780441284179688, -0.8533172607421875, -0.8285903930664062, -0.803863525390625, -0.7791366577148438, -0.7544097900390625, -0.7296829223632812, -0.7049560546875, -0.6802291870117188, -0.6555023193359375, -0.6307754516601562, -0.606048583984375, -0.5813217163085938, -0.5565948486328125, -0.5318679809570312, -0.50714111328125, -0.48241424560546875, -0.4576873779296875, -0.43296051025390625, -0.408233642578125, -0.38350677490234375, -0.3587799072265625, -0.33405303955078125, -0.309326171875, -0.28459930419921875, -0.2598724365234375, -0.23514556884765625, -0.210418701171875, -0.18569183349609375, -0.1609649658203125, -0.13623809814453125, -0.11151123046875, -0.08678436279296875, -0.0620574951171875, -0.03733062744140625, -0.012603759765625, 0.01212310791015625, 0.0368499755859375, 0.06157684326171875, 0.0863037109375, 0.11103057861328125, 0.1357574462890625, 0.16048431396484375, 0.185211181640625, 0.20993804931640625, 0.2346649169921875, 0.25939178466796875, 0.28411865234375, 0.30884552001953125, 0.3335723876953125, 0.35829925537109375, 0.383026123046875, 0.40775299072265625, 0.4324798583984375, 0.45720672607421875, 0.48193359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 5.0, 1.0, 9.0, 9.0, 14.0, 14.0, 21.0, 14.0, 18.0, 26.0, 19.0, 32.0, 42.0, 33.0, 29.0, 44.0, 39.0, 40.0, 40.0, 50.0, 44.0, 35.0, 38.0, 39.0, 46.0, 40.0, 31.0, 28.0, 22.0, 32.0, 22.0, 23.0, 18.0, 14.0, 13.0, 7.0, 9.0, 13.0, 6.0, 4.0, 3.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.17333984375, -0.16715431213378906, -0.16096878051757812, -0.1547832489013672, -0.14859771728515625, -0.1424121856689453, -0.13622665405273438, -0.13004112243652344, -0.1238555908203125, -0.11767005920410156, -0.11148452758789062, -0.10529899597167969, -0.09911346435546875, -0.09292793273925781, -0.08674240112304688, -0.08055686950683594, -0.074371337890625, -0.06818580627441406, -0.062000274658203125, -0.05581474304199219, -0.04962921142578125, -0.04344367980957031, -0.037258148193359375, -0.031072616577148438, -0.0248870849609375, -0.018701553344726562, -0.012516021728515625, -0.0063304901123046875, -0.00014495849609375, 0.0060405731201171875, 0.012226104736328125, 0.018411636352539062, 0.02459716796875, 0.030782699584960938, 0.036968231201171875, 0.04315376281738281, 0.04933929443359375, 0.05552482604980469, 0.061710357666015625, 0.06789588928222656, 0.0740814208984375, 0.08026695251464844, 0.08645248413085938, 0.09263801574707031, 0.09882354736328125, 0.10500907897949219, 0.11119461059570312, 0.11738014221191406, 0.123565673828125, 0.12975120544433594, 0.13593673706054688, 0.1421222686767578, 0.14830780029296875, 0.1544933319091797, 0.16067886352539062, 0.16686439514160156, 0.1730499267578125, 0.17923545837402344, 0.18542098999023438, 0.1916065216064453, 0.19779205322265625, 0.2039775848388672, 0.21016311645507812, 0.21634864807128906, 0.2225341796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 13.0, 23.0, 50.0, 89.0, 196.0, 596.0, 3100.0, 123808.0, 4050448.0, 13954.0, 1396.0, 348.0, 146.0, 59.0, 27.0, 14.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8369140625, -1.779998779296875, -1.72308349609375, -1.666168212890625, -1.6092529296875, -1.552337646484375, -1.49542236328125, -1.438507080078125, -1.381591796875, -1.324676513671875, -1.26776123046875, -1.210845947265625, -1.1539306640625, -1.097015380859375, -1.04010009765625, -0.983184814453125, -0.92626953125, -0.869354248046875, -0.81243896484375, -0.755523681640625, -0.6986083984375, -0.641693115234375, -0.58477783203125, -0.527862548828125, -0.470947265625, -0.414031982421875, -0.35711669921875, -0.300201416015625, -0.2432861328125, -0.186370849609375, -0.12945556640625, -0.072540283203125, -0.015625, 0.041290283203125, 0.09820556640625, 0.155120849609375, 0.2120361328125, 0.268951416015625, 0.32586669921875, 0.382781982421875, 0.439697265625, 0.496612548828125, 0.55352783203125, 0.610443115234375, 0.6673583984375, 0.724273681640625, 0.78118896484375, 0.838104248046875, 0.89501953125, 0.951934814453125, 1.00885009765625, 1.065765380859375, 1.1226806640625, 1.179595947265625, 1.23651123046875, 1.293426513671875, 1.350341796875, 1.407257080078125, 1.46417236328125, 1.521087646484375, 1.5780029296875, 1.634918212890625, 1.69183349609375, 1.748748779296875, 1.8056640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 8.0, 14.0, 15.0, 25.0, 63.0, 110.0, 234.0, 546.0, 1037.0, 1023.0, 554.0, 231.0, 91.0, 52.0, 19.0, 23.0, 10.0, 12.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.2263565063476562, -1.1978302001953125, -1.1693038940429688, -1.140777587890625, -1.1122512817382812, -1.0837249755859375, -1.0551986694335938, -1.02667236328125, -0.9981460571289062, -0.9696197509765625, -0.9410934448242188, -0.912567138671875, -0.8840408325195312, -0.8555145263671875, -0.8269882202148438, -0.7984619140625, -0.7699356079101562, -0.7414093017578125, -0.7128829956054688, -0.684356689453125, -0.6558303833007812, -0.6273040771484375, -0.5987777709960938, -0.57025146484375, -0.5417251586914062, -0.5131988525390625, -0.48467254638671875, -0.456146240234375, -0.42761993408203125, -0.3990936279296875, -0.37056732177734375, -0.342041015625, -0.31351470947265625, -0.2849884033203125, -0.25646209716796875, -0.227935791015625, -0.19940948486328125, -0.1708831787109375, -0.14235687255859375, -0.11383056640625, -0.08530426025390625, -0.0567779541015625, -0.02825164794921875, 0.000274658203125, 0.02880096435546875, 0.0573272705078125, 0.08585357666015625, 0.1143798828125, 0.14290618896484375, 0.1714324951171875, 0.19995880126953125, 0.228485107421875, 0.25701141357421875, 0.2855377197265625, 0.31406402587890625, 0.34259033203125, 0.37111663818359375, 0.3996429443359375, 0.42816925048828125, 0.456695556640625, 0.48522186279296875, 0.5137481689453125, 0.5422744750976562, 0.57080078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 17.0, 38.0, 64.0, 112.0, 199.0, 227.0, 151.0, 77.0, 47.0, 20.0, 13.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.544035911560059, -7.336273193359375, -7.128509998321533, -6.92074728012085, -6.712984085083008, -6.505221366882324, -6.297458648681641, -6.089695453643799, -5.881932735443115, -5.674170017242432, -5.46640682220459, -5.258644104003906, -5.0508809089660645, -4.843118190765381, -4.635354995727539, -4.4275922775268555, -4.219829559326172, -4.012066841125488, -3.8043036460876465, -3.596540927886963, -3.3887779712677, -3.1810150146484375, -2.973252058029175, -2.765489101409912, -2.5577259063720703, -2.3499629497528076, -2.142199993133545, -1.9344371557235718, -1.7266743183135986, -1.518911361694336, -1.3111484050750732, -1.1033855676651, -0.895622730255127, -0.687859833240509, -0.4800969064235687, -0.2723339796066284, -0.0645710825920105, 0.14319181442260742, 0.3509547710418701, 0.5587176084518433, 0.766480565071106, 0.9742434620857239, 1.1820063591003418, 1.3897693157196045, 1.5975322723388672, 1.8052951097488403, 2.0130581855773926, 2.220820903778076, 2.428583860397339, 2.6363468170166016, 2.8441097736358643, 3.051872730255127, 3.2596354484558105, 3.4673984050750732, 3.675161361694336, 3.8829240798950195, 4.090687274932861, 4.298449993133545, 4.506213188171387, 4.71397590637207, 4.921739101409912, 5.129501819610596, 5.3372650146484375, 5.545027732849121, 5.752790451049805]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 2.0, 4.0, 5.0, 11.0, 11.0, 11.0, 13.0, 21.0, 15.0, 21.0, 28.0, 33.0, 26.0, 38.0, 34.0, 41.0, 41.0, 43.0, 41.0, 40.0, 45.0, 37.0, 47.0, 46.0, 56.0, 40.0, 34.0, 24.0, 40.0, 25.0, 14.0, 21.0, 15.0, 19.0, 10.0, 8.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6541683673858643, -2.574930429458618, -2.495692253112793, -2.416454315185547, -2.337216377258301, -2.2579784393310547, -2.1787402629852295, -2.0995023250579834, -2.0202643871307373, -1.9410263299942017, -1.8617883920669556, -1.78255033493042, -1.7033123970031738, -1.6240743398666382, -1.5448362827301025, -1.4655983448028564, -1.3863602876663208, -1.3071222305297852, -1.227884292602539, -1.1486462354660034, -1.0694082975387573, -0.9901702404022217, -0.9109322428703308, -0.8316942453384399, -0.7524562478065491, -0.6732182502746582, -0.5939802527427673, -0.5147422552108765, -0.4355042278766632, -0.35626623034477234, -0.2770282030105591, -0.1977902054786682, -0.11855220794677734, -0.03931420296430588, 0.03992380201816559, 0.11916181445121765, 0.19839981198310852, 0.2776378095149994, 0.35687583684921265, 0.4361138343811035, 0.5153518319129944, 0.5945898294448853, 0.6738278269767761, 0.753065824508667, 0.8323038816452026, 0.9115418195724487, 0.9907798767089844, 1.0700178146362305, 1.1492558717727661, 1.2284939289093018, 1.3077318668365479, 1.3869699239730835, 1.4662078619003296, 1.5454459190368652, 1.6246838569641113, 1.703921914100647, 1.7831599712371826, 1.8623980283737183, 1.9416359663009644, 2.0208740234375, 2.100111961364746, 2.179349899291992, 2.2585880756378174, 2.3378260135650635, 2.4170639514923096]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 21.0, 37.0, 69.0, 134.0, 271.0, 564.0, 1331.0, 3519.0, 10578.0, 38908.0, 212105.0, 610451.0, 130557.0, 27380.0, 7845.0, 2771.0, 1121.0, 443.0, 202.0, 108.0, 53.0, 24.0, 14.0, 11.0, 10.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470947265625, -0.4549140930175781, -0.43888092041015625, -0.4228477478027344, -0.4068145751953125, -0.3907814025878906, -0.37474822998046875, -0.3587150573730469, -0.342681884765625, -0.3266487121582031, -0.31061553955078125, -0.2945823669433594, -0.2785491943359375, -0.2625160217285156, -0.24648284912109375, -0.23044967651367188, -0.21441650390625, -0.19838333129882812, -0.18235015869140625, -0.16631698608398438, -0.1502838134765625, -0.13425064086914062, -0.11821746826171875, -0.10218429565429688, -0.086151123046875, -0.07011795043945312, -0.05408477783203125, -0.038051605224609375, -0.0220184326171875, -0.005985260009765625, 0.01004791259765625, 0.026081085205078125, 0.0421142578125, 0.058147430419921875, 0.07418060302734375, 0.09021377563476562, 0.1062469482421875, 0.12228012084960938, 0.13831329345703125, 0.15434646606445312, 0.170379638671875, 0.18641281127929688, 0.20244598388671875, 0.21847915649414062, 0.2345123291015625, 0.2505455017089844, 0.26657867431640625, 0.2826118469238281, 0.29864501953125, 0.3146781921386719, 0.33071136474609375, 0.3467445373535156, 0.3627777099609375, 0.3788108825683594, 0.39484405517578125, 0.4108772277832031, 0.426910400390625, 0.4429435729980469, 0.45897674560546875, 0.4750099182128906, 0.4910430908203125, 0.5070762634277344, 0.5231094360351562, 0.5391426086425781, 0.55517578125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 3.0, 8.0, 11.0, 13.0, 17.0, 16.0, 16.0, 19.0, 29.0, 17.0, 24.0, 30.0, 26.0, 45.0, 49.0, 45.0, 47.0, 38.0, 60.0, 50.0, 40.0, 49.0, 29.0, 40.0, 35.0, 45.0, 27.0, 26.0, 22.0, 23.0, 23.0, 14.0, 8.0, 19.0, 6.0, 6.0, 4.0, 6.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26123046875, -0.2538776397705078, -0.24652481079101562, -0.23917198181152344, -0.23181915283203125, -0.22446632385253906, -0.21711349487304688, -0.2097606658935547, -0.2024078369140625, -0.1950550079345703, -0.18770217895507812, -0.18034934997558594, -0.17299652099609375, -0.16564369201660156, -0.15829086303710938, -0.1509380340576172, -0.143585205078125, -0.1362323760986328, -0.12887954711914062, -0.12152671813964844, -0.11417388916015625, -0.10682106018066406, -0.09946823120117188, -0.09211540222167969, -0.0847625732421875, -0.07740974426269531, -0.07005691528320312, -0.06270408630371094, -0.05535125732421875, -0.04799842834472656, -0.040645599365234375, -0.03329277038574219, -0.02593994140625, -0.018587112426757812, -0.011234283447265625, -0.0038814544677734375, 0.00347137451171875, 0.010824203491210938, 0.018177032470703125, 0.025529861450195312, 0.0328826904296875, 0.04023551940917969, 0.047588348388671875, 0.05494117736816406, 0.06229400634765625, 0.06964683532714844, 0.07699966430664062, 0.08435249328613281, 0.091705322265625, 0.09905815124511719, 0.10641098022460938, 0.11376380920410156, 0.12111663818359375, 0.12846946716308594, 0.13582229614257812, 0.1431751251220703, 0.1505279541015625, 0.1578807830810547, 0.16523361206054688, 0.17258644104003906, 0.17993927001953125, 0.18729209899902344, 0.19464492797851562, 0.2019977569580078, 0.2093505859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 4.0, 8.0, 7.0, 11.0, 8.0, 22.0, 29.0, 30.0, 48.0, 72.0, 88.0, 125.0, 211.0, 306.0, 506.0, 818.0, 1715.0, 4567.0, 21056.0, 327083.0, 658753.0, 24003.0, 4949.0, 1802.0, 875.0, 457.0, 296.0, 177.0, 144.0, 112.0, 71.0, 49.0, 40.0, 32.0, 21.0, 20.0, 8.0, 14.0, 5.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7880859375, -0.7618484497070312, -0.7356109619140625, -0.7093734741210938, -0.683135986328125, -0.6568984985351562, -0.6306610107421875, -0.6044235229492188, -0.57818603515625, -0.5519485473632812, -0.5257110595703125, -0.49947357177734375, -0.473236083984375, -0.44699859619140625, -0.4207611083984375, -0.39452362060546875, -0.3682861328125, -0.34204864501953125, -0.3158111572265625, -0.28957366943359375, -0.263336181640625, -0.23709869384765625, -0.2108612060546875, -0.18462371826171875, -0.15838623046875, -0.13214874267578125, -0.1059112548828125, -0.07967376708984375, -0.053436279296875, -0.02719879150390625, -0.0009613037109375, 0.02527618408203125, 0.051513671875, 0.07775115966796875, 0.1039886474609375, 0.13022613525390625, 0.156463623046875, 0.18270111083984375, 0.2089385986328125, 0.23517608642578125, 0.26141357421875, 0.28765106201171875, 0.3138885498046875, 0.34012603759765625, 0.366363525390625, 0.39260101318359375, 0.4188385009765625, 0.44507598876953125, 0.4713134765625, 0.49755096435546875, 0.5237884521484375, 0.5500259399414062, 0.576263427734375, 0.6025009155273438, 0.6287384033203125, 0.6549758911132812, 0.68121337890625, 0.7074508666992188, 0.7336883544921875, 0.7599258422851562, 0.786163330078125, 0.8124008178710938, 0.8386383056640625, 0.8648757934570312, 0.89111328125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 10.0, 4.0, 14.0, 13.0, 20.0, 22.0, 15.0, 24.0, 26.0, 55.0, 37.0, 56.0, 55.0, 72.0, 67.0, 68.0, 46.0, 57.0, 57.0, 34.0, 43.0, 39.0, 29.0, 25.0, 22.0, 16.0, 12.0, 8.0, 9.0, 7.0, 8.0, 11.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.2177734375, -1.1834716796875, -1.149169921875, -1.1148681640625, -1.08056640625, -1.0462646484375, -1.011962890625, -0.9776611328125, -0.943359375, -0.9090576171875, -0.874755859375, -0.8404541015625, -0.80615234375, -0.7718505859375, -0.737548828125, -0.7032470703125, -0.6689453125, -0.6346435546875, -0.600341796875, -0.5660400390625, -0.53173828125, -0.4974365234375, -0.463134765625, -0.4288330078125, -0.39453125, -0.3602294921875, -0.325927734375, -0.2916259765625, -0.25732421875, -0.2230224609375, -0.188720703125, -0.1544189453125, -0.1201171875, -0.0858154296875, -0.051513671875, -0.0172119140625, 0.01708984375, 0.0513916015625, 0.085693359375, 0.1199951171875, 0.154296875, 0.1885986328125, 0.222900390625, 0.2572021484375, 0.29150390625, 0.3258056640625, 0.360107421875, 0.3944091796875, 0.4287109375, 0.4630126953125, 0.497314453125, 0.5316162109375, 0.56591796875, 0.6002197265625, 0.634521484375, 0.6688232421875, 0.703125, 0.7374267578125, 0.771728515625, 0.8060302734375, 0.84033203125, 0.8746337890625, 0.908935546875, 0.9432373046875, 0.9775390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 9.0, 11.0, 16.0, 15.0, 19.0, 24.0, 39.0, 49.0, 89.0, 145.0, 237.0, 472.0, 1066.0, 2531.0, 6960.0, 26476.0, 233860.0, 724179.0, 37585.0, 9176.0, 3037.0, 1219.0, 532.0, 298.0, 167.0, 117.0, 69.0, 46.0, 33.0, 24.0, 17.0, 7.0, 5.0, 8.0, 4.0, 1.0, 2.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.279541015625, -0.27025604248046875, -0.2609710693359375, -0.25168609619140625, -0.242401123046875, -0.23311614990234375, -0.2238311767578125, -0.21454620361328125, -0.20526123046875, -0.19597625732421875, -0.1866912841796875, -0.17740631103515625, -0.168121337890625, -0.15883636474609375, -0.1495513916015625, -0.14026641845703125, -0.1309814453125, -0.12169647216796875, -0.1124114990234375, -0.10312652587890625, -0.093841552734375, -0.08455657958984375, -0.0752716064453125, -0.06598663330078125, -0.05670166015625, -0.04741668701171875, -0.0381317138671875, -0.02884674072265625, -0.019561767578125, -0.01027679443359375, -0.0009918212890625, 0.00829315185546875, 0.017578125, 0.02686309814453125, 0.0361480712890625, 0.04543304443359375, 0.054718017578125, 0.06400299072265625, 0.0732879638671875, 0.08257293701171875, 0.09185791015625, 0.10114288330078125, 0.1104278564453125, 0.11971282958984375, 0.128997802734375, 0.13828277587890625, 0.1475677490234375, 0.15685272216796875, 0.1661376953125, 0.17542266845703125, 0.1847076416015625, 0.19399261474609375, 0.203277587890625, 0.21256256103515625, 0.2218475341796875, 0.23113250732421875, 0.24041748046875, 0.24970245361328125, 0.2589874267578125, 0.26827239990234375, 0.277557373046875, 0.28684234619140625, 0.2961273193359375, 0.30541229248046875, 0.314697265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 2.0, 10.0, 15.0, 8.0, 17.0, 14.0, 26.0, 44.0, 49.0, 75.0, 144.0, 184.0, 122.0, 79.0, 47.0, 33.0, 21.0, 19.0, 17.0, 14.0, 11.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.314847946166992e-05, -8.073262870311737e-05, -7.831677794456482e-05, -7.590092718601227e-05, -7.348507642745972e-05, -7.106922566890717e-05, -6.865337491035461e-05, -6.623752415180206e-05, -6.382167339324951e-05, -6.140582263469696e-05, -5.898997187614441e-05, -5.657412111759186e-05, -5.415827035903931e-05, -5.1742419600486755e-05, -4.9326568841934204e-05, -4.691071808338165e-05, -4.44948673248291e-05, -4.207901656627655e-05, -3.9663165807724e-05, -3.724731504917145e-05, -3.4831464290618896e-05, -3.2415613532066345e-05, -2.9999762773513794e-05, -2.7583912014961243e-05, -2.516806125640869e-05, -2.275221049785614e-05, -2.033635973930359e-05, -1.7920508980751038e-05, -1.5504658222198486e-05, -1.3088807463645935e-05, -1.0672956705093384e-05, -8.257105946540833e-06, -5.841255187988281e-06, -3.42540442943573e-06, -1.0095536708831787e-06, 1.4062970876693726e-06, 3.822147846221924e-06, 6.237998604774475e-06, 8.653849363327026e-06, 1.1069700121879578e-05, 1.3485550880432129e-05, 1.590140163898468e-05, 1.831725239753723e-05, 2.0733103156089783e-05, 2.3148953914642334e-05, 2.5564804673194885e-05, 2.7980655431747437e-05, 3.0396506190299988e-05, 3.281235694885254e-05, 3.522820770740509e-05, 3.764405846595764e-05, 4.005990922451019e-05, 4.2475759983062744e-05, 4.4891610741615295e-05, 4.730746150016785e-05, 4.97233122587204e-05, 5.213916301727295e-05, 5.45550137758255e-05, 5.697086453437805e-05, 5.93867152929306e-05, 6.180256605148315e-05, 6.42184168100357e-05, 6.663426756858826e-05, 6.905011832714081e-05, 7.146596908569336e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 7.0, 4.0, 16.0, 16.0, 22.0, 15.0, 33.0, 47.0, 92.0, 160.0, 317.0, 584.0, 1374.0, 3859.0, 16413.0, 142565.0, 826703.0, 44530.0, 7648.0, 2212.0, 876.0, 433.0, 226.0, 143.0, 92.0, 47.0, 42.0, 23.0, 13.0, 9.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.37841796875, -0.3676872253417969, -0.35695648193359375, -0.3462257385253906, -0.3354949951171875, -0.3247642517089844, -0.31403350830078125, -0.3033027648925781, -0.292572021484375, -0.2818412780761719, -0.27111053466796875, -0.2603797912597656, -0.2496490478515625, -0.23891830444335938, -0.22818756103515625, -0.21745681762695312, -0.20672607421875, -0.19599533081054688, -0.18526458740234375, -0.17453384399414062, -0.1638031005859375, -0.15307235717773438, -0.14234161376953125, -0.13161087036132812, -0.120880126953125, -0.11014938354492188, -0.09941864013671875, -0.08868789672851562, -0.0779571533203125, -0.06722640991210938, -0.05649566650390625, -0.045764923095703125, -0.0350341796875, -0.024303436279296875, -0.01357269287109375, -0.002841949462890625, 0.0078887939453125, 0.018619537353515625, 0.02935028076171875, 0.040081024169921875, 0.050811767578125, 0.061542510986328125, 0.07227325439453125, 0.08300399780273438, 0.0937347412109375, 0.10446548461914062, 0.11519622802734375, 0.12592697143554688, 0.13665771484375, 0.14738845825195312, 0.15811920166015625, 0.16884994506835938, 0.1795806884765625, 0.19031143188476562, 0.20104217529296875, 0.21177291870117188, 0.222503662109375, 0.23323440551757812, 0.24396514892578125, 0.2546958923339844, 0.2654266357421875, 0.2761573791503906, 0.28688812255859375, 0.2976188659667969, 0.308349609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 13.0, 7.0, 14.0, 22.0, 26.0, 27.0, 45.0, 62.0, 80.0, 106.0, 156.0, 121.0, 79.0, 60.0, 28.0, 31.0, 31.0, 9.0, 15.0, 12.0, 9.0, 2.0, 7.0, 5.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2313232421875, -0.22324180603027344, -0.21516036987304688, -0.2070789337158203, -0.19899749755859375, -0.1909160614013672, -0.18283462524414062, -0.17475318908691406, -0.1666717529296875, -0.15859031677246094, -0.15050888061523438, -0.1424274444580078, -0.13434600830078125, -0.1262645721435547, -0.11818313598632812, -0.11010169982910156, -0.102020263671875, -0.09393882751464844, -0.08585739135742188, -0.07777595520019531, -0.06969451904296875, -0.06161308288574219, -0.053531646728515625, -0.04545021057128906, -0.0373687744140625, -0.029287338256835938, -0.021205902099609375, -0.013124465942382812, -0.00504302978515625, 0.0030384063720703125, 0.011119842529296875, 0.019201278686523438, 0.02728271484375, 0.03536415100097656, 0.043445587158203125, 0.05152702331542969, 0.05960845947265625, 0.06768989562988281, 0.07577133178710938, 0.08385276794433594, 0.0919342041015625, 0.10001564025878906, 0.10809707641601562, 0.11617851257324219, 0.12425994873046875, 0.1323413848876953, 0.14042282104492188, 0.14850425720214844, 0.156585693359375, 0.16466712951660156, 0.17274856567382812, 0.1808300018310547, 0.18891143798828125, 0.1969928741455078, 0.20507431030273438, 0.21315574645996094, 0.2212371826171875, 0.22931861877441406, 0.23740005493164062, 0.2454814910888672, 0.25356292724609375, 0.2616443634033203, 0.2697257995605469, 0.27780723571777344, 0.285888671875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 17.0, 44.0, 180.0, 497.0, 162.0, 53.0, 26.0, 4.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.823816299438477, -10.490530967712402, -10.157246589660645, -9.82396125793457, -9.490676879882812, -9.157391548156738, -8.82410717010498, -8.490821838378906, -8.157537460327148, -7.824252605438232, -7.490967750549316, -7.1576828956604, -6.824398040771484, -6.49111270904541, -6.157827854156494, -5.824542999267578, -5.491257667541504, -5.157972812652588, -4.824687957763672, -4.491403102874756, -4.15811824798584, -3.8248331546783447, -3.4915480613708496, -3.1582632064819336, -2.8249783515930176, -2.4916934967041016, -2.1584086418151855, -1.8251235485076904, -1.4918386936187744, -1.1585538387298584, -0.8252688646316528, -0.49198389053344727, -0.15869998931884766, 0.17458492517471313, 0.5078698396682739, 0.8411547541618347, 1.1744396686553955, 1.5077245235443115, 1.841009497642517, 2.1742944717407227, 2.5075793266296387, 2.8408641815185547, 3.1741490364074707, 3.507434129714966, 3.840718984603882, 4.174003601074219, 4.507288932800293, 4.840573787689209, 5.173858642578125, 5.507143497467041, 5.840428352355957, 6.173713207244873, 6.506998062133789, 6.840283393859863, 7.173568248748779, 7.506853103637695, 7.840137958526611, 8.173422813415527, 8.506708145141602, 8.83999252319336, 9.173277854919434, 9.506562232971191, 9.839847564697266, 10.173131942749023, 10.506417274475098]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 3.0, 8.0, 9.0, 12.0, 15.0, 16.0, 17.0, 19.0, 24.0, 21.0, 38.0, 38.0, 35.0, 41.0, 56.0, 113.0, 177.0, 74.0, 43.0, 35.0, 30.0, 38.0, 24.0, 20.0, 20.0, 13.0, 11.0, 5.0, 10.0, 13.0, 3.0, 3.0, 0.0, 5.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.095769882202148, -4.942098140716553, -4.788426399230957, -4.6347551345825195, -4.481083393096924, -4.327411651611328, -4.173740386962891, -4.020068645477295, -3.866396903991699, -3.7127251625061035, -3.559053659439087, -3.4053821563720703, -3.2517104148864746, -3.098038673400879, -2.9443671703338623, -2.7906956672668457, -2.63702392578125, -2.4833521842956543, -2.3296806812286377, -2.176009178161621, -2.0223374366760254, -1.8686658143997192, -1.714994192123413, -1.561322569847107, -1.4076509475708008, -1.2539793252944946, -1.1003077030181885, -0.9466360807418823, -0.7929644584655762, -0.63929283618927, -0.48562121391296387, -0.3319495916366577, -0.17827749252319336, -0.024605870246887207, 0.12906575202941895, 0.2827373743057251, 0.43640899658203125, 0.5900806188583374, 0.7437522411346436, 0.8974238634109497, 1.0510954856872559, 1.204767107963562, 1.3584387302398682, 1.5121103525161743, 1.6657819747924805, 1.8194535970687866, 1.9731252193450928, 2.1267967224121094, 2.280468463897705, 2.434140205383301, 2.5878117084503174, 2.741483211517334, 2.8951549530029297, 3.0488266944885254, 3.202498197555542, 3.3561697006225586, 3.5098414421081543, 3.66351318359375, 3.8171846866607666, 3.970856189727783, 4.124527931213379, 4.278199672698975, 4.43187141418457, 4.585542678833008, 4.7392144203186035]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 5.0, 11.0, 6.0, 5.0, 16.0, 20.0, 25.0, 42.0, 56.0, 86.0, 177.0, 302.0, 606.0, 1296.0, 3063.0, 8143.0, 30412.0, 241956.0, 2146053.0, 1578612.0, 149106.0, 22588.0, 6818.0, 2642.0, 1123.0, 516.0, 279.0, 120.0, 83.0, 48.0, 11.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.765625, -0.7469062805175781, -0.7281875610351562, -0.7094688415527344, -0.6907501220703125, -0.6720314025878906, -0.6533126831054688, -0.6345939636230469, -0.615875244140625, -0.5971565246582031, -0.5784378051757812, -0.5597190856933594, -0.5410003662109375, -0.5222816467285156, -0.5035629272460938, -0.4848442077636719, -0.46612548828125, -0.4474067687988281, -0.42868804931640625, -0.4099693298339844, -0.3912506103515625, -0.3725318908691406, -0.35381317138671875, -0.3350944519042969, -0.316375732421875, -0.2976570129394531, -0.27893829345703125, -0.2602195739746094, -0.2415008544921875, -0.22278213500976562, -0.20406341552734375, -0.18534469604492188, -0.1666259765625, -0.14790725708007812, -0.12918853759765625, -0.11046981811523438, -0.0917510986328125, -0.07303237915039062, -0.05431365966796875, -0.035594940185546875, -0.016876220703125, 0.001842498779296875, 0.02056121826171875, 0.039279937744140625, 0.0579986572265625, 0.07671737670898438, 0.09543609619140625, 0.11415481567382812, 0.13287353515625, 0.15159225463867188, 0.17031097412109375, 0.18902969360351562, 0.2077484130859375, 0.22646713256835938, 0.24518585205078125, 0.2639045715332031, 0.282623291015625, 0.3013420104980469, 0.32006072998046875, 0.3387794494628906, 0.3574981689453125, 0.3762168884277344, 0.39493560791015625, 0.4136543273925781, 0.432373046875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 2.0, 4.0, 8.0, 6.0, 17.0, 16.0, 18.0, 19.0, 17.0, 14.0, 27.0, 35.0, 36.0, 33.0, 27.0, 30.0, 34.0, 50.0, 45.0, 45.0, 54.0, 32.0, 48.0, 35.0, 45.0, 38.0, 33.0, 37.0, 27.0, 27.0, 22.0, 18.0, 21.0, 20.0, 8.0, 9.0, 7.0, 5.0, 5.0, 4.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.230224609375, -0.22306442260742188, -0.21590423583984375, -0.20874404907226562, -0.2015838623046875, -0.19442367553710938, -0.18726348876953125, -0.18010330200195312, -0.172943115234375, -0.16578292846679688, -0.15862274169921875, -0.15146255493164062, -0.1443023681640625, -0.13714218139648438, -0.12998199462890625, -0.12282180786132812, -0.11566162109375, -0.10850143432617188, -0.10134124755859375, -0.09418106079101562, -0.0870208740234375, -0.07986068725585938, -0.07270050048828125, -0.06554031372070312, -0.058380126953125, -0.051219940185546875, -0.04405975341796875, -0.036899566650390625, -0.0297393798828125, -0.022579193115234375, -0.01541900634765625, -0.008258819580078125, -0.0010986328125, 0.006061553955078125, 0.01322174072265625, 0.020381927490234375, 0.0275421142578125, 0.034702301025390625, 0.04186248779296875, 0.049022674560546875, 0.056182861328125, 0.06334304809570312, 0.07050323486328125, 0.07766342163085938, 0.0848236083984375, 0.09198379516601562, 0.09914398193359375, 0.10630416870117188, 0.11346435546875, 0.12062454223632812, 0.12778472900390625, 0.13494491577148438, 0.1421051025390625, 0.14926528930664062, 0.15642547607421875, 0.16358566284179688, 0.170745849609375, 0.17790603637695312, 0.18506622314453125, 0.19222640991210938, 0.1993865966796875, 0.20654678344726562, 0.21370697021484375, 0.22086715698242188, 0.22802734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 10.0, 13.0, 23.0, 104.0, 373.0, 1605.0, 103175.0, 4085393.0, 2795.0, 567.0, 136.0, 48.0, 21.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.87200927734375, -3.6971435546875, -3.52227783203125, -3.347412109375, -3.17254638671875, -2.9976806640625, -2.82281494140625, -2.64794921875, -2.47308349609375, -2.2982177734375, -2.12335205078125, -1.948486328125, -1.77362060546875, -1.5987548828125, -1.42388916015625, -1.2490234375, -1.07415771484375, -0.8992919921875, -0.72442626953125, -0.549560546875, -0.37469482421875, -0.1998291015625, -0.02496337890625, 0.14990234375, 0.32476806640625, 0.4996337890625, 0.67449951171875, 0.849365234375, 1.02423095703125, 1.1990966796875, 1.37396240234375, 1.548828125, 1.72369384765625, 1.8985595703125, 2.07342529296875, 2.248291015625, 2.42315673828125, 2.5980224609375, 2.77288818359375, 2.94775390625, 3.12261962890625, 3.2974853515625, 3.47235107421875, 3.647216796875, 3.82208251953125, 3.9969482421875, 4.17181396484375, 4.3466796875, 4.52154541015625, 4.6964111328125, 4.87127685546875, 5.046142578125, 5.22100830078125, 5.3958740234375, 5.57073974609375, 5.74560546875, 5.92047119140625, 6.0953369140625, 6.27020263671875, 6.445068359375, 6.61993408203125, 6.7947998046875, 6.96966552734375, 7.14453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 8.0, 17.0, 47.0, 96.0, 224.0, 533.0, 1148.0, 1142.0, 517.0, 204.0, 66.0, 39.0, 23.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.615234375, -1.550689697265625, -1.48614501953125, -1.421600341796875, -1.3570556640625, -1.292510986328125, -1.22796630859375, -1.163421630859375, -1.098876953125, -1.034332275390625, -0.96978759765625, -0.905242919921875, -0.8406982421875, -0.776153564453125, -0.71160888671875, -0.647064208984375, -0.58251953125, -0.517974853515625, -0.45343017578125, -0.388885498046875, -0.3243408203125, -0.259796142578125, -0.19525146484375, -0.130706787109375, -0.066162109375, -0.001617431640625, 0.06292724609375, 0.127471923828125, 0.1920166015625, 0.256561279296875, 0.32110595703125, 0.385650634765625, 0.4501953125, 0.514739990234375, 0.57928466796875, 0.643829345703125, 0.7083740234375, 0.772918701171875, 0.83746337890625, 0.902008056640625, 0.966552734375, 1.031097412109375, 1.09564208984375, 1.160186767578125, 1.2247314453125, 1.289276123046875, 1.35382080078125, 1.418365478515625, 1.48291015625, 1.547454833984375, 1.61199951171875, 1.676544189453125, 1.7410888671875, 1.805633544921875, 1.87017822265625, 1.934722900390625, 1.999267578125, 2.063812255859375, 2.12835693359375, 2.192901611328125, 2.2574462890625, 2.321990966796875, 2.38653564453125, 2.451080322265625, 2.515625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 1.0, 4.0, 12.0, 14.0, 24.0, 45.0, 89.0, 128.0, 177.0, 192.0, 125.0, 79.0, 40.0, 22.0, 11.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.73093318939209, -10.38422966003418, -10.03752613067627, -9.69082260131836, -9.34411907196045, -8.997415542602539, -8.650711059570312, -8.304008483886719, -7.95730447769165, -7.61060094833374, -7.26389741897583, -6.917193412780762, -6.570489883422852, -6.223786354064941, -5.877082824707031, -5.530379295349121, -5.183675765991211, -4.836972236633301, -4.490268707275391, -4.1435651779174805, -3.796861410140991, -3.450157880783081, -3.103454113006592, -2.7567505836486816, -2.4100470542907715, -2.0633435249328613, -1.7166398763656616, -1.369936227798462, -1.0232326984405518, -0.6765291690826416, -0.32982540130615234, 0.016878128051757812, 0.36358165740966797, 0.7102852463722229, 1.0569888353347778, 1.4036924839019775, 1.7503960132598877, 2.097099542617798, 2.443803310394287, 2.7905068397521973, 3.1372103691101074, 3.4839138984680176, 3.8306174278259277, 4.177321434020996, 4.524024963378906, 4.870728492736816, 5.217432022094727, 5.564135551452637, 5.910839080810547, 6.257542610168457, 6.604246139526367, 6.950949668884277, 7.2976531982421875, 7.644356727600098, 7.991060733795166, 8.337764739990234, 8.684467315673828, 9.031170845031738, 9.377874374389648, 9.724577903747559, 10.071281433105469, 10.417984962463379, 10.764688491821289, 11.111392974853516, 11.458096504211426]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 6.0, 17.0, 28.0, 30.0, 25.0, 52.0, 61.0, 62.0, 66.0, 65.0, 89.0, 71.0, 74.0, 66.0, 36.0, 56.0, 40.0, 31.0, 32.0, 24.0, 10.0, 15.0, 10.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.474026203155518, -6.26028299331665, -6.046539783477783, -5.832796096801758, -5.619052886962891, -5.405309677124023, -5.191566467285156, -4.977823257446289, -4.764080047607422, -4.550336837768555, -4.3365936279296875, -4.12285041809082, -3.909106731414795, -3.6953635215759277, -3.4816203117370605, -3.2678771018981934, -3.054133415222168, -2.840390205383301, -2.6266467571258545, -2.4129035472869873, -2.199160099029541, -1.9854168891906738, -1.7716736793518066, -1.55793035030365, -1.3441870212554932, -1.1304436922073364, -0.9167004227638245, -0.7029571533203125, -0.48921382427215576, -0.275470495223999, -0.061727285385131836, 0.1520160436630249, 0.36575889587402344, 0.5795022249221802, 0.7932454943656921, 1.006988763809204, 1.2207320928573608, 1.4344754219055176, 1.6482186317443848, 1.8619619607925415, 2.0757052898406982, 2.2894484996795654, 2.5031919479370117, 2.716935157775879, 2.930678367614746, 3.1444218158721924, 3.3581650257110596, 3.571908473968506, 3.785651683807373, 3.9993948936462402, 4.213138103485107, 4.426881790161133, 4.640625, 4.854368209838867, 5.068111419677734, 5.281854629516602, 5.495597839355469, 5.709341049194336, 5.923084259033203, 6.13682746887207, 6.350571155548096, 6.564314365386963, 6.77805757522583, 6.991800785064697, 7.205544471740723]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 11.0, 12.0, 23.0, 29.0, 37.0, 59.0, 102.0, 201.0, 334.0, 627.0, 1492.0, 4141.0, 15381.0, 99059.0, 794539.0, 109193.0, 16011.0, 4194.0, 1586.0, 688.0, 349.0, 182.0, 104.0, 64.0, 56.0, 24.0, 16.0, 9.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.779296875, -0.7579574584960938, -0.7366180419921875, -0.7152786254882812, -0.693939208984375, -0.6725997924804688, -0.6512603759765625, -0.6299209594726562, -0.60858154296875, -0.5872421264648438, -0.5659027099609375, -0.5445632934570312, -0.523223876953125, -0.5018844604492188, -0.4805450439453125, -0.45920562744140625, -0.4378662109375, -0.41652679443359375, -0.3951873779296875, -0.37384796142578125, -0.352508544921875, -0.33116912841796875, -0.3098297119140625, -0.28849029541015625, -0.26715087890625, -0.24581146240234375, -0.2244720458984375, -0.20313262939453125, -0.181793212890625, -0.16045379638671875, -0.1391143798828125, -0.11777496337890625, -0.096435546875, -0.07509613037109375, -0.0537567138671875, -0.03241729736328125, -0.011077880859375, 0.01026153564453125, 0.0316009521484375, 0.05294036865234375, 0.07427978515625, 0.09561920166015625, 0.1169586181640625, 0.13829803466796875, 0.159637451171875, 0.18097686767578125, 0.2023162841796875, 0.22365570068359375, 0.2449951171875, 0.26633453369140625, 0.2876739501953125, 0.30901336669921875, 0.330352783203125, 0.35169219970703125, 0.3730316162109375, 0.39437103271484375, 0.41571044921875, 0.43704986572265625, 0.4583892822265625, 0.47972869873046875, 0.501068115234375, 0.5224075317382812, 0.5437469482421875, 0.5650863647460938, 0.58642578125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 12.0, 9.0, 20.0, 24.0, 41.0, 36.0, 46.0, 54.0, 61.0, 61.0, 82.0, 85.0, 66.0, 88.0, 73.0, 56.0, 42.0, 39.0, 32.0, 15.0, 24.0, 7.0, 10.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37744140625, -0.362060546875, -0.3466796875, -0.331298828125, -0.31591796875, -0.300537109375, -0.28515625, -0.269775390625, -0.25439453125, -0.239013671875, -0.2236328125, -0.208251953125, -0.19287109375, -0.177490234375, -0.162109375, -0.146728515625, -0.13134765625, -0.115966796875, -0.1005859375, -0.085205078125, -0.06982421875, -0.054443359375, -0.0390625, -0.023681640625, -0.00830078125, 0.007080078125, 0.0224609375, 0.037841796875, 0.05322265625, 0.068603515625, 0.083984375, 0.099365234375, 0.11474609375, 0.130126953125, 0.1455078125, 0.160888671875, 0.17626953125, 0.191650390625, 0.20703125, 0.222412109375, 0.23779296875, 0.253173828125, 0.2685546875, 0.283935546875, 0.29931640625, 0.314697265625, 0.330078125, 0.345458984375, 0.36083984375, 0.376220703125, 0.3916015625, 0.406982421875, 0.42236328125, 0.437744140625, 0.453125, 0.468505859375, 0.48388671875, 0.499267578125, 0.5146484375, 0.530029296875, 0.54541015625, 0.560791015625, 0.576171875, 0.591552734375, 0.60693359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 11.0, 8.0, 8.0, 24.0, 21.0, 35.0, 36.0, 57.0, 71.0, 100.0, 147.0, 242.0, 401.0, 792.0, 2143.0, 9373.0, 93451.0, 896385.0, 37252.0, 5005.0, 1457.0, 612.0, 314.0, 193.0, 139.0, 65.0, 58.0, 44.0, 33.0, 16.0, 13.0, 11.0, 7.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6953125, -0.6750564575195312, -0.6548004150390625, -0.6345443725585938, -0.614288330078125, -0.5940322875976562, -0.5737762451171875, -0.5535202026367188, -0.53326416015625, -0.5130081176757812, -0.4927520751953125, -0.47249603271484375, -0.452239990234375, -0.43198394775390625, -0.4117279052734375, -0.39147186279296875, -0.3712158203125, -0.35095977783203125, -0.3307037353515625, -0.31044769287109375, -0.290191650390625, -0.26993560791015625, -0.2496795654296875, -0.22942352294921875, -0.20916748046875, -0.18891143798828125, -0.1686553955078125, -0.14839935302734375, -0.128143310546875, -0.10788726806640625, -0.0876312255859375, -0.06737518310546875, -0.047119140625, -0.02686309814453125, -0.0066070556640625, 0.01364898681640625, 0.033905029296875, 0.05416107177734375, 0.0744171142578125, 0.09467315673828125, 0.11492919921875, 0.13518524169921875, 0.1554412841796875, 0.17569732666015625, 0.195953369140625, 0.21620941162109375, 0.2364654541015625, 0.25672149658203125, 0.2769775390625, 0.29723358154296875, 0.3174896240234375, 0.33774566650390625, 0.358001708984375, 0.37825775146484375, 0.3985137939453125, 0.41876983642578125, 0.43902587890625, 0.45928192138671875, 0.4795379638671875, 0.49979400634765625, 0.520050048828125, 0.5403060913085938, 0.5605621337890625, 0.5808181762695312, 0.60107421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 9.0, 5.0, 5.0, 8.0, 4.0, 21.0, 14.0, 7.0, 25.0, 31.0, 28.0, 27.0, 44.0, 55.0, 66.0, 83.0, 74.0, 94.0, 72.0, 62.0, 51.0, 46.0, 36.0, 28.0, 27.0, 16.0, 19.0, 8.0, 7.0, 8.0, 10.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5966796875, -1.5522308349609375, -1.507781982421875, -1.4633331298828125, -1.41888427734375, -1.3744354248046875, -1.329986572265625, -1.2855377197265625, -1.2410888671875, -1.1966400146484375, -1.152191162109375, -1.1077423095703125, -1.06329345703125, -1.0188446044921875, -0.974395751953125, -0.9299468994140625, -0.885498046875, -0.8410491943359375, -0.796600341796875, -0.7521514892578125, -0.70770263671875, -0.6632537841796875, -0.618804931640625, -0.5743560791015625, -0.5299072265625, -0.4854583740234375, -0.441009521484375, -0.3965606689453125, -0.35211181640625, -0.3076629638671875, -0.263214111328125, -0.2187652587890625, -0.17431640625, -0.1298675537109375, -0.085418701171875, -0.0409698486328125, 0.00347900390625, 0.0479278564453125, 0.092376708984375, 0.1368255615234375, 0.1812744140625, 0.2257232666015625, 0.270172119140625, 0.3146209716796875, 0.35906982421875, 0.4035186767578125, 0.447967529296875, 0.4924163818359375, 0.536865234375, 0.5813140869140625, 0.625762939453125, 0.6702117919921875, 0.71466064453125, 0.7591094970703125, 0.803558349609375, 0.8480072021484375, 0.8924560546875, 0.9369049072265625, 0.981353759765625, 1.0258026123046875, 1.07025146484375, 1.1147003173828125, 1.159149169921875, 1.2035980224609375, 1.248046875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 10.0, 7.0, 5.0, 17.0, 18.0, 28.0, 35.0, 50.0, 71.0, 121.0, 229.0, 405.0, 811.0, 1950.0, 6048.0, 29070.0, 862139.0, 126801.0, 14180.0, 3741.0, 1337.0, 628.0, 325.0, 173.0, 93.0, 60.0, 48.0, 35.0, 19.0, 22.0, 17.0, 10.0, 8.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.142822265625, -0.1387176513671875, -0.134613037109375, -0.1305084228515625, -0.12640380859375, -0.1222991943359375, -0.118194580078125, -0.1140899658203125, -0.1099853515625, -0.1058807373046875, -0.101776123046875, -0.0976715087890625, -0.09356689453125, -0.0894622802734375, -0.085357666015625, -0.0812530517578125, -0.0771484375, -0.0730438232421875, -0.068939208984375, -0.0648345947265625, -0.06072998046875, -0.0566253662109375, -0.052520751953125, -0.0484161376953125, -0.0443115234375, -0.0402069091796875, -0.036102294921875, -0.0319976806640625, -0.02789306640625, -0.0237884521484375, -0.019683837890625, -0.0155792236328125, -0.011474609375, -0.0073699951171875, -0.003265380859375, 0.0008392333984375, 0.00494384765625, 0.0090484619140625, 0.013153076171875, 0.0172576904296875, 0.0213623046875, 0.0254669189453125, 0.029571533203125, 0.0336761474609375, 0.03778076171875, 0.0418853759765625, 0.045989990234375, 0.0500946044921875, 0.05419921875, 0.0583038330078125, 0.062408447265625, 0.0665130615234375, 0.07061767578125, 0.0747222900390625, 0.078826904296875, 0.0829315185546875, 0.0870361328125, 0.0911407470703125, 0.095245361328125, 0.0993499755859375, 0.10345458984375, 0.1075592041015625, 0.111663818359375, 0.1157684326171875, 0.119873046875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 14.0, 24.0, 45.0, 91.0, 179.0, 275.0, 174.0, 106.0, 48.0, 18.0, 13.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.178285598754883e-05, -3.892090171575546e-05, -3.60589474439621e-05, -3.319699317216873e-05, -3.0335038900375366e-05, -2.7473084628582e-05, -2.4611130356788635e-05, -2.174917608499527e-05, -1.8887221813201904e-05, -1.602526754140854e-05, -1.3163313269615173e-05, -1.0301358997821808e-05, -7.439404726028442e-06, -4.577450454235077e-06, -1.7154961824417114e-06, 1.146458089351654e-06, 4.0084123611450195e-06, 6.870366632938385e-06, 9.73232090473175e-06, 1.2594275176525116e-05, 1.545622944831848e-05, 1.8318183720111847e-05, 2.1180137991905212e-05, 2.4042092263698578e-05, 2.6904046535491943e-05, 2.976600080728531e-05, 3.2627955079078674e-05, 3.548990935087204e-05, 3.8351863622665405e-05, 4.121381789445877e-05, 4.4075772166252136e-05, 4.69377264380455e-05, 4.979968070983887e-05, 5.266163498163223e-05, 5.55235892534256e-05, 5.8385543525218964e-05, 6.124749779701233e-05, 6.41094520688057e-05, 6.697140634059906e-05, 6.983336061239243e-05, 7.269531488418579e-05, 7.555726915597916e-05, 7.841922342777252e-05, 8.128117769956589e-05, 8.414313197135925e-05, 8.700508624315262e-05, 8.986704051494598e-05, 9.272899478673935e-05, 9.559094905853271e-05, 9.845290333032608e-05, 0.00010131485760211945, 0.00010417681187391281, 0.00010703876614570618, 0.00010990072041749954, 0.00011276267468929291, 0.00011562462896108627, 0.00011848658323287964, 0.000121348537504673, 0.00012421049177646637, 0.00012707244604825974, 0.0001299344003200531, 0.00013279635459184647, 0.00013565830886363983, 0.0001385202631354332, 0.00014138221740722656]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 1.0, 3.0, 8.0, 6.0, 13.0, 13.0, 15.0, 28.0, 38.0, 63.0, 90.0, 121.0, 230.0, 338.0, 705.0, 1290.0, 2827.0, 7297.0, 23321.0, 161935.0, 793488.0, 39142.0, 10112.0, 3797.0, 1615.0, 862.0, 477.0, 237.0, 166.0, 99.0, 67.0, 42.0, 29.0, 20.0, 24.0, 13.0, 2.0, 2.0, 9.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0960693359375, -0.09253311157226562, -0.08899688720703125, -0.08546066284179688, -0.0819244384765625, -0.07838821411132812, -0.07485198974609375, -0.07131576538085938, -0.067779541015625, -0.06424331665039062, -0.06070709228515625, -0.057170867919921875, -0.0536346435546875, -0.050098419189453125, -0.04656219482421875, -0.043025970458984375, -0.03948974609375, -0.035953521728515625, -0.03241729736328125, -0.028881072998046875, -0.0253448486328125, -0.021808624267578125, -0.01827239990234375, -0.014736175537109375, -0.011199951171875, -0.007663726806640625, -0.00412750244140625, -0.000591278076171875, 0.0029449462890625, 0.006481170654296875, 0.01001739501953125, 0.013553619384765625, 0.01708984375, 0.020626068115234375, 0.02416229248046875, 0.027698516845703125, 0.0312347412109375, 0.034770965576171875, 0.03830718994140625, 0.041843414306640625, 0.045379638671875, 0.048915863037109375, 0.05245208740234375, 0.055988311767578125, 0.0595245361328125, 0.06306076049804688, 0.06659698486328125, 0.07013320922851562, 0.07366943359375, 0.07720565795898438, 0.08074188232421875, 0.08427810668945312, 0.0878143310546875, 0.09135055541992188, 0.09488677978515625, 0.09842300415039062, 0.101959228515625, 0.10549545288085938, 0.10903167724609375, 0.11256790161132812, 0.1161041259765625, 0.11964035034179688, 0.12317657470703125, 0.12671279907226562, 0.1302490234375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 13.0, 15.0, 28.0, 19.0, 32.0, 47.0, 74.0, 118.0, 184.0, 147.0, 88.0, 47.0, 37.0, 19.0, 16.0, 12.0, 12.0, 17.0, 12.0, 9.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1466064453125, -0.1421222686767578, -0.13763809204101562, -0.13315391540527344, -0.12866973876953125, -0.12418556213378906, -0.11970138549804688, -0.11521720886230469, -0.1107330322265625, -0.10624885559082031, -0.10176467895507812, -0.09728050231933594, -0.09279632568359375, -0.08831214904785156, -0.08382797241210938, -0.07934379577636719, -0.074859619140625, -0.07037544250488281, -0.06589126586914062, -0.06140708923339844, -0.05692291259765625, -0.05243873596191406, -0.047954559326171875, -0.04347038269042969, -0.0389862060546875, -0.03450202941894531, -0.030017852783203125, -0.025533676147460938, -0.02104949951171875, -0.016565322875976562, -0.012081146240234375, -0.0075969696044921875, -0.00311279296875, 0.0013713836669921875, 0.005855560302734375, 0.010339736938476562, 0.01482391357421875, 0.019308090209960938, 0.023792266845703125, 0.028276443481445312, 0.0327606201171875, 0.03724479675292969, 0.041728973388671875, 0.04621315002441406, 0.05069732666015625, 0.05518150329589844, 0.059665679931640625, 0.06414985656738281, 0.068634033203125, 0.07311820983886719, 0.07760238647460938, 0.08208656311035156, 0.08657073974609375, 0.09105491638183594, 0.09553909301757812, 0.10002326965332031, 0.1045074462890625, 0.10899162292480469, 0.11347579956054688, 0.11795997619628906, 0.12244415283203125, 0.12692832946777344, 0.13141250610351562, 0.1358966827392578, 0.140380859375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 36.0, 99.0, 637.0, 140.0, 45.0, 20.0, 9.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.766404151916504, -6.4799113273620605, -6.193418502807617, -5.906926155090332, -5.620433330535889, -5.333940505981445, -5.04744815826416, -4.760955333709717, -4.474462509155273, -4.18796968460083, -3.901477098464966, -3.6149845123291016, -3.328491687774658, -3.041998863220215, -2.7555062770843506, -2.4690136909484863, -2.182520866394043, -1.8960281610488892, -1.6095354557037354, -1.3230427503585815, -1.0365500450134277, -0.7500573396682739, -0.4635646343231201, -0.17707204818725586, 0.1094207763671875, 0.3959134817123413, 0.6824061870574951, 0.9688988924026489, 1.2553915977478027, 1.5418843030929565, 1.8283770084381104, 2.1148695945739746, 2.4013633728027344, 2.6878561973571777, 2.974348783493042, 3.2608413696289062, 3.5473341941833496, 3.833827018737793, 4.120319366455078, 4.4068121910095215, 4.693305015563965, 4.979797840118408, 5.266290664672852, 5.552783012390137, 5.83927583694458, 6.125768661499023, 6.412261009216309, 6.698753833770752, 6.985246658325195, 7.271739482879639, 7.558232307434082, 7.844724655151367, 8.131217956542969, 8.417710304260254, 8.704202651977539, 8.99069595336914, 9.277188301086426, 9.563680648803711, 9.850173950195312, 10.136666297912598, 10.423158645629883, 10.709651947021484, 10.99614429473877, 11.282636642456055, 11.569129943847656]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 5.0, 8.0, 8.0, 4.0, 6.0, 10.0, 11.0, 13.0, 20.0, 16.0, 13.0, 17.0, 20.0, 27.0, 18.0, 48.0, 193.0, 262.0, 49.0, 29.0, 29.0, 18.0, 24.0, 22.0, 15.0, 11.0, 18.0, 10.0, 10.0, 11.0, 10.0, 5.0, 7.0, 7.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9586586952209473, -2.8534674644470215, -2.748276472091675, -2.643085241317749, -2.5378942489624023, -2.4327030181884766, -2.327511787414551, -2.222320795059204, -2.1171298027038574, -2.0119385719299316, -1.906747579574585, -1.8015563488006592, -1.6963653564453125, -1.5911741256713867, -1.4859830141067505, -1.3807919025421143, -1.2756006717681885, -1.1704095602035522, -1.065218448638916, -0.960027277469635, -0.8548361659049988, -0.7496450543403625, -0.6444538831710815, -0.5392627716064453, -0.4340716600418091, -0.32888054847717285, -0.22368940711021423, -0.11849826574325562, -0.013307154178619385, 0.09188395738601685, 0.19707512855529785, 0.3022662401199341, 0.4074571132659912, 0.5126482248306274, 0.6178393363952637, 0.7230305075645447, 0.8282216191291809, 0.9334127306938171, 1.0386039018630981, 1.1437950134277344, 1.2489861249923706, 1.3541772365570068, 1.459368348121643, 1.5645594596862793, 1.669750690460205, 1.7749416828155518, 1.8801329135894775, 1.9853240251541138, 2.09051513671875, 2.195706367492676, 2.3008973598480225, 2.4060885906219482, 2.511279582977295, 2.6164708137512207, 2.7216620445251465, 2.826853036880493, 2.93204402923584, 3.0372352600097656, 3.1424262523651123, 3.247617483139038, 3.3528084754943848, 3.4579997062683105, 3.5631909370422363, 3.668381929397583, 3.773573160171509]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 0.0, 6.0, 0.0, 6.0, 5.0, 11.0, 9.0, 21.0, 21.0, 17.0, 18.0, 32.0, 27.0, 37.0, 45.0, 80.0, 222.0, 151.0, 52.0, 36.0, 40.0, 29.0, 22.0, 23.0, 17.0, 15.0, 7.0, 9.0, 9.0, 12.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349609375, -0.33789825439453125, -0.3261871337890625, -0.31447601318359375, -0.302764892578125, -0.29105377197265625, -0.2793426513671875, -0.26763153076171875, -0.25592041015625, -0.24420928955078125, -0.2324981689453125, -0.22078704833984375, -0.209075927734375, -0.19736480712890625, -0.1856536865234375, -0.17394256591796875, -0.1622314453125, -0.15052032470703125, -0.1388092041015625, -0.12709808349609375, -0.115386962890625, -0.10367584228515625, -0.0919647216796875, -0.08025360107421875, -0.06854248046875, -0.05683135986328125, -0.0451202392578125, -0.03340911865234375, -0.021697998046875, -0.00998687744140625, 0.0017242431640625, 0.01343536376953125, 0.025146484375, 0.03685760498046875, 0.0485687255859375, 0.06027984619140625, 0.071990966796875, 0.08370208740234375, 0.0954132080078125, 0.10712432861328125, 0.11883544921875, 0.13054656982421875, 0.1422576904296875, 0.15396881103515625, 0.165679931640625, 0.17739105224609375, 0.1891021728515625, 0.20081329345703125, 0.2125244140625, 0.22423553466796875, 0.2359466552734375, 0.24765777587890625, 0.259368896484375, 0.27108001708984375, 0.2827911376953125, 0.29450225830078125, 0.30621337890625, 0.31792449951171875, 0.3296356201171875, 0.34134674072265625, 0.353057861328125, 0.36476898193359375, 0.3764801025390625, 0.38819122314453125, 0.39990234375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 1.0, 6.0, 1.0, 3.0, 5.0, 6.0, 14.0, 12.0, 9.0, 22.0, 37.0, 64.0, 96.0, 167.0, 318.0, 904.0, 4174.0, 600653.0, 7775854.0, 4553.0, 948.0, 310.0, 167.0, 88.0, 51.0, 22.0, 18.0, 10.0, 22.0, 11.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-4.084884166717529, -3.9531877040863037, -3.821491241455078, -3.6897947788238525, -3.558098316192627, -3.4264016151428223, -3.2947051525115967, -3.163008689880371, -3.0313122272491455, -2.89961576461792, -2.7679193019866943, -2.6362228393554688, -2.504526138305664, -2.3728299140930176, -2.241133213043213, -2.1094367504119873, -1.9777402877807617, -1.8460438251495361, -1.7143473625183105, -1.5826507806777954, -1.4509543180465698, -1.3192578554153442, -1.187561273574829, -1.0558648109436035, -0.9241683483123779, -0.7924718856811523, -0.660775363445282, -0.5290788412094116, -0.39738237857818604, -0.26568591594696045, -0.1339893937110901, -0.0022928714752197266, 0.12940311431884766, 0.26109960675239563, 0.3927960991859436, 0.524492621421814, 0.6561890840530396, 0.7878855466842651, 0.9195820689201355, 1.0512785911560059, 1.1829750537872314, 1.314671516418457, 1.4463679790496826, 1.5780645608901978, 1.7097610235214233, 1.841457486152649, 1.973154067993164, 2.1048505306243896, 2.2365469932556152, 2.368243455886841, 2.4999399185180664, 2.631636381149292, 2.7633328437805176, 2.8950295448303223, 3.026726007461548, 3.1584224700927734, 3.290118932723999, 3.4218153953552246, 3.55351185798645, 3.685208320617676, 3.8169050216674805, 3.948601245880127, 4.080297946929932, 4.211994171142578, 4.343690872192383]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 1.0, 7.0, 8.0, 6.0, 3.0, 7.0, 11.0, 9.0, 4.0, 7.0, 7.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.042754173278809, -11.751832008361816, -11.460909843444824, -11.169987678527832, -10.87906551361084, -10.588143348693848, -10.297221183776855, -10.006299018859863, -9.715376853942871, -9.424454689025879, -9.133532524108887, -8.842610359191895, -8.551688194274902, -8.26076602935791, -7.969843864440918, -7.678921699523926, -7.388000011444092, -7.0970778465271, -6.806155681610107, -6.515233516693115, -6.224311351776123, -5.933389186859131, -5.642467498779297, -5.351545333862305, -5.0606231689453125, -4.76970100402832, -4.478778839111328, -4.187856674194336, -3.8969345092773438, -3.6060123443603516, -3.3150904178619385, -3.0241682529449463, -2.733245849609375, -2.442323684692383, -2.1514015197753906, -1.860479474067688, -1.5695573091506958, -1.2786351442337036, -0.987713098526001, -0.6967909336090088, -0.4058687686920166, -0.1149466335773468, 0.175975501537323, 0.4668976068496704, 0.7578197717666626, 1.0487419366836548, 1.3396639823913574, 1.6305861473083496, 1.9215083122253418, 2.212430477142334, 2.503352642059326, 2.7942748069763184, 3.0851969718933105, 3.3761191368103027, 3.667041063308716, 3.957963228225708, 4.248885154724121, 4.539807319641113, 4.8307294845581055, 5.121651649475098, 5.41257381439209, 5.703495979309082, 5.994418144226074, 6.285340309143066, 6.576262474060059]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 12.0, 14.0, 12.0, 20.0, 28.0, 47.0, 37.0, 54.0, 59.0, 68.0, 76.0, 82.0, 83.0, 86.0, 50.0, 42.0, 46.0, 43.0, 23.0, 28.0, 16.0, 21.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1212158203125, -0.11676216125488281, -0.11230850219726562, -0.10785484313964844, -0.10340118408203125, -0.09894752502441406, -0.09449386596679688, -0.09004020690917969, -0.0855865478515625, -0.08113288879394531, -0.07667922973632812, -0.07222557067871094, -0.06777191162109375, -0.06331825256347656, -0.058864593505859375, -0.05441093444824219, -0.049957275390625, -0.04550361633300781, -0.041049957275390625, -0.03659629821777344, -0.03214263916015625, -0.027688980102539062, -0.023235321044921875, -0.018781661987304688, -0.0143280029296875, -0.009874343872070312, -0.005420684814453125, -0.0009670257568359375, 0.00348663330078125, 0.007940292358398438, 0.012393951416015625, 0.016847610473632812, 0.02130126953125, 0.025754928588867188, 0.030208587646484375, 0.03466224670410156, 0.03911590576171875, 0.04356956481933594, 0.048023223876953125, 0.05247688293457031, 0.0569305419921875, 0.06138420104980469, 0.06583786010742188, 0.07029151916503906, 0.07474517822265625, 0.07919883728027344, 0.08365249633789062, 0.08810615539550781, 0.092559814453125, 0.09701347351074219, 0.10146713256835938, 0.10592079162597656, 0.11037445068359375, 0.11482810974121094, 0.11928176879882812, 0.12373542785644531, 0.1281890869140625, 0.1326427459716797, 0.13709640502929688, 0.14155006408691406, 0.14600372314453125, 0.15045738220214844, 0.15491104125976562, 0.1593647003173828, 0.163818359375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 7.0, 4.0, 2.0, 3.0, 9.0, 11.0, 8.0, 15.0, 14.0, 23.0, 28.0, 38.0, 53.0, 79.0, 133.0, 177.0, 214.0, 379.0, 572.0, 950.0, 1869.0, 3750.0, 8920.0, 23148.0, 66482.0, 179237.0, 151626.0, 52832.0, 18823.0, 7460.0, 3314.0, 1578.0, 885.0, 534.0, 325.0, 223.0, 130.0, 96.0, 76.0, 73.0, 51.0, 28.0, 16.0, 20.0, 9.0, 14.0, 11.0, 6.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.16015625, -2.087890625, -2.015625, -1.943359375, -1.87109375, -1.798828125, -1.7265625, -1.654296875, -1.58203125, -1.509765625, -1.4375, -1.365234375, -1.29296875, -1.220703125, -1.1484375, -1.076171875, -1.00390625, -0.931640625, -0.859375, -0.787109375, -0.71484375, -0.642578125, -0.5703125, -0.498046875, -0.42578125, -0.353515625, -0.28125, -0.208984375, -0.13671875, -0.064453125, 0.0078125, 0.080078125, 0.15234375, 0.224609375, 0.296875, 0.369140625, 0.44140625, 0.513671875, 0.5859375, 0.658203125, 0.73046875, 0.802734375, 0.875, 0.947265625, 1.01953125, 1.091796875, 1.1640625, 1.236328125, 1.30859375, 1.380859375, 1.453125, 1.525390625, 1.59765625, 1.669921875, 1.7421875, 1.814453125, 1.88671875, 1.958984375, 2.03125, 2.103515625, 2.17578125, 2.248046875, 2.3203125, 2.392578125, 2.46484375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 10.0, 11.0, 18.0, 43.0, 39.0, 45.0, 53.0, 61.0, 82.0, 82.0, 71.0, 81.0, 77.0, 67.0, 56.0, 35.0, 34.0, 42.0, 21.0, 11.0, 18.0, 9.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.469482421875, -0.4540596008300781, -0.43863677978515625, -0.4232139587402344, -0.4077911376953125, -0.3923683166503906, -0.37694549560546875, -0.3615226745605469, -0.346099853515625, -0.3306770324707031, -0.31525421142578125, -0.2998313903808594, -0.2844085693359375, -0.2689857482910156, -0.25356292724609375, -0.23814010620117188, -0.22271728515625, -0.20729446411132812, -0.19187164306640625, -0.17644882202148438, -0.1610260009765625, -0.14560317993164062, -0.13018035888671875, -0.11475753784179688, -0.099334716796875, -0.08391189575195312, -0.06848907470703125, -0.053066253662109375, -0.0376434326171875, -0.022220611572265625, -0.00679779052734375, 0.008625030517578125, 0.0240478515625, 0.039470672607421875, 0.05489349365234375, 0.07031631469726562, 0.0857391357421875, 0.10116195678710938, 0.11658477783203125, 0.13200759887695312, 0.147430419921875, 0.16285324096679688, 0.17827606201171875, 0.19369888305664062, 0.2091217041015625, 0.22454452514648438, 0.23996734619140625, 0.2553901672363281, 0.27081298828125, 0.2862358093261719, 0.30165863037109375, 0.3170814514160156, 0.3325042724609375, 0.3479270935058594, 0.36334991455078125, 0.3787727355957031, 0.394195556640625, 0.4096183776855469, 0.42504119873046875, 0.4404640197753906, 0.4558868408203125, 0.4713096618652344, 0.48673248291015625, 0.5021553039550781, 0.517578125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 7.0, 6.0, 25.0, 60.0, 125.0, 146.0, 59.0, 27.0, 15.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.931406021118164, -7.75246524810791, -7.573524475097656, -7.394583702087402, -7.215642929077148, -7.0367021560668945, -6.857761383056641, -6.678821086883545, -6.499880313873291, -6.320939540863037, -6.141998767852783, -5.963057994842529, -5.784117221832275, -5.60517692565918, -5.426236152648926, -5.247295379638672, -5.068354606628418, -4.889413833618164, -4.71047306060791, -4.531532287597656, -4.352591514587402, -4.173650741577148, -3.9947102069854736, -3.815769672393799, -3.6368284225463867, -3.457887649536133, -3.278946876525879, -3.100006103515625, -2.92106556892395, -2.7421247959136963, -2.5631840229034424, -2.3842434883117676, -2.2053024768829346, -2.0263617038726807, -1.8474210500717163, -1.6684802770614624, -1.489539623260498, -1.3105988502502441, -1.1316580772399902, -0.9527174234390259, -0.773776650428772, -0.5948359370231628, -0.4158951938152313, -0.2369544506072998, -0.058013737201690674, 0.12092697620391846, 0.29986774921417236, 0.4788084030151367, 0.6577491760253906, 0.8366898894309998, 1.0156306028366089, 1.1945713758468628, 1.3735120296478271, 1.552452802658081, 1.731393575668335, 1.9103342294692993, 2.0892748832702637, 2.2682156562805176, 2.4471564292907715, 2.6260972023010254, 2.8050377368927, 2.983978509902954, 3.162919282913208, 3.341859817504883, 3.520800828933716]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 9.0, 13.0, 16.0, 44.0, 85.0, 95.0, 98.0, 43.0, 20.0, 13.0, 10.0, 8.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.223564624786377, -4.117173194885254, -4.010781764984131, -3.904390573501587, -3.797999382019043, -3.69160795211792, -3.585216522216797, -3.478825330734253, -3.372434139251709, -3.266042709350586, -3.159651517868042, -3.053260087966919, -2.946868896484375, -2.840477466583252, -2.734086036682129, -2.627694845199585, -2.521303415298462, -2.414911985397339, -2.308520793914795, -2.202129364013672, -2.095738172531128, -1.9893467426300049, -1.8829554319381714, -1.776564121246338, -1.6701728105545044, -1.563781499862671, -1.4573901891708374, -1.350998878479004, -1.2446074485778809, -1.138216257095337, -1.0318248271942139, -0.9254335165023804, -0.8190422058105469, -0.7126508951187134, -0.6062595844268799, -0.4998682141304016, -0.3934769034385681, -0.2870855927467346, -0.18069422245025635, -0.07430291175842285, 0.032088398933410645, 0.13847972452640533, 0.24487105011940002, 0.3512623906135559, 0.4576537013053894, 0.5640450119972229, 0.6704363822937012, 0.7768276929855347, 0.8832190036773682, 0.9896103143692017, 1.0960016250610352, 1.2023930549621582, 1.3087842464447021, 1.4151756763458252, 1.5215669870376587, 1.6279582977294922, 1.7343496084213257, 1.8407409191131592, 1.9471322298049927, 2.053523540496826, 2.159914970397949, 2.266306161880493, 2.372697591781616, 2.47908878326416, 2.585480213165283]}, "eval/loss": 4.259941577911377, "eval/wer": 1.0190995636652123, "eval/runtime": 524.0014, "eval/samples_per_second": 5.042, "eval/steps_per_second": 0.632} \ No newline at end of file +{"train/loss": 3.1966, "train/learning_rate": 6.936416184971099e-08, "train/epoch": 10.0, "train/global_step": 2230, "_runtime": 51677, "_timestamp": 1648466626, "_step": 2234, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 33.0, 227.0, 474.0, 239.0, 34.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.604528427124023, -28.090166091918945, -27.5758056640625, -27.061443328857422, -26.547080993652344, -26.032718658447266, -25.51835823059082, -25.003995895385742, -24.489635467529297, -23.97527313232422, -23.460912704467773, -22.946550369262695, -22.432188034057617, -21.917827606201172, -21.403465270996094, -20.889102935791016, -20.374740600585938, -19.86037826538086, -19.346017837524414, -18.831655502319336, -18.317293167114258, -17.802932739257812, -17.288570404052734, -16.774208068847656, -16.259845733642578, -15.745484352111816, -15.231122016906738, -14.716760635375977, -14.202398300170898, -13.688036918640137, -13.173675537109375, -12.659313201904297, -12.144952774047852, -11.63059139251709, -11.116229057312012, -10.60186767578125, -10.087505340576172, -9.57314395904541, -9.058782577514648, -8.54442024230957, -8.030058860778809, -7.515697002410889, -7.001335144042969, -6.486973762512207, -5.972611904144287, -5.458250045776367, -4.9438886642456055, -4.4295268058776855, -3.9151649475097656, -3.4008030891418457, -2.886441469192505, -2.372079849243164, -1.8577179908752441, -1.3433561325073242, -0.8289945125579834, -0.3146328926086426, 0.19972896575927734, 0.7140907049179077, 1.228452444076538, 1.7428141832351685, 2.257175922393799, 2.7715377807617188, 3.2858994007110596, 3.8002610206604004, 4.31462287902832]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 7.0, 4.0, 4.0, 8.0, 11.0, 8.0, 13.0, 21.0, 14.0, 16.0, 24.0, 34.0, 26.0, 30.0, 44.0, 41.0, 35.0, 39.0, 53.0, 39.0, 48.0, 48.0, 44.0, 47.0, 39.0, 35.0, 40.0, 35.0, 23.0, 26.0, 31.0, 17.0, 17.0, 15.0, 10.0, 17.0, 13.0, 11.0, 4.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1261658668518066, -3.028174877166748, -2.9301838874816895, -2.83219313621521, -2.7342021465301514, -2.6362111568450928, -2.5382204055786133, -2.4402294158935547, -2.342238426208496, -2.2442474365234375, -2.146256446838379, -2.0482656955718994, -1.9502747058868408, -1.8522837162017822, -1.7542928457260132, -1.6563019752502441, -1.5583109855651855, -1.460319995880127, -1.362329125404358, -1.2643382549285889, -1.1663472652435303, -1.0683562755584717, -0.9703654050827026, -0.8723744750022888, -0.774383544921875, -0.6763926148414612, -0.5784016847610474, -0.48041075468063354, -0.3824198246002197, -0.2844288945198059, -0.1864379644393921, -0.08844703435897827, 0.009543895721435547, 0.10753482580184937, 0.20552575588226318, 0.303516685962677, 0.4015076160430908, 0.49949854612350464, 0.5974894762039185, 0.6954804062843323, 0.7934713363647461, 0.8914622664451599, 0.9894531965255737, 1.0874440670013428, 1.1854350566864014, 1.28342604637146, 1.381416916847229, 1.479407787322998, 1.5773987770080566, 1.6753897666931152, 1.7733806371688843, 1.8713715076446533, 1.969362497329712, 2.0673534870147705, 2.16534423828125, 2.2633352279663086, 2.361326217651367, 2.459317207336426, 2.5573081970214844, 2.655298948287964, 2.7532899379730225, 2.851280927658081, 2.9492716789245605, 3.047262668609619, 3.1452536582946777]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 10.0, 12.0, 12.0, 32.0, 44.0, 80.0, 118.0, 210.0, 327.0, 586.0, 1276.0, 2408.0, 4794.0, 10173.0, 21924.0, 49846.0, 117445.0, 270224.0, 570534.0, 958582.0, 1007810.0, 632998.0, 306153.0, 131826.0, 57542.0, 25910.0, 11827.0, 5585.0, 2770.0, 1463.0, 742.0, 401.0, 227.0, 137.0, 90.0, 56.0, 28.0, 25.0, 20.0, 3.0, 6.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.155609130859375, -4.02996826171875, -3.904327392578125, -3.7786865234375, -3.653045654296875, -3.52740478515625, -3.401763916015625, -3.276123046875, -3.150482177734375, -3.02484130859375, -2.899200439453125, -2.7735595703125, -2.647918701171875, -2.52227783203125, -2.396636962890625, -2.27099609375, -2.145355224609375, -2.01971435546875, -1.894073486328125, -1.7684326171875, -1.642791748046875, -1.51715087890625, -1.391510009765625, -1.265869140625, -1.140228271484375, -1.01458740234375, -0.888946533203125, -0.7633056640625, -0.637664794921875, -0.51202392578125, -0.386383056640625, -0.2607421875, -0.135101318359375, -0.00946044921875, 0.116180419921875, 0.2418212890625, 0.367462158203125, 0.49310302734375, 0.618743896484375, 0.744384765625, 0.870025634765625, 0.99566650390625, 1.121307373046875, 1.2469482421875, 1.372589111328125, 1.49822998046875, 1.623870849609375, 1.74951171875, 1.875152587890625, 2.00079345703125, 2.126434326171875, 2.2520751953125, 2.377716064453125, 2.50335693359375, 2.628997802734375, 2.754638671875, 2.880279541015625, 3.00592041015625, 3.131561279296875, 3.2572021484375, 3.382843017578125, 3.50848388671875, 3.634124755859375, 3.759765625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 6.0, 11.0, 8.0, 12.0, 16.0, 19.0, 18.0, 23.0, 25.0, 26.0, 42.0, 29.0, 36.0, 32.0, 51.0, 45.0, 51.0, 48.0, 38.0, 46.0, 45.0, 45.0, 29.0, 35.0, 40.0, 27.0, 22.0, 25.0, 28.0, 21.0, 26.0, 18.0, 8.0, 7.0, 8.0, 7.0, 4.0, 1.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.27734375, -5.12713623046875, -4.9769287109375, -4.82672119140625, -4.676513671875, -4.52630615234375, -4.3760986328125, -4.22589111328125, -4.07568359375, -3.92547607421875, -3.7752685546875, -3.62506103515625, -3.474853515625, -3.32464599609375, -3.1744384765625, -3.02423095703125, -2.8740234375, -2.72381591796875, -2.5736083984375, -2.42340087890625, -2.273193359375, -2.12298583984375, -1.9727783203125, -1.82257080078125, -1.67236328125, -1.52215576171875, -1.3719482421875, -1.22174072265625, -1.071533203125, -0.92132568359375, -0.7711181640625, -0.62091064453125, -0.470703125, -0.32049560546875, -0.1702880859375, -0.02008056640625, 0.130126953125, 0.28033447265625, 0.4305419921875, 0.58074951171875, 0.73095703125, 0.88116455078125, 1.0313720703125, 1.18157958984375, 1.331787109375, 1.48199462890625, 1.6322021484375, 1.78240966796875, 1.9326171875, 2.08282470703125, 2.2330322265625, 2.38323974609375, 2.533447265625, 2.68365478515625, 2.8338623046875, 2.98406982421875, 3.13427734375, 3.28448486328125, 3.4346923828125, 3.58489990234375, 3.735107421875, 3.88531494140625, 4.0355224609375, 4.18572998046875, 4.3359375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 7.0, 13.0, 30.0, 62.0, 130.0, 320.0, 1114.0, 4176674.0, 14854.0, 689.0, 205.0, 87.0, 51.0, 8.0, 8.0, 8.0, 10.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.5625, -95.3837890625, -91.205078125, -87.0263671875, -82.84765625, -78.6689453125, -74.490234375, -70.3115234375, -66.1328125, -61.9541015625, -57.775390625, -53.5966796875, -49.41796875, -45.2392578125, -41.060546875, -36.8818359375, -32.703125, -28.5244140625, -24.345703125, -20.1669921875, -15.98828125, -11.8095703125, -7.630859375, -3.4521484375, 0.7265625, 4.9052734375, 9.083984375, 13.2626953125, 17.44140625, 21.6201171875, 25.798828125, 29.9775390625, 34.15625, 38.3349609375, 42.513671875, 46.6923828125, 50.87109375, 55.0498046875, 59.228515625, 63.4072265625, 67.5859375, 71.7646484375, 75.943359375, 80.1220703125, 84.30078125, 88.4794921875, 92.658203125, 96.8369140625, 101.015625, 105.1943359375, 109.373046875, 113.5517578125, 117.73046875, 121.9091796875, 126.087890625, 130.2666015625, 134.4453125, 138.6240234375, 142.802734375, 146.9814453125, 151.16015625, 155.3388671875, 159.517578125, 163.6962890625, 167.875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 2.0, 12.0, 24.0, 41.0, 52.0, 100.0, 194.0, 348.0, 645.0, 1004.0, 724.0, 432.0, 225.0, 117.0, 61.0, 36.0, 16.0, 17.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.916168212890625, -2.78741455078125, -2.658660888671875, -2.5299072265625, -2.401153564453125, -2.27239990234375, -2.143646240234375, -2.014892578125, -1.886138916015625, -1.75738525390625, -1.628631591796875, -1.4998779296875, -1.371124267578125, -1.24237060546875, -1.113616943359375, -0.98486328125, -0.856109619140625, -0.72735595703125, -0.598602294921875, -0.4698486328125, -0.341094970703125, -0.21234130859375, -0.083587646484375, 0.045166015625, 0.173919677734375, 0.30267333984375, 0.431427001953125, 0.5601806640625, 0.688934326171875, 0.81768798828125, 0.946441650390625, 1.0751953125, 1.203948974609375, 1.33270263671875, 1.461456298828125, 1.5902099609375, 1.718963623046875, 1.84771728515625, 1.976470947265625, 2.105224609375, 2.233978271484375, 2.36273193359375, 2.491485595703125, 2.6202392578125, 2.748992919921875, 2.87774658203125, 3.006500244140625, 3.13525390625, 3.264007568359375, 3.39276123046875, 3.521514892578125, 3.6502685546875, 3.779022216796875, 3.90777587890625, 4.036529541015625, 4.165283203125, 4.294036865234375, 4.42279052734375, 4.551544189453125, 4.6802978515625, 4.809051513671875, 4.93780517578125, 5.066558837890625, 5.1953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 7.0, 8.0, 10.0, 15.0, 25.0, 17.0, 29.0, 39.0, 32.0, 33.0, 59.0, 55.0, 59.0, 63.0, 53.0, 67.0, 59.0, 48.0, 57.0, 49.0, 42.0, 36.0, 29.0, 15.0, 20.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.272556781768799, -3.123746156692505, -2.974935531616211, -2.826124906539917, -2.677314281463623, -2.528503656387329, -2.379693031311035, -2.230882167816162, -2.0820717811584473, -1.9332611560821533, -1.7844505310058594, -1.6356399059295654, -1.4868292808532715, -1.3380186557769775, -1.189207911491394, -1.0403972864151, -0.8915865421295166, -0.7427759170532227, -0.5939652919769287, -0.44515460729599, -0.29634398221969604, -0.1475333571434021, 0.001277327537536621, 0.15008795261383057, 0.2988985776901245, 0.44770920276641846, 0.5965198278427124, 0.7453305125236511, 0.8941411375999451, 1.0429518222808838, 1.1917624473571777, 1.3405730724334717, 1.4893836975097656, 1.6381943225860596, 1.7870049476623535, 1.9358155727386475, 2.0846261978149414, 2.2334368228912354, 2.3822474479675293, 2.5310583114624023, 2.679868698120117, 2.828679323196411, 2.977489948272705, 3.126300573348999, 3.275111198425293, 3.423921823501587, 3.572732448577881, 3.721543312072754, 3.870353937149048, 4.019164562225342, 4.167975425720215, 4.31678581237793, 4.465596675872803, 4.614407062530518, 4.763217926025391, 4.9120283126831055, 5.0608391761779785, 5.209650039672852, 5.358460426330566, 5.5072712898254395, 5.656081676483154, 5.804892539978027, 5.953702926635742, 6.102513790130615, 6.25132417678833]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 6.0, 8.0, 9.0, 5.0, 14.0, 13.0, 19.0, 23.0, 26.0, 36.0, 36.0, 42.0, 36.0, 46.0, 46.0, 44.0, 41.0, 59.0, 40.0, 45.0, 37.0, 39.0, 42.0, 43.0, 39.0, 35.0, 24.0, 21.0, 23.0, 22.0, 12.0, 18.0, 13.0, 8.0, 6.0, 3.0, 4.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.665203094482422, -4.525174140930176, -4.385145664215088, -4.245116710662842, -4.105088233947754, -3.965059280395508, -3.825030565261841, -3.685001850128174, -3.544973134994507, -3.40494441986084, -3.264915704727173, -3.124886989593506, -2.9848580360412598, -2.844829559326172, -2.704800605773926, -2.564771890640259, -2.424743175506592, -2.284714460372925, -2.144685745239258, -2.004657030105591, -1.8646281957626343, -1.7245994806289673, -1.5845706462860107, -1.4445419311523438, -1.3045132160186768, -1.1644845008850098, -1.0244557857513428, -0.8844269514083862, -0.7443982362747192, -0.6043695211410522, -0.4643407464027405, -0.3243119716644287, -0.18428325653076172, -0.04425451159477234, 0.09577423334121704, 0.23580297827720642, 0.3758317232131958, 0.5158604383468628, 0.6558892130851746, 0.7959179878234863, 0.9359467029571533, 1.0759754180908203, 1.2160041332244873, 1.3560329675674438, 1.4960616827011108, 1.6360903978347778, 1.7761192321777344, 1.9161479473114014, 2.0561766624450684, 2.1962053775787354, 2.3362340927124023, 2.4762628078460693, 2.6162915229797363, 2.7563204765319824, 2.8963491916656494, 3.0363779067993164, 3.1764066219329834, 3.3164353370666504, 3.4564640522003174, 3.5964927673339844, 3.7365217208862305, 3.8765501976013184, 4.0165791511535645, 4.156607627868652, 4.296636581420898]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 2.0, 7.0, 10.0, 7.0, 8.0, 17.0, 25.0, 27.0, 46.0, 62.0, 81.0, 131.0, 145.0, 247.0, 430.0, 634.0, 1360.0, 3100.0, 9875.0, 41461.0, 175962.0, 424715.0, 286755.0, 77005.0, 17523.0, 4816.0, 1783.0, 836.0, 498.0, 317.0, 228.0, 138.0, 93.0, 56.0, 32.0, 33.0, 24.0, 22.0, 14.0, 14.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1181640625, -1.084991455078125, -1.05181884765625, -1.018646240234375, -0.9854736328125, -0.952301025390625, -0.91912841796875, -0.885955810546875, -0.852783203125, -0.819610595703125, -0.78643798828125, -0.753265380859375, -0.7200927734375, -0.686920166015625, -0.65374755859375, -0.620574951171875, -0.58740234375, -0.554229736328125, -0.52105712890625, -0.487884521484375, -0.4547119140625, -0.421539306640625, -0.38836669921875, -0.355194091796875, -0.322021484375, -0.288848876953125, -0.25567626953125, -0.222503662109375, -0.1893310546875, -0.156158447265625, -0.12298583984375, -0.089813232421875, -0.056640625, -0.023468017578125, 0.00970458984375, 0.042877197265625, 0.0760498046875, 0.109222412109375, 0.14239501953125, 0.175567626953125, 0.208740234375, 0.241912841796875, 0.27508544921875, 0.308258056640625, 0.3414306640625, 0.374603271484375, 0.40777587890625, 0.440948486328125, 0.47412109375, 0.507293701171875, 0.54046630859375, 0.573638916015625, 0.6068115234375, 0.639984130859375, 0.67315673828125, 0.706329345703125, 0.739501953125, 0.772674560546875, 0.80584716796875, 0.839019775390625, 0.8721923828125, 0.905364990234375, 0.93853759765625, 0.971710205078125, 1.0048828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 11.0, 9.0, 11.0, 21.0, 20.0, 21.0, 38.0, 35.0, 38.0, 28.0, 44.0, 49.0, 61.0, 43.0, 53.0, 47.0, 53.0, 45.0, 40.0, 33.0, 48.0, 33.0, 30.0, 39.0, 24.0, 19.0, 19.0, 12.0, 15.0, 9.0, 9.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.654296875, -3.533233642578125, -3.41217041015625, -3.291107177734375, -3.1700439453125, -3.048980712890625, -2.92791748046875, -2.806854248046875, -2.685791015625, -2.564727783203125, -2.44366455078125, -2.322601318359375, -2.2015380859375, -2.080474853515625, -1.95941162109375, -1.838348388671875, -1.71728515625, -1.596221923828125, -1.47515869140625, -1.354095458984375, -1.2330322265625, -1.111968994140625, -0.99090576171875, -0.869842529296875, -0.748779296875, -0.627716064453125, -0.50665283203125, -0.385589599609375, -0.2645263671875, -0.143463134765625, -0.02239990234375, 0.098663330078125, 0.2197265625, 0.340789794921875, 0.46185302734375, 0.582916259765625, 0.7039794921875, 0.825042724609375, 0.94610595703125, 1.067169189453125, 1.188232421875, 1.309295654296875, 1.43035888671875, 1.551422119140625, 1.6724853515625, 1.793548583984375, 1.91461181640625, 2.035675048828125, 2.15673828125, 2.277801513671875, 2.39886474609375, 2.519927978515625, 2.6409912109375, 2.762054443359375, 2.88311767578125, 3.004180908203125, 3.125244140625, 3.246307373046875, 3.36737060546875, 3.488433837890625, 3.6094970703125, 3.730560302734375, 3.85162353515625, 3.972686767578125, 4.09375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 16.0, 11.0, 25.0, 38.0, 65.0, 111.0, 171.0, 347.0, 583.0, 1132.0, 2019.0, 3709.0, 6841.0, 12575.0, 22487.0, 38292.0, 62771.0, 96458.0, 133815.0, 161359.0, 156514.0, 125992.0, 88283.0, 56578.0, 34106.0, 19589.0, 11019.0, 6239.0, 3336.0, 1792.0, 981.0, 544.0, 308.0, 187.0, 91.0, 65.0, 27.0, 25.0, 13.0, 11.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.302490234375, -0.2930030822753906, -0.28351593017578125, -0.2740287780761719, -0.2645416259765625, -0.2550544738769531, -0.24556732177734375, -0.23608016967773438, -0.226593017578125, -0.21710586547851562, -0.20761871337890625, -0.19813156127929688, -0.1886444091796875, -0.17915725708007812, -0.16967010498046875, -0.16018295288085938, -0.15069580078125, -0.14120864868164062, -0.13172149658203125, -0.12223434448242188, -0.1127471923828125, -0.10326004028320312, -0.09377288818359375, -0.08428573608398438, -0.074798583984375, -0.06531143188476562, -0.05582427978515625, -0.046337127685546875, -0.0368499755859375, -0.027362823486328125, -0.01787567138671875, -0.008388519287109375, 0.0010986328125, 0.010585784912109375, 0.02007293701171875, 0.029560089111328125, 0.0390472412109375, 0.048534393310546875, 0.05802154541015625, 0.06750869750976562, 0.076995849609375, 0.08648300170898438, 0.09597015380859375, 0.10545730590820312, 0.1149444580078125, 0.12443161010742188, 0.13391876220703125, 0.14340591430664062, 0.15289306640625, 0.16238021850585938, 0.17186737060546875, 0.18135452270507812, 0.1908416748046875, 0.20032882690429688, 0.20981597900390625, 0.21930313110351562, 0.228790283203125, 0.23827743530273438, 0.24776458740234375, 0.2572517395019531, 0.2667388916015625, 0.2762260437011719, 0.28571319580078125, 0.2952003479003906, 0.3046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 1.0, 6.0, 11.0, 14.0, 6.0, 13.0, 14.0, 13.0, 16.0, 37.0, 30.0, 30.0, 25.0, 29.0, 32.0, 43.0, 44.0, 34.0, 45.0, 37.0, 48.0, 43.0, 37.0, 34.0, 40.0, 23.0, 41.0, 31.0, 27.0, 27.0, 25.0, 26.0, 20.0, 11.0, 12.0, 17.0, 13.0, 7.0, 8.0, 6.0, 5.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.26171875, -6.0599365234375, -5.858154296875, -5.6563720703125, -5.45458984375, -5.2528076171875, -5.051025390625, -4.8492431640625, -4.6474609375, -4.4456787109375, -4.243896484375, -4.0421142578125, -3.84033203125, -3.6385498046875, -3.436767578125, -3.2349853515625, -3.033203125, -2.8314208984375, -2.629638671875, -2.4278564453125, -2.22607421875, -2.0242919921875, -1.822509765625, -1.6207275390625, -1.4189453125, -1.2171630859375, -1.015380859375, -0.8135986328125, -0.61181640625, -0.4100341796875, -0.208251953125, -0.0064697265625, 0.1953125, 0.3970947265625, 0.598876953125, 0.8006591796875, 1.00244140625, 1.2042236328125, 1.406005859375, 1.6077880859375, 1.8095703125, 2.0113525390625, 2.213134765625, 2.4149169921875, 2.61669921875, 2.8184814453125, 3.020263671875, 3.2220458984375, 3.423828125, 3.6256103515625, 3.827392578125, 4.0291748046875, 4.23095703125, 4.4327392578125, 4.634521484375, 4.8363037109375, 5.0380859375, 5.2398681640625, 5.441650390625, 5.6434326171875, 5.84521484375, 6.0469970703125, 6.248779296875, 6.4505615234375, 6.65234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 10.0, 17.0, 15.0, 55.0, 68.0, 83.0, 185.0, 355.0, 639.0, 1300.0, 2798.0, 7264.0, 20976.0, 70512.0, 231863.0, 403376.0, 213656.0, 64017.0, 19429.0, 6752.0, 2736.0, 1125.0, 592.0, 315.0, 179.0, 87.0, 53.0, 41.0, 16.0, 14.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062255859375, -0.05990314483642578, -0.05755043029785156, -0.055197715759277344, -0.052845001220703125, -0.050492286682128906, -0.04813957214355469, -0.04578685760498047, -0.04343414306640625, -0.04108142852783203, -0.03872871398925781, -0.036375999450683594, -0.034023284912109375, -0.031670570373535156, -0.029317855834960938, -0.02696514129638672, -0.0246124267578125, -0.02225971221923828, -0.019906997680664062, -0.017554283142089844, -0.015201568603515625, -0.012848854064941406, -0.010496139526367188, -0.008143424987792969, -0.00579071044921875, -0.0034379959106445312, -0.0010852813720703125, 0.0012674331665039062, 0.003620147705078125, 0.005972862243652344, 0.008325576782226562, 0.010678291320800781, 0.013031005859375, 0.015383720397949219, 0.017736434936523438, 0.020089149475097656, 0.022441864013671875, 0.024794578552246094, 0.027147293090820312, 0.02950000762939453, 0.03185272216796875, 0.03420543670654297, 0.03655815124511719, 0.038910865783691406, 0.041263580322265625, 0.043616294860839844, 0.04596900939941406, 0.04832172393798828, 0.0506744384765625, 0.05302715301513672, 0.05537986755371094, 0.057732582092285156, 0.060085296630859375, 0.062438011169433594, 0.06479072570800781, 0.06714344024658203, 0.06949615478515625, 0.07184886932373047, 0.07420158386230469, 0.0765542984008789, 0.07890701293945312, 0.08125972747802734, 0.08361244201660156, 0.08596515655517578, 0.08831787109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 4.0, 9.0, 10.0, 27.0, 27.0, 36.0, 38.0, 50.0, 80.0, 96.0, 97.0, 112.0, 105.0, 81.0, 58.0, 43.0, 45.0, 33.0, 14.0, 10.0, 7.0, 8.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.179115295410156e-05, -8.864142000675201e-05, -8.549168705940247e-05, -8.234195411205292e-05, -7.919222116470337e-05, -7.604248821735382e-05, -7.289275527000427e-05, -6.974302232265472e-05, -6.659328937530518e-05, -6.344355642795563e-05, -6.029382348060608e-05, -5.714409053325653e-05, -5.399435758590698e-05, -5.0844624638557434e-05, -4.7694891691207886e-05, -4.454515874385834e-05, -4.139542579650879e-05, -3.824569284915924e-05, -3.509595990180969e-05, -3.1946226954460144e-05, -2.8796494007110596e-05, -2.5646761059761047e-05, -2.24970281124115e-05, -1.934729516506195e-05, -1.6197562217712402e-05, -1.3047829270362854e-05, -9.898096323013306e-06, -6.748363375663757e-06, -3.598630428314209e-06, -4.4889748096466064e-07, 2.7008354663848877e-06, 5.850568413734436e-06, 9.000301361083984e-06, 1.2150034308433533e-05, 1.529976725578308e-05, 1.844950020313263e-05, 2.1599233150482178e-05, 2.4748966097831726e-05, 2.7898699045181274e-05, 3.104843199253082e-05, 3.419816493988037e-05, 3.734789788722992e-05, 4.049763083457947e-05, 4.3647363781929016e-05, 4.6797096729278564e-05, 4.994682967662811e-05, 5.309656262397766e-05, 5.624629557132721e-05, 5.939602851867676e-05, 6.25457614660263e-05, 6.569549441337585e-05, 6.88452273607254e-05, 7.199496030807495e-05, 7.51446932554245e-05, 7.829442620277405e-05, 8.14441591501236e-05, 8.459389209747314e-05, 8.774362504482269e-05, 9.089335799217224e-05, 9.404309093952179e-05, 9.719282388687134e-05, 0.00010034255683422089, 0.00010349228978157043, 0.00010664202272891998, 0.00010979175567626953]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 5.0, 3.0, 9.0, 11.0, 15.0, 17.0, 18.0, 24.0, 31.0, 44.0, 54.0, 87.0, 148.0, 296.0, 716.0, 2061.0, 8963.0, 69927.0, 619955.0, 311137.0, 28057.0, 4600.0, 1302.0, 443.0, 214.0, 111.0, 73.0, 59.0, 30.0, 32.0, 21.0, 17.0, 6.0, 11.0, 8.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.134521484375, -0.13015365600585938, -0.12578582763671875, -0.12141799926757812, -0.1170501708984375, -0.11268234252929688, -0.10831451416015625, -0.10394668579101562, -0.099578857421875, -0.09521102905273438, -0.09084320068359375, -0.08647537231445312, -0.0821075439453125, -0.07773971557617188, -0.07337188720703125, -0.06900405883789062, -0.06463623046875, -0.060268402099609375, -0.05590057373046875, -0.051532745361328125, -0.0471649169921875, -0.042797088623046875, -0.03842926025390625, -0.034061431884765625, -0.029693603515625, -0.025325775146484375, -0.02095794677734375, -0.016590118408203125, -0.0122222900390625, -0.007854461669921875, -0.00348663330078125, 0.000881195068359375, 0.0052490234375, 0.009616851806640625, 0.01398468017578125, 0.018352508544921875, 0.0227203369140625, 0.027088165283203125, 0.03145599365234375, 0.035823822021484375, 0.040191650390625, 0.044559478759765625, 0.04892730712890625, 0.053295135498046875, 0.0576629638671875, 0.062030792236328125, 0.06639862060546875, 0.07076644897460938, 0.07513427734375, 0.07950210571289062, 0.08386993408203125, 0.08823776245117188, 0.0926055908203125, 0.09697341918945312, 0.10134124755859375, 0.10570907592773438, 0.110076904296875, 0.11444473266601562, 0.11881256103515625, 0.12318038940429688, 0.1275482177734375, 0.13191604614257812, 0.13628387451171875, 0.14065170288085938, 0.14501953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 5.0, 5.0, 11.0, 11.0, 17.0, 23.0, 24.0, 34.0, 46.0, 47.0, 75.0, 73.0, 55.0, 83.0, 61.0, 71.0, 68.0, 50.0, 48.0, 44.0, 30.0, 23.0, 14.0, 16.0, 11.0, 13.0, 6.0, 2.0, 3.0, 7.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0177459716796875, -0.017147541046142578, -0.016549110412597656, -0.015950679779052734, -0.015352249145507812, -0.01475381851196289, -0.014155387878417969, -0.013556957244873047, -0.012958526611328125, -0.012360095977783203, -0.011761665344238281, -0.01116323471069336, -0.010564804077148438, -0.009966373443603516, -0.009367942810058594, -0.008769512176513672, -0.00817108154296875, -0.007572650909423828, -0.006974220275878906, -0.006375789642333984, -0.0057773590087890625, -0.005178928375244141, -0.004580497741699219, -0.003982067108154297, -0.003383636474609375, -0.002785205841064453, -0.0021867752075195312, -0.0015883445739746094, -0.0009899139404296875, -0.0003914833068847656, 0.00020694732666015625, 0.0008053779602050781, 0.00140380859375, 0.002002239227294922, 0.0026006698608398438, 0.0031991004943847656, 0.0037975311279296875, 0.004395961761474609, 0.004994392395019531, 0.005592823028564453, 0.006191253662109375, 0.006789684295654297, 0.007388114929199219, 0.00798654556274414, 0.008584976196289062, 0.009183406829833984, 0.009781837463378906, 0.010380268096923828, 0.01097869873046875, 0.011577129364013672, 0.012175559997558594, 0.012773990631103516, 0.013372421264648438, 0.01397085189819336, 0.014569282531738281, 0.015167713165283203, 0.015766143798828125, 0.016364574432373047, 0.01696300506591797, 0.01756143569946289, 0.018159866333007812, 0.018758296966552734, 0.019356727600097656, 0.019955158233642578, 0.0205535888671875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 11.0, 31.0, 57.0, 97.0, 160.0, 208.0, 189.0, 147.0, 55.0, 27.0, 12.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.97476863861084, -10.578423500061035, -10.182079315185547, -9.785734176635742, -9.389389038085938, -8.99304485321045, -8.596699714660645, -8.200355529785156, -7.804010391235352, -7.407665729522705, -7.011321067810059, -6.614975929260254, -6.218631267547607, -5.822286605834961, -5.425941467285156, -5.02959680557251, -4.633252143859863, -4.236907482147217, -3.840562582015991, -3.4442176818847656, -3.047873020172119, -2.6515283584594727, -2.255183458328247, -1.8588385581970215, -1.462493896484375, -1.066149115562439, -0.6698043346405029, -0.2734595537185669, 0.12288522720336914, 0.5192300081253052, 0.9155747890472412, 1.3119196891784668, 1.7082643508911133, 2.1046090126037598, 2.5009539127349854, 2.897298812866211, 3.2936434745788574, 3.689988136291504, 4.086333274841309, 4.482677936553955, 4.879022598266602, 5.275367259979248, 5.6717119216918945, 6.068057060241699, 6.464401721954346, 6.860746383666992, 7.257091522216797, 7.653436183929443, 8.04978084564209, 8.446125984191895, 8.842470169067383, 9.238815307617188, 9.635160446166992, 10.03150463104248, 10.427849769592285, 10.824193954467773, 11.220539093017578, 11.616884231567383, 12.013228416442871, 12.409573554992676, 12.805917739868164, 13.202262878417969, 13.598608016967773, 13.994953155517578, 14.391297340393066]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 4.0, 8.0, 12.0, 13.0, 16.0, 18.0, 31.0, 25.0, 40.0, 30.0, 45.0, 50.0, 43.0, 57.0, 49.0, 51.0, 48.0, 39.0, 45.0, 44.0, 33.0, 39.0, 52.0, 34.0, 31.0, 20.0, 25.0, 12.0, 18.0, 14.0, 10.0, 12.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.816917657852173, -3.698347806930542, -3.579777956008911, -3.4612081050872803, -3.3426382541656494, -3.2240684032440186, -3.1054985523223877, -2.986928701400757, -2.868358850479126, -2.749788999557495, -2.6312191486358643, -2.5126492977142334, -2.3940794467926025, -2.2755095958709717, -2.156939744949341, -2.03836989402771, -1.9198001623153687, -1.8012303113937378, -1.682660460472107, -1.564090609550476, -1.4455207586288452, -1.326951026916504, -1.208381175994873, -1.0898113250732422, -0.9712414145469666, -0.8526715636253357, -0.7341017127037048, -0.6155319213867188, -0.4969620406627655, -0.37839221954345703, -0.25982236862182617, -0.1412525177001953, -0.022682666778564453, 0.09588717669248581, 0.21445702016353607, 0.33302685618400574, 0.4515967071056366, 0.5701665282249451, 0.6887363791465759, 0.8073062300682068, 0.9258760809898376, 1.0444458723068237, 1.1630157232284546, 1.2815855741500854, 1.4001554250717163, 1.5187252759933472, 1.637295126914978, 1.7558649778366089, 1.8744348287582397, 1.9930046796798706, 2.111574411392212, 2.2301442623138428, 2.3487141132354736, 2.4672839641571045, 2.5858538150787354, 2.704423666000366, 2.822993516921997, 2.941563367843628, 3.060133218765259, 3.1787030696868896, 3.2972729206085205, 3.4158427715301514, 3.5344126224517822, 3.652982473373413, 3.771552324295044]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 5.0, 6.0, 8.0, 13.0, 24.0, 34.0, 55.0, 80.0, 120.0, 238.0, 360.0, 615.0, 1020.0, 1765.0, 3041.0, 5492.0, 9664.0, 17273.0, 29933.0, 51365.0, 84426.0, 126997.0, 165304.0, 173097.0, 139208.0, 96299.0, 59461.0, 35357.0, 20455.0, 11531.0, 6664.0, 3670.0, 2079.0, 1137.0, 664.0, 395.0, 269.0, 156.0, 93.0, 72.0, 39.0, 22.0, 15.0, 13.0, 11.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2666015625, -1.22314453125, -1.1796875, -1.13623046875, -1.0927734375, -1.04931640625, -1.005859375, -0.96240234375, -0.9189453125, -0.87548828125, -0.83203125, -0.78857421875, -0.7451171875, -0.70166015625, -0.658203125, -0.61474609375, -0.5712890625, -0.52783203125, -0.484375, -0.44091796875, -0.3974609375, -0.35400390625, -0.310546875, -0.26708984375, -0.2236328125, -0.18017578125, -0.13671875, -0.09326171875, -0.0498046875, -0.00634765625, 0.037109375, 0.08056640625, 0.1240234375, 0.16748046875, 0.2109375, 0.25439453125, 0.2978515625, 0.34130859375, 0.384765625, 0.42822265625, 0.4716796875, 0.51513671875, 0.55859375, 0.60205078125, 0.6455078125, 0.68896484375, 0.732421875, 0.77587890625, 0.8193359375, 0.86279296875, 0.90625, 0.94970703125, 0.9931640625, 1.03662109375, 1.080078125, 1.12353515625, 1.1669921875, 1.21044921875, 1.25390625, 1.29736328125, 1.3408203125, 1.38427734375, 1.427734375, 1.47119140625, 1.5146484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 7.0, 6.0, 5.0, 9.0, 16.0, 14.0, 20.0, 19.0, 22.0, 40.0, 25.0, 34.0, 43.0, 52.0, 54.0, 63.0, 49.0, 57.0, 62.0, 52.0, 48.0, 45.0, 50.0, 39.0, 32.0, 37.0, 27.0, 23.0, 11.0, 7.0, 3.0, 9.0, 6.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.53125, -19.96142578125, -19.3916015625, -18.82177734375, -18.251953125, -17.68212890625, -17.1123046875, -16.54248046875, -15.97265625, -15.40283203125, -14.8330078125, -14.26318359375, -13.693359375, -13.12353515625, -12.5537109375, -11.98388671875, -11.4140625, -10.84423828125, -10.2744140625, -9.70458984375, -9.134765625, -8.56494140625, -7.9951171875, -7.42529296875, -6.85546875, -6.28564453125, -5.7158203125, -5.14599609375, -4.576171875, -4.00634765625, -3.4365234375, -2.86669921875, -2.296875, -1.72705078125, -1.1572265625, -0.58740234375, -0.017578125, 0.55224609375, 1.1220703125, 1.69189453125, 2.26171875, 2.83154296875, 3.4013671875, 3.97119140625, 4.541015625, 5.11083984375, 5.6806640625, 6.25048828125, 6.8203125, 7.39013671875, 7.9599609375, 8.52978515625, 9.099609375, 9.66943359375, 10.2392578125, 10.80908203125, 11.37890625, 11.94873046875, 12.5185546875, 13.08837890625, 13.658203125, 14.22802734375, 14.7978515625, 15.36767578125, 15.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 9.0, 5.0, 9.0, 13.0, 13.0, 18.0, 21.0, 45.0, 42.0, 49.0, 74.0, 80.0, 112.0, 130.0, 191.0, 275.0, 490.0, 1426.0, 12472.0, 378457.0, 626953.0, 23926.0, 2000.0, 556.0, 287.0, 206.0, 142.0, 132.0, 92.0, 66.0, 72.0, 43.0, 33.0, 33.0, 22.0, 16.0, 12.0, 9.0, 6.0, 7.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0], "bins": [-11.265625, -10.969970703125, -10.67431640625, -10.378662109375, -10.0830078125, -9.787353515625, -9.49169921875, -9.196044921875, -8.900390625, -8.604736328125, -8.30908203125, -8.013427734375, -7.7177734375, -7.422119140625, -7.12646484375, -6.830810546875, -6.53515625, -6.239501953125, -5.94384765625, -5.648193359375, -5.3525390625, -5.056884765625, -4.76123046875, -4.465576171875, -4.169921875, -3.874267578125, -3.57861328125, -3.282958984375, -2.9873046875, -2.691650390625, -2.39599609375, -2.100341796875, -1.8046875, -1.509033203125, -1.21337890625, -0.917724609375, -0.6220703125, -0.326416015625, -0.03076171875, 0.264892578125, 0.560546875, 0.856201171875, 1.15185546875, 1.447509765625, 1.7431640625, 2.038818359375, 2.33447265625, 2.630126953125, 2.92578125, 3.221435546875, 3.51708984375, 3.812744140625, 4.1083984375, 4.404052734375, 4.69970703125, 4.995361328125, 5.291015625, 5.586669921875, 5.88232421875, 6.177978515625, 6.4736328125, 6.769287109375, 7.06494140625, 7.360595703125, 7.65625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 9.0, 9.0, 11.0, 6.0, 17.0, 10.0, 21.0, 21.0, 24.0, 29.0, 33.0, 38.0, 40.0, 34.0, 36.0, 51.0, 51.0, 40.0, 60.0, 43.0, 53.0, 43.0, 34.0, 31.0, 35.0, 33.0, 38.0, 27.0, 18.0, 19.0, 14.0, 16.0, 15.0, 7.0, 4.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.734375, -16.2696533203125, -15.804931640625, -15.3402099609375, -14.87548828125, -14.4107666015625, -13.946044921875, -13.4813232421875, -13.0166015625, -12.5518798828125, -12.087158203125, -11.6224365234375, -11.15771484375, -10.6929931640625, -10.228271484375, -9.7635498046875, -9.298828125, -8.8341064453125, -8.369384765625, -7.9046630859375, -7.43994140625, -6.9752197265625, -6.510498046875, -6.0457763671875, -5.5810546875, -5.1163330078125, -4.651611328125, -4.1868896484375, -3.72216796875, -3.2574462890625, -2.792724609375, -2.3280029296875, -1.86328125, -1.3985595703125, -0.933837890625, -0.4691162109375, -0.00439453125, 0.4603271484375, 0.925048828125, 1.3897705078125, 1.8544921875, 2.3192138671875, 2.783935546875, 3.2486572265625, 3.71337890625, 4.1781005859375, 4.642822265625, 5.1075439453125, 5.572265625, 6.0369873046875, 6.501708984375, 6.9664306640625, 7.43115234375, 7.8958740234375, 8.360595703125, 8.8253173828125, 9.2900390625, 9.7547607421875, 10.219482421875, 10.6842041015625, 11.14892578125, 11.6136474609375, 12.078369140625, 12.5430908203125, 13.0078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 5.0, 11.0, 28.0, 47.0, 117.0, 469.0, 5239.0, 1035040.0, 6787.0, 572.0, 118.0, 48.0, 22.0, 16.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.57598876953125, -6.2965087890625, -6.01702880859375, -5.737548828125, -5.45806884765625, -5.1785888671875, -4.89910888671875, -4.61962890625, -4.34014892578125, -4.0606689453125, -3.78118896484375, -3.501708984375, -3.22222900390625, -2.9427490234375, -2.66326904296875, -2.3837890625, -2.10430908203125, -1.8248291015625, -1.54534912109375, -1.265869140625, -0.98638916015625, -0.7069091796875, -0.42742919921875, -0.14794921875, 0.13153076171875, 0.4110107421875, 0.69049072265625, 0.969970703125, 1.24945068359375, 1.5289306640625, 1.80841064453125, 2.087890625, 2.36737060546875, 2.6468505859375, 2.92633056640625, 3.205810546875, 3.48529052734375, 3.7647705078125, 4.04425048828125, 4.32373046875, 4.60321044921875, 4.8826904296875, 5.16217041015625, 5.441650390625, 5.72113037109375, 6.0006103515625, 6.28009033203125, 6.5595703125, 6.83905029296875, 7.1185302734375, 7.39801025390625, 7.677490234375, 7.95697021484375, 8.2364501953125, 8.51593017578125, 8.79541015625, 9.07489013671875, 9.3543701171875, 9.63385009765625, 9.913330078125, 10.19281005859375, 10.4722900390625, 10.75177001953125, 11.03125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 17.0, 26.0, 61.0, 115.0, 168.0, 187.0, 156.0, 95.0, 68.0, 41.0, 16.0, 10.0, 3.0, 7.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003647804260253906, -0.0003528296947479248, -0.000340878963470459, -0.00032892823219299316, -0.00031697750091552734, -0.0003050267696380615, -0.0002930760383605957, -0.0002811253070831299, -0.00026917457580566406, -0.00025722384452819824, -0.0002452731132507324, -0.0002333223819732666, -0.00022137165069580078, -0.00020942091941833496, -0.00019747018814086914, -0.00018551945686340332, -0.0001735687255859375, -0.00016161799430847168, -0.00014966726303100586, -0.00013771653175354004, -0.00012576580047607422, -0.0001138150691986084, -0.00010186433792114258, -8.991360664367676e-05, -7.796287536621094e-05, -6.601214408874512e-05, -5.40614128112793e-05, -4.2110681533813477e-05, -3.0159950256347656e-05, -1.8209218978881836e-05, -6.258487701416016e-06, 5.692243576049805e-06, 1.7642974853515625e-05, 2.9593706130981445e-05, 4.1544437408447266e-05, 5.3495168685913086e-05, 6.54458999633789e-05, 7.739663124084473e-05, 8.934736251831055e-05, 0.00010129809379577637, 0.00011324882507324219, 0.000125199556350708, 0.00013715028762817383, 0.00014910101890563965, 0.00016105175018310547, 0.0001730024814605713, 0.0001849532127380371, 0.00019690394401550293, 0.00020885467529296875, 0.00022080540657043457, 0.0002327561378479004, 0.0002447068691253662, 0.00025665760040283203, 0.00026860833168029785, 0.00028055906295776367, 0.0002925097942352295, 0.0003044605255126953, 0.00031641125679016113, 0.00032836198806762695, 0.0003403127193450928, 0.0003522634506225586, 0.0003642141819000244, 0.00037616491317749023, 0.00038811564445495605, 0.0004000663757324219]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 11.0, 16.0, 35.0, 39.0, 77.0, 141.0, 299.0, 979.0, 5133.0, 90292.0, 890402.0, 55586.0, 4086.0, 817.0, 257.0, 154.0, 86.0, 38.0, 25.0, 11.0, 8.0, 14.0, 6.0, 5.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.234954833984375, -2.15350341796875, -2.072052001953125, -1.9906005859375, -1.909149169921875, -1.82769775390625, -1.746246337890625, -1.664794921875, -1.583343505859375, -1.50189208984375, -1.420440673828125, -1.3389892578125, -1.257537841796875, -1.17608642578125, -1.094635009765625, -1.01318359375, -0.931732177734375, -0.85028076171875, -0.768829345703125, -0.6873779296875, -0.605926513671875, -0.52447509765625, -0.443023681640625, -0.361572265625, -0.280120849609375, -0.19866943359375, -0.117218017578125, -0.0357666015625, 0.045684814453125, 0.12713623046875, 0.208587646484375, 0.2900390625, 0.371490478515625, 0.45294189453125, 0.534393310546875, 0.6158447265625, 0.697296142578125, 0.77874755859375, 0.860198974609375, 0.941650390625, 1.023101806640625, 1.10455322265625, 1.186004638671875, 1.2674560546875, 1.348907470703125, 1.43035888671875, 1.511810302734375, 1.59326171875, 1.674713134765625, 1.75616455078125, 1.837615966796875, 1.9190673828125, 2.000518798828125, 2.08197021484375, 2.163421630859375, 2.244873046875, 2.326324462890625, 2.40777587890625, 2.489227294921875, 2.5706787109375, 2.652130126953125, 2.73358154296875, 2.815032958984375, 2.896484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 3.0, 9.0, 8.0, 10.0, 16.0, 18.0, 38.0, 36.0, 56.0, 59.0, 93.0, 66.0, 100.0, 97.0, 87.0, 81.0, 50.0, 56.0, 36.0, 27.0, 17.0, 9.0, 6.0, 6.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5537109375, -0.5372390747070312, -0.5207672119140625, -0.5042953491210938, -0.487823486328125, -0.47135162353515625, -0.4548797607421875, -0.43840789794921875, -0.42193603515625, -0.40546417236328125, -0.3889923095703125, -0.37252044677734375, -0.356048583984375, -0.33957672119140625, -0.3231048583984375, -0.30663299560546875, -0.2901611328125, -0.27368927001953125, -0.2572174072265625, -0.24074554443359375, -0.224273681640625, -0.20780181884765625, -0.1913299560546875, -0.17485809326171875, -0.15838623046875, -0.14191436767578125, -0.1254425048828125, -0.10897064208984375, -0.092498779296875, -0.07602691650390625, -0.0595550537109375, -0.04308319091796875, -0.026611328125, -0.01013946533203125, 0.0063323974609375, 0.02280426025390625, 0.039276123046875, 0.05574798583984375, 0.0722198486328125, 0.08869171142578125, 0.10516357421875, 0.12163543701171875, 0.1381072998046875, 0.15457916259765625, 0.171051025390625, 0.18752288818359375, 0.2039947509765625, 0.22046661376953125, 0.2369384765625, 0.25341033935546875, 0.2698822021484375, 0.28635406494140625, 0.302825927734375, 0.31929779052734375, 0.3357696533203125, 0.35224151611328125, 0.36871337890625, 0.38518524169921875, 0.4016571044921875, 0.41812896728515625, 0.434600830078125, 0.45107269287109375, 0.4675445556640625, 0.48401641845703125, 0.50048828125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 19.0, 55.0, 204.0, 341.0, 289.0, 80.0, 20.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.697264671325684, -7.567928314208984, -6.438591957092285, -5.309255123138428, -4.1799187660217285, -3.0505824089050293, -1.9212455749511719, -0.7919092178344727, 0.33742713928222656, 1.4667636156082153, 2.596100091934204, 3.7254366874694824, 4.854773044586182, 5.984109401702881, 7.113446235656738, 8.242782592773438, 9.372118949890137, 10.501455307006836, 11.630791664123535, 12.760128021240234, 13.88946533203125, 15.018800735473633, 16.14813804626465, 17.27747344970703, 18.406810760498047, 19.536148071289062, 20.665483474731445, 21.79482078552246, 22.924156188964844, 24.05349349975586, 25.182830810546875, 26.312166213989258, 27.44150161743164, 28.570838928222656, 29.70017433166504, 30.829511642456055, 31.958847045898438, 33.08818435668945, 34.21752166748047, 35.34685516357422, 36.476192474365234, 37.60552978515625, 38.734867095947266, 39.864200592041016, 40.99353790283203, 42.12287521362305, 43.25221252441406, 44.38154602050781, 45.510887145996094, 46.64022445678711, 47.769561767578125, 48.898895263671875, 50.02823257446289, 51.157569885253906, 52.28690719604492, 53.41624450683594, 54.54557800292969, 55.6749153137207, 56.80425262451172, 57.93358612060547, 59.062923431396484, 60.1922607421875, 61.321598052978516, 62.45093536376953, 63.58026885986328]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 5.0, 6.0, 8.0, 8.0, 7.0, 21.0, 14.0, 22.0, 25.0, 22.0, 22.0, 28.0, 34.0, 24.0, 44.0, 46.0, 51.0, 41.0, 48.0, 47.0, 50.0, 44.0, 49.0, 49.0, 48.0, 27.0, 37.0, 29.0, 26.0, 32.0, 17.0, 7.0, 7.0, 11.0, 12.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.276214599609375, -25.53334617614746, -24.790477752685547, -24.047609329223633, -23.30474090576172, -22.561872482299805, -21.81900405883789, -21.07613754272461, -20.333267211914062, -19.59039878845215, -18.847530364990234, -18.10466194152832, -17.361793518066406, -16.618925094604492, -15.876057624816895, -15.13318920135498, -14.390321731567383, -13.647453308105469, -12.904584884643555, -12.16171646118164, -11.418848037719727, -10.675979614257812, -9.933112144470215, -9.1902437210083, -8.447375297546387, -7.704506874084473, -6.961638450622559, -6.218770503997803, -5.475902080535889, -4.733033657073975, -3.9901657104492188, -3.2472972869873047, -2.5044307708740234, -1.761562466621399, -1.0186941623687744, -0.27582597732543945, 0.4670424461364746, 1.2099108695983887, 1.9527788162231445, 2.6956472396850586, 3.4385156631469727, 4.181384086608887, 4.924252510070801, 5.667120456695557, 6.409988880157471, 7.152857303619385, 7.895725250244141, 8.638593673706055, 9.381462097167969, 10.124330520629883, 10.867198944091797, 11.610067367553711, 12.352935791015625, 13.095804214477539, 13.838671684265137, 14.58154010772705, 15.324408531188965, 16.067276000976562, 16.810144424438477, 17.55301284790039, 18.295881271362305, 19.03874969482422, 19.781618118286133, 20.524486541748047, 21.26735496520996]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 10.0, 20.0, 27.0, 35.0, 50.0, 86.0, 162.0, 271.0, 515.0, 1065.0, 2239.0, 5314.0, 13311.0, 36809.0, 115715.0, 384351.0, 1034491.0, 1419658.0, 798462.0, 261169.0, 77253.0, 25715.0, 9734.0, 4063.0, 1776.0, 839.0, 463.0, 256.0, 144.0, 85.0, 54.0, 38.0, 19.0, 13.0, 10.0, 10.0, 10.0, 8.0, 5.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5234375, -4.37908935546875, -4.2347412109375, -4.09039306640625, -3.946044921875, -3.80169677734375, -3.6573486328125, -3.51300048828125, -3.36865234375, -3.22430419921875, -3.0799560546875, -2.93560791015625, -2.791259765625, -2.64691162109375, -2.5025634765625, -2.35821533203125, -2.2138671875, -2.06951904296875, -1.9251708984375, -1.78082275390625, -1.636474609375, -1.49212646484375, -1.3477783203125, -1.20343017578125, -1.05908203125, -0.91473388671875, -0.7703857421875, -0.62603759765625, -0.481689453125, -0.33734130859375, -0.1929931640625, -0.04864501953125, 0.095703125, 0.24005126953125, 0.3843994140625, 0.52874755859375, 0.673095703125, 0.81744384765625, 0.9617919921875, 1.10614013671875, 1.25048828125, 1.39483642578125, 1.5391845703125, 1.68353271484375, 1.827880859375, 1.97222900390625, 2.1165771484375, 2.26092529296875, 2.4052734375, 2.54962158203125, 2.6939697265625, 2.83831787109375, 2.982666015625, 3.12701416015625, 3.2713623046875, 3.41571044921875, 3.56005859375, 3.70440673828125, 3.8487548828125, 3.99310302734375, 4.137451171875, 4.28179931640625, 4.4261474609375, 4.57049560546875, 4.71484375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 9.0, 7.0, 8.0, 10.0, 16.0, 16.0, 31.0, 17.0, 26.0, 34.0, 38.0, 26.0, 28.0, 32.0, 44.0, 36.0, 47.0, 45.0, 49.0, 51.0, 36.0, 38.0, 44.0, 40.0, 30.0, 32.0, 41.0, 22.0, 21.0, 19.0, 20.0, 11.0, 10.0, 13.0, 6.0, 8.0, 5.0, 6.0, 5.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.76171875, -3.6334228515625, -3.505126953125, -3.3768310546875, -3.24853515625, -3.1202392578125, -2.991943359375, -2.8636474609375, -2.7353515625, -2.6070556640625, -2.478759765625, -2.3504638671875, -2.22216796875, -2.0938720703125, -1.965576171875, -1.8372802734375, -1.708984375, -1.5806884765625, -1.452392578125, -1.3240966796875, -1.19580078125, -1.0675048828125, -0.939208984375, -0.8109130859375, -0.6826171875, -0.5543212890625, -0.426025390625, -0.2977294921875, -0.16943359375, -0.0411376953125, 0.087158203125, 0.2154541015625, 0.34375, 0.4720458984375, 0.600341796875, 0.7286376953125, 0.85693359375, 0.9852294921875, 1.113525390625, 1.2418212890625, 1.3701171875, 1.4984130859375, 1.626708984375, 1.7550048828125, 1.88330078125, 2.0115966796875, 2.139892578125, 2.2681884765625, 2.396484375, 2.5247802734375, 2.653076171875, 2.7813720703125, 2.90966796875, 3.0379638671875, 3.166259765625, 3.2945556640625, 3.4228515625, 3.5511474609375, 3.679443359375, 3.8077392578125, 3.93603515625, 4.0643310546875, 4.192626953125, 4.3209228515625, 4.44921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 4.0, 8.0, 10.0, 17.0, 22.0, 75.0, 241.0, 27000.0, 4166308.0, 419.0, 63.0, 29.0, 21.0, 13.0, 4.0, 13.0, 10.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.4375, -96.2451171875, -93.052734375, -89.8603515625, -86.66796875, -83.4755859375, -80.283203125, -77.0908203125, -73.8984375, -70.7060546875, -67.513671875, -64.3212890625, -61.12890625, -57.9365234375, -54.744140625, -51.5517578125, -48.359375, -45.1669921875, -41.974609375, -38.7822265625, -35.58984375, -32.3974609375, -29.205078125, -26.0126953125, -22.8203125, -19.6279296875, -16.435546875, -13.2431640625, -10.05078125, -6.8583984375, -3.666015625, -0.4736328125, 2.71875, 5.9111328125, 9.103515625, 12.2958984375, 15.48828125, 18.6806640625, 21.873046875, 25.0654296875, 28.2578125, 31.4501953125, 34.642578125, 37.8349609375, 41.02734375, 44.2197265625, 47.412109375, 50.6044921875, 53.796875, 56.9892578125, 60.181640625, 63.3740234375, 66.56640625, 69.7587890625, 72.951171875, 76.1435546875, 79.3359375, 82.5283203125, 85.720703125, 88.9130859375, 92.10546875, 95.2978515625, 98.490234375, 101.6826171875, 104.875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 14.0, 11.0, 11.0, 16.0, 22.0, 25.0, 31.0, 57.0, 63.0, 93.0, 117.0, 168.0, 224.0, 313.0, 429.0, 508.0, 442.0, 409.0, 317.0, 217.0, 164.0, 114.0, 78.0, 66.0, 49.0, 30.0, 17.0, 27.0, 8.0, 12.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.4609375, -2.39410400390625, -2.3272705078125, -2.26043701171875, -2.193603515625, -2.12677001953125, -2.0599365234375, -1.99310302734375, -1.92626953125, -1.85943603515625, -1.7926025390625, -1.72576904296875, -1.658935546875, -1.59210205078125, -1.5252685546875, -1.45843505859375, -1.3916015625, -1.32476806640625, -1.2579345703125, -1.19110107421875, -1.124267578125, -1.05743408203125, -0.9906005859375, -0.92376708984375, -0.85693359375, -0.79010009765625, -0.7232666015625, -0.65643310546875, -0.589599609375, -0.52276611328125, -0.4559326171875, -0.38909912109375, -0.322265625, -0.25543212890625, -0.1885986328125, -0.12176513671875, -0.054931640625, 0.01190185546875, 0.0787353515625, 0.14556884765625, 0.21240234375, 0.27923583984375, 0.3460693359375, 0.41290283203125, 0.479736328125, 0.54656982421875, 0.6134033203125, 0.68023681640625, 0.7470703125, 0.81390380859375, 0.8807373046875, 0.94757080078125, 1.014404296875, 1.08123779296875, 1.1480712890625, 1.21490478515625, 1.28173828125, 1.34857177734375, 1.4154052734375, 1.48223876953125, 1.549072265625, 1.61590576171875, 1.6827392578125, 1.74957275390625, 1.81640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 21.0, 27.0, 33.0, 40.0, 58.0, 71.0, 81.0, 83.0, 98.0, 92.0, 83.0, 79.0, 55.0, 52.0, 36.0, 32.0, 16.0, 12.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.964637279510498, -4.736578941345215, -4.50852108001709, -4.280462741851807, -4.052404403686523, -3.8243460655212402, -3.596287965774536, -3.368229866027832, -3.140171527862549, -2.9121131896972656, -2.6840550899505615, -2.4559969902038574, -2.227938652038574, -1.9998804330825806, -1.771822214126587, -1.5437639951705933, -1.3157057762145996, -1.087647557258606, -0.8595893383026123, -0.6315311193466187, -0.403472900390625, -0.17541468143463135, 0.052643537521362305, 0.28070175647735596, 0.5087599754333496, 0.7368181943893433, 0.9648764133453369, 1.1929346323013306, 1.4209928512573242, 1.6490510702133179, 1.8771092891693115, 2.1051673889160156, 2.333226203918457, 2.5612845420837402, 2.7893426418304443, 3.0174007415771484, 3.2454590797424316, 3.473517417907715, 3.701575517654419, 3.929633617401123, 4.157691955566406, 4.3857502937316895, 4.613808631896973, 4.841866493225098, 5.069924831390381, 5.297983169555664, 5.526041030883789, 5.754099369049072, 5.9821577072143555, 6.210216045379639, 6.438274383544922, 6.666332244873047, 6.89439058303833, 7.122448921203613, 7.350506782531738, 7.5785651206970215, 7.806623458862305, 8.03468132019043, 8.262740135192871, 8.490797996520996, 8.718856811523438, 8.946914672851562, 9.174972534179688, 9.403031349182129, 9.631089210510254]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 7.0, 6.0, 5.0, 14.0, 21.0, 15.0, 23.0, 25.0, 23.0, 37.0, 33.0, 27.0, 42.0, 41.0, 41.0, 47.0, 57.0, 40.0, 30.0, 44.0, 35.0, 34.0, 37.0, 25.0, 36.0, 32.0, 26.0, 31.0, 20.0, 23.0, 22.0, 17.0, 13.0, 9.0, 5.0, 12.0, 7.0, 6.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-4.238742351531982, -4.105901718139648, -3.9730613231658936, -3.8402206897735596, -3.7073802947998047, -3.5745396614074707, -3.4416990280151367, -3.3088583946228027, -3.176017999649048, -3.043177366256714, -2.910336971282959, -2.777496337890625, -2.644655704498291, -2.511815309524536, -2.378974676132202, -2.2461342811584473, -2.1132936477661133, -1.9804531335830688, -1.8476126194000244, -1.7147719860076904, -1.581931471824646, -1.4490909576416016, -1.3162503242492676, -1.1834098100662231, -1.0505692958831787, -0.9177287817001343, -0.7848882079124451, -0.6520476341247559, -0.5192071199417114, -0.386366605758667, -0.2535260319709778, -0.12068545818328857, 0.01215505599975586, 0.14499559998512268, 0.2778361439704895, 0.4106766879558563, 0.5435172319412231, 0.6763577461242676, 0.8091983199119568, 0.942038893699646, 1.0748794078826904, 1.2077199220657349, 1.3405604362487793, 1.4734010696411133, 1.6062415838241577, 1.7390820980072021, 1.8719227313995361, 2.004763126373291, 2.137603759765625, 2.270444393157959, 2.403284788131714, 2.536125421524048, 2.6689658164978027, 2.8018064498901367, 2.9346470832824707, 3.0674877166748047, 3.2003281116485596, 3.3331687450408936, 3.4660091400146484, 3.5988497734069824, 3.7316904067993164, 3.8645308017730713, 3.9973714351654053, 4.13021183013916, 4.263052463531494]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 10.0, 5.0, 10.0, 15.0, 26.0, 28.0, 35.0, 45.0, 57.0, 82.0, 117.0, 155.0, 171.0, 252.0, 355.0, 418.0, 532.0, 750.0, 1021.0, 1380.0, 2005.0, 3514.0, 8143.0, 29977.0, 132495.0, 402008.0, 335165.0, 92255.0, 21239.0, 6472.0, 2996.0, 1756.0, 1276.0, 933.0, 681.0, 542.0, 405.0, 299.0, 220.0, 162.0, 132.0, 97.0, 83.0, 57.0, 59.0, 35.0, 23.0, 20.0, 12.0, 15.0, 10.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.82763671875, -0.8016738891601562, -0.7757110595703125, -0.7497482299804688, -0.723785400390625, -0.6978225708007812, -0.6718597412109375, -0.6458969116210938, -0.61993408203125, -0.5939712524414062, -0.5680084228515625, -0.5420455932617188, -0.516082763671875, -0.49011993408203125, -0.4641571044921875, -0.43819427490234375, -0.4122314453125, -0.38626861572265625, -0.3603057861328125, -0.33434295654296875, -0.308380126953125, -0.28241729736328125, -0.2564544677734375, -0.23049163818359375, -0.20452880859375, -0.17856597900390625, -0.1526031494140625, -0.12664031982421875, -0.100677490234375, -0.07471466064453125, -0.0487518310546875, -0.02278900146484375, 0.003173828125, 0.02913665771484375, 0.0550994873046875, 0.08106231689453125, 0.107025146484375, 0.13298797607421875, 0.1589508056640625, 0.18491363525390625, 0.21087646484375, 0.23683929443359375, 0.2628021240234375, 0.28876495361328125, 0.314727783203125, 0.34069061279296875, 0.3666534423828125, 0.39261627197265625, 0.4185791015625, 0.44454193115234375, 0.4705047607421875, 0.49646759033203125, 0.522430419921875, 0.5483932495117188, 0.5743560791015625, 0.6003189086914062, 0.62628173828125, 0.6522445678710938, 0.6782073974609375, 0.7041702270507812, 0.730133056640625, 0.7560958862304688, 0.7820587158203125, 0.8080215454101562, 0.833984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 13.0, 10.0, 15.0, 29.0, 13.0, 22.0, 21.0, 34.0, 37.0, 39.0, 41.0, 35.0, 36.0, 46.0, 25.0, 52.0, 48.0, 42.0, 30.0, 43.0, 40.0, 35.0, 23.0, 38.0, 21.0, 34.0, 30.0, 25.0, 16.0, 11.0, 10.0, 13.0, 10.0, 10.0, 7.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.650390625, -2.560577392578125, -2.47076416015625, -2.380950927734375, -2.2911376953125, -2.201324462890625, -2.11151123046875, -2.021697998046875, -1.931884765625, -1.842071533203125, -1.75225830078125, -1.662445068359375, -1.5726318359375, -1.482818603515625, -1.39300537109375, -1.303192138671875, -1.21337890625, -1.123565673828125, -1.03375244140625, -0.943939208984375, -0.8541259765625, -0.764312744140625, -0.67449951171875, -0.584686279296875, -0.494873046875, -0.405059814453125, -0.31524658203125, -0.225433349609375, -0.1356201171875, -0.045806884765625, 0.04400634765625, 0.133819580078125, 0.2236328125, 0.313446044921875, 0.40325927734375, 0.493072509765625, 0.5828857421875, 0.672698974609375, 0.76251220703125, 0.852325439453125, 0.942138671875, 1.031951904296875, 1.12176513671875, 1.211578369140625, 1.3013916015625, 1.391204833984375, 1.48101806640625, 1.570831298828125, 1.66064453125, 1.750457763671875, 1.84027099609375, 1.930084228515625, 2.0198974609375, 2.109710693359375, 2.19952392578125, 2.289337158203125, 2.379150390625, 2.468963623046875, 2.55877685546875, 2.648590087890625, 2.7384033203125, 2.828216552734375, 2.91802978515625, 3.007843017578125, 3.09765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 14.0, 21.0, 37.0, 50.0, 105.0, 189.0, 295.0, 647.0, 1177.0, 2403.0, 4537.0, 8963.0, 17668.0, 32726.0, 60601.0, 105859.0, 164604.0, 202284.0, 178463.0, 118634.0, 69643.0, 37997.0, 19847.0, 10712.0, 5413.0, 2754.0, 1372.0, 706.0, 388.0, 194.0, 106.0, 47.0, 20.0, 22.0, 15.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28369140625, -0.2744255065917969, -0.26515960693359375, -0.2558937072753906, -0.2466278076171875, -0.23736190795898438, -0.22809600830078125, -0.21883010864257812, -0.209564208984375, -0.20029830932617188, -0.19103240966796875, -0.18176651000976562, -0.1725006103515625, -0.16323471069335938, -0.15396881103515625, -0.14470291137695312, -0.13543701171875, -0.12617111206054688, -0.11690521240234375, -0.10763931274414062, -0.0983734130859375, -0.08910751342773438, -0.07984161376953125, -0.07057571411132812, -0.061309814453125, -0.052043914794921875, -0.04277801513671875, -0.033512115478515625, -0.0242462158203125, -0.014980316162109375, -0.00571441650390625, 0.003551483154296875, 0.0128173828125, 0.022083282470703125, 0.03134918212890625, 0.040615081787109375, 0.0498809814453125, 0.059146881103515625, 0.06841278076171875, 0.07767868041992188, 0.086944580078125, 0.09621047973632812, 0.10547637939453125, 0.11474227905273438, 0.1240081787109375, 0.13327407836914062, 0.14253997802734375, 0.15180587768554688, 0.16107177734375, 0.17033767700195312, 0.17960357666015625, 0.18886947631835938, 0.1981353759765625, 0.20740127563476562, 0.21666717529296875, 0.22593307495117188, 0.235198974609375, 0.24446487426757812, 0.25373077392578125, 0.2629966735839844, 0.2722625732421875, 0.2815284729003906, 0.29079437255859375, 0.3000602722167969, 0.309326171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 5.0, 8.0, 5.0, 8.0, 6.0, 16.0, 18.0, 21.0, 13.0, 18.0, 26.0, 20.0, 32.0, 32.0, 37.0, 39.0, 44.0, 58.0, 43.0, 51.0, 75.0, 54.0, 56.0, 36.0, 34.0, 38.0, 27.0, 33.0, 30.0, 20.0, 25.0, 11.0, 14.0, 12.0, 9.0, 2.0, 6.0, 8.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.21484375, -6.0247802734375, -5.834716796875, -5.6446533203125, -5.45458984375, -5.2645263671875, -5.074462890625, -4.8843994140625, -4.6943359375, -4.5042724609375, -4.314208984375, -4.1241455078125, -3.93408203125, -3.7440185546875, -3.553955078125, -3.3638916015625, -3.173828125, -2.9837646484375, -2.793701171875, -2.6036376953125, -2.41357421875, -2.2235107421875, -2.033447265625, -1.8433837890625, -1.6533203125, -1.4632568359375, -1.273193359375, -1.0831298828125, -0.89306640625, -0.7030029296875, -0.512939453125, -0.3228759765625, -0.1328125, 0.0572509765625, 0.247314453125, 0.4373779296875, 0.62744140625, 0.8175048828125, 1.007568359375, 1.1976318359375, 1.3876953125, 1.5777587890625, 1.767822265625, 1.9578857421875, 2.14794921875, 2.3380126953125, 2.528076171875, 2.7181396484375, 2.908203125, 3.0982666015625, 3.288330078125, 3.4783935546875, 3.66845703125, 3.8585205078125, 4.048583984375, 4.2386474609375, 4.4287109375, 4.6187744140625, 4.808837890625, 4.9989013671875, 5.18896484375, 5.3790283203125, 5.569091796875, 5.7591552734375, 5.94921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 10.0, 8.0, 23.0, 32.0, 43.0, 64.0, 76.0, 133.0, 227.0, 350.0, 717.0, 1519.0, 3315.0, 8583.0, 27051.0, 104885.0, 361604.0, 379720.0, 115058.0, 29096.0, 9133.0, 3584.0, 1572.0, 755.0, 391.0, 207.0, 125.0, 92.0, 49.0, 46.0, 20.0, 17.0, 20.0, 3.0, 7.0, 6.0, 2.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0684814453125, -0.06640815734863281, -0.06433486938476562, -0.06226158142089844, -0.06018829345703125, -0.05811500549316406, -0.056041717529296875, -0.05396842956542969, -0.0518951416015625, -0.04982185363769531, -0.047748565673828125, -0.04567527770996094, -0.04360198974609375, -0.04152870178222656, -0.039455413818359375, -0.03738212585449219, -0.035308837890625, -0.03323554992675781, -0.031162261962890625, -0.029088973999023438, -0.02701568603515625, -0.024942398071289062, -0.022869110107421875, -0.020795822143554688, -0.0187225341796875, -0.016649246215820312, -0.014575958251953125, -0.012502670288085938, -0.01042938232421875, -0.008356094360351562, -0.006282806396484375, -0.0042095184326171875, -0.00213623046875, -6.29425048828125e-05, 0.002010345458984375, 0.0040836334228515625, 0.00615692138671875, 0.008230209350585938, 0.010303497314453125, 0.012376785278320312, 0.0144500732421875, 0.016523361206054688, 0.018596649169921875, 0.020669937133789062, 0.02274322509765625, 0.024816513061523438, 0.026889801025390625, 0.028963088989257812, 0.031036376953125, 0.03310966491699219, 0.035182952880859375, 0.03725624084472656, 0.03932952880859375, 0.04140281677246094, 0.043476104736328125, 0.04554939270019531, 0.0476226806640625, 0.04969596862792969, 0.051769256591796875, 0.05384254455566406, 0.05591583251953125, 0.05798912048339844, 0.060062408447265625, 0.06213569641113281, 0.064208984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 12.0, 12.0, 22.0, 25.0, 29.0, 42.0, 58.0, 46.0, 93.0, 97.0, 114.0, 65.0, 85.0, 89.0, 62.0, 37.0, 38.0, 17.0, 25.0, 5.0, 11.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-05, -5.1616691052913666e-05, -4.958920180797577e-05, -4.756171256303787e-05, -4.5534223318099976e-05, -4.350673407316208e-05, -4.147924482822418e-05, -3.9451755583286285e-05, -3.742426633834839e-05, -3.539677709341049e-05, -3.3369287848472595e-05, -3.13417986035347e-05, -2.9314309358596802e-05, -2.7286820113658905e-05, -2.5259330868721008e-05, -2.323184162378311e-05, -2.1204352378845215e-05, -1.9176863133907318e-05, -1.714937388896942e-05, -1.5121884644031525e-05, -1.3094395399093628e-05, -1.1066906154155731e-05, -9.039416909217834e-06, -7.011927664279938e-06, -4.984438419342041e-06, -2.9569491744041443e-06, -9.294599294662476e-07, 1.0980293154716492e-06, 3.125518560409546e-06, 5.153007805347443e-06, 7.180497050285339e-06, 9.207986295223236e-06, 1.1235475540161133e-05, 1.326296478509903e-05, 1.5290454030036926e-05, 1.7317943274974823e-05, 1.934543251991272e-05, 2.1372921764850616e-05, 2.3400411009788513e-05, 2.542790025472641e-05, 2.7455389499664307e-05, 2.9482878744602203e-05, 3.15103679895401e-05, 3.3537857234478e-05, 3.5565346479415894e-05, 3.759283572435379e-05, 3.962032496929169e-05, 4.1647814214229584e-05, 4.367530345916748e-05, 4.570279270410538e-05, 4.7730281949043274e-05, 4.975777119398117e-05, 5.178526043891907e-05, 5.3812749683856964e-05, 5.584023892879486e-05, 5.786772817373276e-05, 5.9895217418670654e-05, 6.192270666360855e-05, 6.395019590854645e-05, 6.597768515348434e-05, 6.800517439842224e-05, 7.003266364336014e-05, 7.206015288829803e-05, 7.408764213323593e-05, 7.611513137817383e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 8.0, 11.0, 25.0, 29.0, 32.0, 59.0, 85.0, 132.0, 433.0, 3419.0, 94243.0, 911685.0, 35643.0, 2025.0, 356.0, 127.0, 59.0, 43.0, 34.0, 20.0, 15.0, 10.0, 14.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2177734375, -0.21104812622070312, -0.20432281494140625, -0.19759750366210938, -0.1908721923828125, -0.18414688110351562, -0.17742156982421875, -0.17069625854492188, -0.163970947265625, -0.15724563598632812, -0.15052032470703125, -0.14379501342773438, -0.1370697021484375, -0.13034439086914062, -0.12361907958984375, -0.11689376831054688, -0.11016845703125, -0.10344314575195312, -0.09671783447265625, -0.08999252319335938, -0.0832672119140625, -0.07654190063476562, -0.06981658935546875, -0.06309127807617188, -0.056365966796875, -0.049640655517578125, -0.04291534423828125, -0.036190032958984375, -0.0294647216796875, -0.022739410400390625, -0.01601409912109375, -0.009288787841796875, -0.0025634765625, 0.004161834716796875, 0.01088714599609375, 0.017612457275390625, 0.0243377685546875, 0.031063079833984375, 0.03778839111328125, 0.044513702392578125, 0.051239013671875, 0.057964324951171875, 0.06468963623046875, 0.07141494750976562, 0.0781402587890625, 0.08486557006835938, 0.09159088134765625, 0.09831619262695312, 0.10504150390625, 0.11176681518554688, 0.11849212646484375, 0.12521743774414062, 0.1319427490234375, 0.13866806030273438, 0.14539337158203125, 0.15211868286132812, 0.158843994140625, 0.16556930541992188, 0.17229461669921875, 0.17901992797851562, 0.1857452392578125, 0.19247055053710938, 0.19919586181640625, 0.20592117309570312, 0.212646484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 11.0, 14.0, 22.0, 12.0, 31.0, 38.0, 55.0, 59.0, 91.0, 108.0, 118.0, 100.0, 89.0, 69.0, 52.0, 22.0, 23.0, 19.0, 11.0, 10.0, 9.0, 7.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0220947265625, -0.021407127380371094, -0.020719528198242188, -0.02003192901611328, -0.019344329833984375, -0.01865673065185547, -0.017969131469726562, -0.017281532287597656, -0.01659393310546875, -0.015906333923339844, -0.015218734741210938, -0.014531135559082031, -0.013843536376953125, -0.013155937194824219, -0.012468338012695312, -0.011780738830566406, -0.0110931396484375, -0.010405540466308594, -0.009717941284179688, -0.009030342102050781, -0.008342742919921875, -0.007655143737792969, -0.0069675445556640625, -0.006279945373535156, -0.00559234619140625, -0.004904747009277344, -0.0042171478271484375, -0.0035295486450195312, -0.002841949462890625, -0.0021543502807617188, -0.0014667510986328125, -0.0007791519165039062, -9.1552734375e-05, 0.0005960464477539062, 0.0012836456298828125, 0.0019712448120117188, 0.002658843994140625, 0.0033464431762695312, 0.0040340423583984375, 0.004721641540527344, 0.00540924072265625, 0.006096839904785156, 0.0067844390869140625, 0.007472038269042969, 0.008159637451171875, 0.008847236633300781, 0.009534835815429688, 0.010222434997558594, 0.0109100341796875, 0.011597633361816406, 0.012285232543945312, 0.012972831726074219, 0.013660430908203125, 0.014348030090332031, 0.015035629272460938, 0.015723228454589844, 0.01641082763671875, 0.017098426818847656, 0.017786026000976562, 0.01847362518310547, 0.019161224365234375, 0.01984882354736328, 0.020536422729492188, 0.021224021911621094, 0.02191162109375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 6.0, 11.0, 17.0, 26.0, 49.0, 58.0, 87.0, 97.0, 112.0, 119.0, 110.0, 81.0, 82.0, 54.0, 39.0, 25.0, 10.0, 3.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.748645305633545, -6.567481994628906, -6.386318206787109, -6.205154895782471, -6.023991584777832, -5.842827796936035, -5.6616644859313965, -5.480501174926758, -5.299337387084961, -5.118174076080322, -4.937010288238525, -4.755846977233887, -4.574683666229248, -4.393520355224609, -4.2123565673828125, -4.031193256378174, -3.850029945373535, -3.6688663959503174, -3.4877030849456787, -3.306539535522461, -3.1253762245178223, -2.9442126750946045, -2.7630491256713867, -2.581885814666748, -2.4007222652435303, -2.2195587158203125, -2.038395404815674, -1.857231855392456, -1.6760684251785278, -1.4949049949645996, -1.3137414455413818, -1.1325780153274536, -0.9514145851135254, -0.7702511548995972, -0.5890876650810242, -0.40792417526245117, -0.22676074504852295, -0.04559731483459473, 0.13556623458862305, 0.31672966480255127, 0.4978930950164795, 0.6790565252304077, 0.8602200150489807, 1.0413835048675537, 1.222546935081482, 1.4037103652954102, 1.584873914718628, 1.7660373449325562, 1.9472007751464844, 2.128364324569702, 2.309527635574341, 2.4906911849975586, 2.6718544960021973, 2.853018045425415, 3.034181594848633, 3.2153449058532715, 3.3965084552764893, 3.577672004699707, 3.7588353157043457, 3.9399988651275635, 4.121162414550781, 4.30232572555542, 4.483489036560059, 4.6646528244018555, 4.845816135406494]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 5.0, 10.0, 21.0, 16.0, 22.0, 21.0, 23.0, 30.0, 34.0, 35.0, 40.0, 42.0, 38.0, 44.0, 48.0, 43.0, 43.0, 39.0, 37.0, 36.0, 41.0, 27.0, 35.0, 34.0, 35.0, 23.0, 18.0, 25.0, 23.0, 16.0, 9.0, 14.0, 5.0, 10.0, 9.0, 7.0, 8.0, 0.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.8218719959259033, -2.735198974609375, -2.6485259532928467, -2.5618529319763184, -2.47517991065979, -2.3885068893432617, -2.3018336296081543, -2.215160846710205, -2.1284875869750977, -2.0418145656585693, -1.955141544342041, -1.8684685230255127, -1.7817955017089844, -1.695122480392456, -1.6084493398666382, -1.5217763185501099, -1.435103416442871, -1.3484303951263428, -1.2617573738098145, -1.1750843524932861, -1.0884113311767578, -1.0017383098602295, -0.9150651693344116, -0.8283921480178833, -0.741719126701355, -0.6550461053848267, -0.5683730840682983, -0.48170000314712524, -0.3950269818305969, -0.3083539605140686, -0.2216808795928955, -0.1350078582763672, -0.048334598541259766, 0.03833843767642975, 0.12501147389411926, 0.21168452501296997, 0.2983575463294983, 0.3850305676460266, 0.4717036485671997, 0.558376669883728, 0.6450496912002563, 0.7317227125167847, 0.818395733833313, 0.9050688147544861, 0.9917418360710144, 1.0784149169921875, 1.1650879383087158, 1.2517609596252441, 1.3384339809417725, 1.4251070022583008, 1.511780023574829, 1.5984530448913574, 1.6851260662078857, 1.771799087524414, 1.858472228050232, 1.9451452493667603, 2.031818389892578, 2.1184914112091064, 2.2051644325256348, 2.291837453842163, 2.3785104751586914, 2.4651834964752197, 2.551856517791748, 2.6385297775268555, 2.7252025604248047]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 2.0, 7.0, 11.0, 21.0, 25.0, 20.0, 51.0, 74.0, 125.0, 182.0, 289.0, 456.0, 776.0, 1384.0, 2275.0, 4503.0, 8769.0, 19064.0, 43174.0, 100931.0, 214778.0, 292768.0, 195680.0, 90182.0, 38462.0, 16907.0, 8090.0, 4206.0, 2182.0, 1275.0, 740.0, 423.0, 240.0, 180.0, 97.0, 64.0, 48.0, 26.0, 20.0, 12.0, 8.0, 7.0, 7.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.983642578125, -1.91845703125, -1.853271484375, -1.7880859375, -1.722900390625, -1.65771484375, -1.592529296875, -1.52734375, -1.462158203125, -1.39697265625, -1.331787109375, -1.2666015625, -1.201416015625, -1.13623046875, -1.071044921875, -1.005859375, -0.940673828125, -0.87548828125, -0.810302734375, -0.7451171875, -0.679931640625, -0.61474609375, -0.549560546875, -0.484375, -0.419189453125, -0.35400390625, -0.288818359375, -0.2236328125, -0.158447265625, -0.09326171875, -0.028076171875, 0.037109375, 0.102294921875, 0.16748046875, 0.232666015625, 0.2978515625, 0.363037109375, 0.42822265625, 0.493408203125, 0.55859375, 0.623779296875, 0.68896484375, 0.754150390625, 0.8193359375, 0.884521484375, 0.94970703125, 1.014892578125, 1.080078125, 1.145263671875, 1.21044921875, 1.275634765625, 1.3408203125, 1.406005859375, 1.47119140625, 1.536376953125, 1.6015625, 1.666748046875, 1.73193359375, 1.797119140625, 1.8623046875, 1.927490234375, 1.99267578125, 2.057861328125, 2.123046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 10.0, 11.0, 8.0, 10.0, 6.0, 20.0, 13.0, 13.0, 13.0, 26.0, 32.0, 27.0, 33.0, 34.0, 47.0, 58.0, 43.0, 46.0, 46.0, 38.0, 44.0, 49.0, 33.0, 40.0, 59.0, 38.0, 29.0, 29.0, 23.0, 25.0, 21.0, 19.0, 13.0, 13.0, 11.0, 5.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.21875, -8.95611572265625, -8.6934814453125, -8.43084716796875, -8.168212890625, -7.90557861328125, -7.6429443359375, -7.38031005859375, -7.11767578125, -6.85504150390625, -6.5924072265625, -6.32977294921875, -6.067138671875, -5.80450439453125, -5.5418701171875, -5.27923583984375, -5.0166015625, -4.75396728515625, -4.4913330078125, -4.22869873046875, -3.966064453125, -3.70343017578125, -3.4407958984375, -3.17816162109375, -2.91552734375, -2.65289306640625, -2.3902587890625, -2.12762451171875, -1.864990234375, -1.60235595703125, -1.3397216796875, -1.07708740234375, -0.814453125, -0.55181884765625, -0.2891845703125, -0.02655029296875, 0.236083984375, 0.49871826171875, 0.7613525390625, 1.02398681640625, 1.28662109375, 1.54925537109375, 1.8118896484375, 2.07452392578125, 2.337158203125, 2.59979248046875, 2.8624267578125, 3.12506103515625, 3.3876953125, 3.65032958984375, 3.9129638671875, 4.17559814453125, 4.438232421875, 4.70086669921875, 4.9635009765625, 5.22613525390625, 5.48876953125, 5.75140380859375, 6.0140380859375, 6.27667236328125, 6.539306640625, 6.80194091796875, 7.0645751953125, 7.32720947265625, 7.58984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 10.0, 5.0, 6.0, 8.0, 5.0, 12.0, 24.0, 26.0, 20.0, 20.0, 29.0, 29.0, 67.0, 73.0, 90.0, 159.0, 282.0, 726.0, 29629.0, 1011862.0, 4252.0, 478.0, 222.0, 123.0, 92.0, 78.0, 37.0, 37.0, 33.0, 25.0, 13.0, 6.0, 10.0, 7.0, 16.0, 8.0, 5.0, 10.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-23.453125, -22.789306640625, -22.12548828125, -21.461669921875, -20.7978515625, -20.134033203125, -19.47021484375, -18.806396484375, -18.142578125, -17.478759765625, -16.81494140625, -16.151123046875, -15.4873046875, -14.823486328125, -14.15966796875, -13.495849609375, -12.83203125, -12.168212890625, -11.50439453125, -10.840576171875, -10.1767578125, -9.512939453125, -8.84912109375, -8.185302734375, -7.521484375, -6.857666015625, -6.19384765625, -5.530029296875, -4.8662109375, -4.202392578125, -3.53857421875, -2.874755859375, -2.2109375, -1.547119140625, -0.88330078125, -0.219482421875, 0.4443359375, 1.108154296875, 1.77197265625, 2.435791015625, 3.099609375, 3.763427734375, 4.42724609375, 5.091064453125, 5.7548828125, 6.418701171875, 7.08251953125, 7.746337890625, 8.41015625, 9.073974609375, 9.73779296875, 10.401611328125, 11.0654296875, 11.729248046875, 12.39306640625, 13.056884765625, 13.720703125, 14.384521484375, 15.04833984375, 15.712158203125, 16.3759765625, 17.039794921875, 17.70361328125, 18.367431640625, 19.03125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 7.0, 6.0, 7.0, 7.0, 6.0, 14.0, 21.0, 18.0, 15.0, 27.0, 20.0, 22.0, 43.0, 36.0, 36.0, 33.0, 53.0, 46.0, 51.0, 51.0, 63.0, 49.0, 56.0, 35.0, 36.0, 32.0, 34.0, 25.0, 22.0, 31.0, 16.0, 7.0, 7.0, 13.0, 8.0, 6.0, 10.0, 5.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.609375, -9.32958984375, -9.0498046875, -8.77001953125, -8.490234375, -8.21044921875, -7.9306640625, -7.65087890625, -7.37109375, -7.09130859375, -6.8115234375, -6.53173828125, -6.251953125, -5.97216796875, -5.6923828125, -5.41259765625, -5.1328125, -4.85302734375, -4.5732421875, -4.29345703125, -4.013671875, -3.73388671875, -3.4541015625, -3.17431640625, -2.89453125, -2.61474609375, -2.3349609375, -2.05517578125, -1.775390625, -1.49560546875, -1.2158203125, -0.93603515625, -0.65625, -0.37646484375, -0.0966796875, 0.18310546875, 0.462890625, 0.74267578125, 1.0224609375, 1.30224609375, 1.58203125, 1.86181640625, 2.1416015625, 2.42138671875, 2.701171875, 2.98095703125, 3.2607421875, 3.54052734375, 3.8203125, 4.10009765625, 4.3798828125, 4.65966796875, 4.939453125, 5.21923828125, 5.4990234375, 5.77880859375, 6.05859375, 6.33837890625, 6.6181640625, 6.89794921875, 7.177734375, 7.45751953125, 7.7373046875, 8.01708984375, 8.296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 10.0, 9.0, 5.0, 15.0, 20.0, 46.0, 54.0, 74.0, 132.0, 213.0, 636.0, 3333.0, 89107.0, 926992.0, 25162.0, 1815.0, 420.0, 172.0, 120.0, 72.0, 45.0, 23.0, 17.0, 14.0, 13.0, 6.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.392578125, -3.28082275390625, -3.1690673828125, -3.05731201171875, -2.945556640625, -2.83380126953125, -2.7220458984375, -2.61029052734375, -2.49853515625, -2.38677978515625, -2.2750244140625, -2.16326904296875, -2.051513671875, -1.93975830078125, -1.8280029296875, -1.71624755859375, -1.6044921875, -1.49273681640625, -1.3809814453125, -1.26922607421875, -1.157470703125, -1.04571533203125, -0.9339599609375, -0.82220458984375, -0.71044921875, -0.59869384765625, -0.4869384765625, -0.37518310546875, -0.263427734375, -0.15167236328125, -0.0399169921875, 0.07183837890625, 0.18359375, 0.29534912109375, 0.4071044921875, 0.51885986328125, 0.630615234375, 0.74237060546875, 0.8541259765625, 0.96588134765625, 1.07763671875, 1.18939208984375, 1.3011474609375, 1.41290283203125, 1.524658203125, 1.63641357421875, 1.7481689453125, 1.85992431640625, 1.9716796875, 2.08343505859375, 2.1951904296875, 2.30694580078125, 2.418701171875, 2.53045654296875, 2.6422119140625, 2.75396728515625, 2.86572265625, 2.97747802734375, 3.0892333984375, 3.20098876953125, 3.312744140625, 3.42449951171875, 3.5362548828125, 3.64801025390625, 3.759765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 8.0, 8.0, 12.0, 13.0, 8.0, 18.0, 34.0, 34.0, 56.0, 73.0, 75.0, 110.0, 105.0, 86.0, 103.0, 60.0, 44.0, 48.0, 22.0, 27.0, 20.0, 12.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000213623046875, -0.00020686909556388855, -0.0002001151442527771, -0.00019336119294166565, -0.0001866072416305542, -0.00017985329031944275, -0.0001730993390083313, -0.00016634538769721985, -0.0001595914363861084, -0.00015283748507499695, -0.0001460835337638855, -0.00013932958245277405, -0.0001325756311416626, -0.00012582167983055115, -0.0001190677285194397, -0.00011231377720832825, -0.0001055598258972168, -9.880587458610535e-05, -9.20519232749939e-05, -8.529797196388245e-05, -7.8544020652771e-05, -7.179006934165955e-05, -6.50361180305481e-05, -5.8282166719436646e-05, -5.1528215408325195e-05, -4.4774264097213745e-05, -3.8020312786102295e-05, -3.1266361474990845e-05, -2.4512410163879395e-05, -1.7758458852767944e-05, -1.1004507541656494e-05, -4.250556230545044e-06, 2.5033950805664062e-06, 9.257346391677856e-06, 1.6011297702789307e-05, 2.2765249013900757e-05, 2.9519200325012207e-05, 3.627315163612366e-05, 4.302710294723511e-05, 4.978105425834656e-05, 5.653500556945801e-05, 6.328895688056946e-05, 7.004290819168091e-05, 7.679685950279236e-05, 8.355081081390381e-05, 9.030476212501526e-05, 9.705871343612671e-05, 0.00010381266474723816, 0.00011056661605834961, 0.00011732056736946106, 0.0001240745186805725, 0.00013082846999168396, 0.0001375824213027954, 0.00014433637261390686, 0.0001510903239250183, 0.00015784427523612976, 0.0001645982265472412, 0.00017135217785835266, 0.0001781061291694641, 0.00018486008048057556, 0.000191614031791687, 0.00019836798310279846, 0.0002051219344139099, 0.00021187588572502136, 0.0002186298370361328]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 6.0, 6.0, 21.0, 17.0, 45.0, 53.0, 153.0, 354.0, 1641.0, 32139.0, 975824.0, 35878.0, 1686.0, 394.0, 143.0, 76.0, 43.0, 19.0, 21.0, 10.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8671875, -4.730133056640625, -4.59307861328125, -4.456024169921875, -4.3189697265625, -4.181915283203125, -4.04486083984375, -3.907806396484375, -3.770751953125, -3.633697509765625, -3.49664306640625, -3.359588623046875, -3.2225341796875, -3.085479736328125, -2.94842529296875, -2.811370849609375, -2.67431640625, -2.537261962890625, -2.40020751953125, -2.263153076171875, -2.1260986328125, -1.989044189453125, -1.85198974609375, -1.714935302734375, -1.577880859375, -1.440826416015625, -1.30377197265625, -1.166717529296875, -1.0296630859375, -0.892608642578125, -0.75555419921875, -0.618499755859375, -0.4814453125, -0.344390869140625, -0.20733642578125, -0.070281982421875, 0.0667724609375, 0.203826904296875, 0.34088134765625, 0.477935791015625, 0.614990234375, 0.752044677734375, 0.88909912109375, 1.026153564453125, 1.1632080078125, 1.300262451171875, 1.43731689453125, 1.574371337890625, 1.71142578125, 1.848480224609375, 1.98553466796875, 2.122589111328125, 2.2596435546875, 2.396697998046875, 2.53375244140625, 2.670806884765625, 2.807861328125, 2.944915771484375, 3.08197021484375, 3.219024658203125, 3.3560791015625, 3.493133544921875, 3.63018798828125, 3.767242431640625, 3.904296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 12.0, 22.0, 29.0, 71.0, 87.0, 127.0, 158.0, 151.0, 108.0, 79.0, 64.0, 34.0, 21.0, 11.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82568359375, -0.7960739135742188, -0.7664642333984375, -0.7368545532226562, -0.707244873046875, -0.6776351928710938, -0.6480255126953125, -0.6184158325195312, -0.58880615234375, -0.5591964721679688, -0.5295867919921875, -0.49997711181640625, -0.470367431640625, -0.44075775146484375, -0.4111480712890625, -0.38153839111328125, -0.3519287109375, -0.32231903076171875, -0.2927093505859375, -0.26309967041015625, -0.233489990234375, -0.20388031005859375, -0.1742706298828125, -0.14466094970703125, -0.11505126953125, -0.08544158935546875, -0.0558319091796875, -0.02622222900390625, 0.003387451171875, 0.03299713134765625, 0.0626068115234375, 0.09221649169921875, 0.121826171875, 0.15143585205078125, 0.1810455322265625, 0.21065521240234375, 0.240264892578125, 0.26987457275390625, 0.2994842529296875, 0.32909393310546875, 0.35870361328125, 0.38831329345703125, 0.4179229736328125, 0.44753265380859375, 0.477142333984375, 0.5067520141601562, 0.5363616943359375, 0.5659713745117188, 0.5955810546875, 0.6251907348632812, 0.6548004150390625, 0.6844100952148438, 0.714019775390625, 0.7436294555664062, 0.7732391357421875, 0.8028488159179688, 0.83245849609375, 0.8620681762695312, 0.8916778564453125, 0.9212875366210938, 0.950897216796875, 0.9805068969726562, 1.0101165771484375, 1.0397262573242188, 1.0693359375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 9.0, 11.0, 18.0, 20.0, 26.0, 42.0, 52.0, 53.0, 58.0, 87.0, 87.0, 88.0, 92.0, 87.0, 73.0, 49.0, 46.0, 35.0, 23.0, 15.0, 12.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.76408576965332, -10.501669883728027, -10.239253997802734, -9.976838111877441, -9.714422225952148, -9.452006340026855, -9.189590454101562, -8.92717456817627, -8.664758682250977, -8.402342796325684, -8.13992691040039, -7.877511024475098, -7.615095138549805, -7.352679252624512, -7.090263366699219, -6.827847480773926, -6.565432071685791, -6.303016185760498, -6.040600299835205, -5.778184413909912, -5.515768527984619, -5.253352642059326, -4.990937232971191, -4.728521347045898, -4.4661054611206055, -4.2036895751953125, -3.9412736892700195, -3.6788578033447266, -3.4164419174194336, -3.1540260314941406, -2.8916103839874268, -2.629194498062134, -2.3667778968811035, -2.1043620109558105, -1.8419461250305176, -1.5795303583145142, -1.3171144723892212, -1.0546985864639282, -0.7922828197479248, -0.5298669338226318, -0.26745104789733887, -0.005035191774368286, 0.2573806643486023, 0.5197964906692505, 0.7822123765945435, 1.0446282625198364, 1.3070440292358398, 1.5694599151611328, 1.8318758010864258, 2.0942916870117188, 2.3567075729370117, 2.6191234588623047, 2.8815393447875977, 3.1439552307128906, 3.4063708782196045, 3.6687867641448975, 3.9312026500701904, 4.193618297576904, 4.456034183502197, 4.71845006942749, 4.980865955352783, 5.243281841278076, 5.505697727203369, 5.768113613128662, 6.030529499053955]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 4.0, 13.0, 10.0, 9.0, 16.0, 16.0, 20.0, 19.0, 25.0, 20.0, 31.0, 22.0, 36.0, 32.0, 45.0, 44.0, 33.0, 46.0, 42.0, 50.0, 30.0, 42.0, 36.0, 27.0, 21.0, 34.0, 35.0, 23.0, 29.0, 23.0, 19.0, 22.0, 27.0, 22.0, 8.0, 8.0, 13.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.694212913513184, -11.369037628173828, -11.043863296508789, -10.718688011169434, -10.393512725830078, -10.068337440490723, -9.743162155151367, -9.417987823486328, -9.092812538146973, -8.767637252807617, -8.442462921142578, -8.117287635803223, -7.792112350463867, -7.466937065124512, -7.1417622566223145, -6.816587448120117, -6.491412162780762, -6.166236877441406, -5.841062068939209, -5.515887260437012, -5.190711975097656, -4.865536689758301, -4.5403618812561035, -4.215187072753906, -3.890011787414551, -3.5648367404937744, -3.239661693572998, -2.9144866466522217, -2.5893115997314453, -2.264136552810669, -1.9389615058898926, -1.6137864589691162, -1.2886123657226562, -0.9634373188018799, -0.6382622718811035, -0.31308722496032715, 0.012087821960449219, 0.3372628688812256, 0.662437915802002, 0.9876129627227783, 1.3127880096435547, 1.637963056564331, 1.9631381034851074, 2.288313150405884, 2.61348819732666, 2.9386632442474365, 3.263838291168213, 3.5890133380889893, 3.9141883850097656, 4.239363670349121, 4.564538478851318, 4.889713287353516, 5.214888572692871, 5.540063858032227, 5.865238666534424, 6.190413475036621, 6.515588760375977, 6.840764045715332, 7.165938854217529, 7.491113662719727, 7.816288948059082, 8.141464233398438, 8.466638565063477, 8.791813850402832, 9.116989135742188]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 6.0, 3.0, 1.0, 6.0, 10.0, 8.0, 18.0, 14.0, 24.0, 37.0, 41.0, 69.0, 106.0, 140.0, 265.0, 465.0, 1164.0, 3899.0, 19349.0, 139522.0, 1061807.0, 2259843.0, 620578.0, 72017.0, 11013.0, 2410.0, 660.0, 283.0, 147.0, 102.0, 66.0, 47.0, 31.0, 21.0, 19.0, 24.0, 19.0, 14.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.20703125, -6.9771728515625, -6.747314453125, -6.5174560546875, -6.28759765625, -6.0577392578125, -5.827880859375, -5.5980224609375, -5.3681640625, -5.1383056640625, -4.908447265625, -4.6785888671875, -4.44873046875, -4.2188720703125, -3.989013671875, -3.7591552734375, -3.529296875, -3.2994384765625, -3.069580078125, -2.8397216796875, -2.60986328125, -2.3800048828125, -2.150146484375, -1.9202880859375, -1.6904296875, -1.4605712890625, -1.230712890625, -1.0008544921875, -0.77099609375, -0.5411376953125, -0.311279296875, -0.0814208984375, 0.1484375, 0.3782958984375, 0.608154296875, 0.8380126953125, 1.06787109375, 1.2977294921875, 1.527587890625, 1.7574462890625, 1.9873046875, 2.2171630859375, 2.447021484375, 2.6768798828125, 2.90673828125, 3.1365966796875, 3.366455078125, 3.5963134765625, 3.826171875, 4.0560302734375, 4.285888671875, 4.5157470703125, 4.74560546875, 4.9754638671875, 5.205322265625, 5.4351806640625, 5.6650390625, 5.8948974609375, 6.124755859375, 6.3546142578125, 6.58447265625, 6.8143310546875, 7.044189453125, 7.2740478515625, 7.50390625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 6.0, 13.0, 17.0, 17.0, 19.0, 24.0, 23.0, 33.0, 37.0, 41.0, 42.0, 52.0, 42.0, 59.0, 63.0, 42.0, 45.0, 53.0, 46.0, 40.0, 41.0, 39.0, 27.0, 28.0, 29.0, 21.0, 25.0, 18.0, 9.0, 12.0, 7.0, 9.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1640625, -4.02703857421875, -3.8900146484375, -3.75299072265625, -3.615966796875, -3.47894287109375, -3.3419189453125, -3.20489501953125, -3.06787109375, -2.93084716796875, -2.7938232421875, -2.65679931640625, -2.519775390625, -2.38275146484375, -2.2457275390625, -2.10870361328125, -1.9716796875, -1.83465576171875, -1.6976318359375, -1.56060791015625, -1.423583984375, -1.28656005859375, -1.1495361328125, -1.01251220703125, -0.87548828125, -0.73846435546875, -0.6014404296875, -0.46441650390625, -0.327392578125, -0.19036865234375, -0.0533447265625, 0.08367919921875, 0.220703125, 0.35772705078125, 0.4947509765625, 0.63177490234375, 0.768798828125, 0.90582275390625, 1.0428466796875, 1.17987060546875, 1.31689453125, 1.45391845703125, 1.5909423828125, 1.72796630859375, 1.864990234375, 2.00201416015625, 2.1390380859375, 2.27606201171875, 2.4130859375, 2.55010986328125, 2.6871337890625, 2.82415771484375, 2.961181640625, 3.09820556640625, 3.2352294921875, 3.37225341796875, 3.50927734375, 3.64630126953125, 3.7833251953125, 3.92034912109375, 4.057373046875, 4.19439697265625, 4.3314208984375, 4.46844482421875, 4.60546875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 6.0, 2.0, 14.0, 12.0, 24.0, 46.0, 73.0, 197.0, 493.0, 2469.0, 3795448.0, 393405.0, 1436.0, 358.0, 136.0, 81.0, 40.0, 13.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.71875, -41.560302734375, -40.40185546875, -39.243408203125, -38.0849609375, -36.926513671875, -35.76806640625, -34.609619140625, -33.451171875, -32.292724609375, -31.13427734375, -29.975830078125, -28.8173828125, -27.658935546875, -26.50048828125, -25.342041015625, -24.18359375, -23.025146484375, -21.86669921875, -20.708251953125, -19.5498046875, -18.391357421875, -17.23291015625, -16.074462890625, -14.916015625, -13.757568359375, -12.59912109375, -11.440673828125, -10.2822265625, -9.123779296875, -7.96533203125, -6.806884765625, -5.6484375, -4.489990234375, -3.33154296875, -2.173095703125, -1.0146484375, 0.143798828125, 1.30224609375, 2.460693359375, 3.619140625, 4.777587890625, 5.93603515625, 7.094482421875, 8.2529296875, 9.411376953125, 10.56982421875, 11.728271484375, 12.88671875, 14.045166015625, 15.20361328125, 16.362060546875, 17.5205078125, 18.678955078125, 19.83740234375, 20.995849609375, 22.154296875, 23.312744140625, 24.47119140625, 25.629638671875, 26.7880859375, 27.946533203125, 29.10498046875, 30.263427734375, 31.421875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 6.0, 13.0, 18.0, 26.0, 38.0, 35.0, 67.0, 68.0, 101.0, 126.0, 155.0, 195.0, 251.0, 321.0, 385.0, 354.0, 371.0, 334.0, 280.0, 223.0, 173.0, 126.0, 108.0, 62.0, 49.0, 34.0, 20.0, 28.0, 25.0, 15.0, 8.0, 14.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814453125, -1.7605438232421875, -1.706634521484375, -1.6527252197265625, -1.59881591796875, -1.5449066162109375, -1.490997314453125, -1.4370880126953125, -1.3831787109375, -1.3292694091796875, -1.275360107421875, -1.2214508056640625, -1.16754150390625, -1.1136322021484375, -1.059722900390625, -1.0058135986328125, -0.951904296875, -0.8979949951171875, -0.844085693359375, -0.7901763916015625, -0.73626708984375, -0.6823577880859375, -0.628448486328125, -0.5745391845703125, -0.5206298828125, -0.4667205810546875, -0.412811279296875, -0.3589019775390625, -0.30499267578125, -0.2510833740234375, -0.197174072265625, -0.1432647705078125, -0.08935546875, -0.0354461669921875, 0.018463134765625, 0.0723724365234375, 0.12628173828125, 0.1801910400390625, 0.234100341796875, 0.2880096435546875, 0.3419189453125, 0.3958282470703125, 0.449737548828125, 0.5036468505859375, 0.55755615234375, 0.6114654541015625, 0.665374755859375, 0.7192840576171875, 0.773193359375, 0.8271026611328125, 0.881011962890625, 0.9349212646484375, 0.98883056640625, 1.0427398681640625, 1.096649169921875, 1.1505584716796875, 1.2044677734375, 1.2583770751953125, 1.312286376953125, 1.3661956787109375, 1.42010498046875, 1.4740142822265625, 1.527923583984375, 1.5818328857421875, 1.6357421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 10.0, 22.0, 43.0, 56.0, 133.0, 168.0, 159.0, 164.0, 121.0, 79.0, 30.0, 15.0, 9.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.579390048980713, -4.14121675491333, -3.7030434608459473, -3.2648701667785645, -2.8266968727111816, -2.388523817062378, -1.9503505229949951, -1.5121772289276123, -1.0740039348602295, -0.6358306407928467, -0.19765740633010864, 0.2405158281326294, 0.6786891222000122, 1.1168622970581055, 1.5550355911254883, 1.993208885192871, 2.431382179260254, 2.8695554733276367, 3.3077287673950195, 3.7459020614624023, 4.184075355529785, 4.622248649597168, 5.060421943664551, 5.498595237731934, 5.936768531799316, 6.374941825866699, 6.813115119934082, 7.251288414001465, 7.689461708068848, 8.12763500213623, 8.565808296203613, 9.003981590270996, 9.442154884338379, 9.880328178405762, 10.318501472473145, 10.756674766540527, 11.19484806060791, 11.633021354675293, 12.071194648742676, 12.509367942810059, 12.947541236877441, 13.385714530944824, 13.823887825012207, 14.26206111907959, 14.700234413146973, 15.138407707214355, 15.576581001281738, 16.014753341674805, 16.452926635742188, 16.89109992980957, 17.329273223876953, 17.767446517944336, 18.20561981201172, 18.6437931060791, 19.081966400146484, 19.520139694213867, 19.95831298828125, 20.396486282348633, 20.834659576416016, 21.2728328704834, 21.71100616455078, 22.149179458618164, 22.587352752685547, 23.02552604675293, 23.463699340820312]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 10.0, 7.0, 4.0, 13.0, 12.0, 15.0, 20.0, 21.0, 13.0, 23.0, 16.0, 32.0, 31.0, 31.0, 25.0, 29.0, 40.0, 46.0, 43.0, 30.0, 35.0, 50.0, 42.0, 45.0, 42.0, 37.0, 28.0, 24.0, 21.0, 26.0, 17.0, 22.0, 25.0, 17.0, 10.0, 10.0, 11.0, 11.0, 7.0, 7.0, 10.0, 8.0, 6.0, 6.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.3748116493225098, -3.2615673542022705, -3.1483232975006104, -3.035079002380371, -2.921834707260132, -2.8085904121398926, -2.6953463554382324, -2.582102060317993, -2.468857765197754, -2.3556134700775146, -2.2423694133758545, -2.1291251182556152, -2.015880823135376, -1.9026366472244263, -1.7893924713134766, -1.6761481761932373, -1.5629041194915771, -1.4496599435806274, -1.3364156484603882, -1.2231714725494385, -1.1099271774291992, -0.9966830015182495, -0.8834388256072998, -0.7701945900917053, -0.6569503545761108, -0.5437061190605164, -0.43046191334724426, -0.31721770763397217, -0.20397347211837769, -0.0907292366027832, 0.022514939308166504, 0.135759174823761, 0.24900341033935547, 0.36224764585494995, 0.47549185156822205, 0.5887360572814941, 0.7019802927970886, 0.8152245283126831, 0.9284687042236328, 1.041712999343872, 1.1549571752548218, 1.2682013511657715, 1.3814456462860107, 1.4946898221969604, 1.6079339981079102, 1.7211782932281494, 1.8344224691390991, 1.9476666450500488, 2.060910940170288, 2.1741552352905273, 2.2873992919921875, 2.4006435871124268, 2.513887882232666, 2.627131938934326, 2.7403762340545654, 2.8536205291748047, 2.966864585876465, 3.080108880996704, 3.1933529376983643, 3.3065972328186035, 3.4198415279388428, 3.533085823059082, 3.646329879760742, 3.7595741748809814, 3.8728184700012207]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 6.0, 10.0, 17.0, 36.0, 54.0, 84.0, 119.0, 183.0, 374.0, 590.0, 897.0, 1536.0, 2536.0, 4820.0, 14282.0, 128138.0, 683076.0, 181452.0, 18110.0, 5255.0, 2731.0, 1676.0, 982.0, 594.0, 375.0, 238.0, 122.0, 91.0, 55.0, 36.0, 20.0, 14.0, 11.0, 5.0, 5.0, 2.0, 6.0, 3.0, 0.0, 3.0], "bins": [-1.6484375, -1.6078033447265625, -1.567169189453125, -1.5265350341796875, -1.48590087890625, -1.4452667236328125, -1.404632568359375, -1.3639984130859375, -1.3233642578125, -1.2827301025390625, -1.242095947265625, -1.2014617919921875, -1.16082763671875, -1.1201934814453125, -1.079559326171875, -1.0389251708984375, -0.998291015625, -0.9576568603515625, -0.917022705078125, -0.8763885498046875, -0.83575439453125, -0.7951202392578125, -0.754486083984375, -0.7138519287109375, -0.6732177734375, -0.6325836181640625, -0.591949462890625, -0.5513153076171875, -0.51068115234375, -0.4700469970703125, -0.429412841796875, -0.3887786865234375, -0.34814453125, -0.3075103759765625, -0.266876220703125, -0.2262420654296875, -0.18560791015625, -0.1449737548828125, -0.104339599609375, -0.0637054443359375, -0.0230712890625, 0.0175628662109375, 0.058197021484375, 0.0988311767578125, 0.13946533203125, 0.1800994873046875, 0.220733642578125, 0.2613677978515625, 0.302001953125, 0.3426361083984375, 0.383270263671875, 0.4239044189453125, 0.46453857421875, 0.5051727294921875, 0.545806884765625, 0.5864410400390625, 0.6270751953125, 0.6677093505859375, 0.708343505859375, 0.7489776611328125, 0.78961181640625, 0.8302459716796875, 0.870880126953125, 0.9115142822265625, 0.9521484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 5.0, 8.0, 16.0, 12.0, 17.0, 14.0, 16.0, 35.0, 35.0, 36.0, 20.0, 50.0, 42.0, 49.0, 46.0, 54.0, 70.0, 62.0, 48.0, 52.0, 43.0, 39.0, 41.0, 30.0, 32.0, 18.0, 15.0, 19.0, 23.0, 15.0, 9.0, 6.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.18792724609375, -2.0906982421875, -1.99346923828125, -1.896240234375, -1.79901123046875, -1.7017822265625, -1.60455322265625, -1.50732421875, -1.41009521484375, -1.3128662109375, -1.21563720703125, -1.118408203125, -1.02117919921875, -0.9239501953125, -0.82672119140625, -0.7294921875, -0.63226318359375, -0.5350341796875, -0.43780517578125, -0.340576171875, -0.24334716796875, -0.1461181640625, -0.04888916015625, 0.04833984375, 0.14556884765625, 0.2427978515625, 0.34002685546875, 0.437255859375, 0.53448486328125, 0.6317138671875, 0.72894287109375, 0.826171875, 0.92340087890625, 1.0206298828125, 1.11785888671875, 1.215087890625, 1.31231689453125, 1.4095458984375, 1.50677490234375, 1.60400390625, 1.70123291015625, 1.7984619140625, 1.89569091796875, 1.992919921875, 2.09014892578125, 2.1873779296875, 2.28460693359375, 2.3818359375, 2.47906494140625, 2.5762939453125, 2.67352294921875, 2.770751953125, 2.86798095703125, 2.9652099609375, 3.06243896484375, 3.15966796875, 3.25689697265625, 3.3541259765625, 3.45135498046875, 3.548583984375, 3.64581298828125, 3.7430419921875, 3.84027099609375, 3.9375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 8.0, 10.0, 9.0, 27.0, 27.0, 49.0, 75.0, 119.0, 222.0, 439.0, 905.0, 1781.0, 3606.0, 7392.0, 14966.0, 31104.0, 64726.0, 124038.0, 202728.0, 232767.0, 172379.0, 97242.0, 48562.0, 23269.0, 11147.0, 5474.0, 2703.0, 1330.0, 675.0, 338.0, 150.0, 119.0, 61.0, 42.0, 19.0, 15.0, 5.0, 2.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.261962890625, -0.25331878662109375, -0.2446746826171875, -0.23603057861328125, -0.227386474609375, -0.21874237060546875, -0.2100982666015625, -0.20145416259765625, -0.19281005859375, -0.18416595458984375, -0.1755218505859375, -0.16687774658203125, -0.158233642578125, -0.14958953857421875, -0.1409454345703125, -0.13230133056640625, -0.1236572265625, -0.11501312255859375, -0.1063690185546875, -0.09772491455078125, -0.089080810546875, -0.08043670654296875, -0.0717926025390625, -0.06314849853515625, -0.05450439453125, -0.04586029052734375, -0.0372161865234375, -0.02857208251953125, -0.019927978515625, -0.01128387451171875, -0.0026397705078125, 0.00600433349609375, 0.0146484375, 0.02329254150390625, 0.0319366455078125, 0.04058074951171875, 0.049224853515625, 0.05786895751953125, 0.0665130615234375, 0.07515716552734375, 0.08380126953125, 0.09244537353515625, 0.1010894775390625, 0.10973358154296875, 0.118377685546875, 0.12702178955078125, 0.1356658935546875, 0.14430999755859375, 0.1529541015625, 0.16159820556640625, 0.1702423095703125, 0.17888641357421875, 0.187530517578125, 0.19617462158203125, 0.2048187255859375, 0.21346282958984375, 0.22210693359375, 0.23075103759765625, 0.2393951416015625, 0.24803924560546875, 0.256683349609375, 0.26532745361328125, 0.2739715576171875, 0.28261566162109375, 0.291259765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 5.0, 10.0, 12.0, 10.0, 12.0, 19.0, 14.0, 16.0, 21.0, 32.0, 34.0, 37.0, 34.0, 46.0, 55.0, 67.0, 56.0, 68.0, 67.0, 37.0, 63.0, 26.0, 46.0, 38.0, 36.0, 21.0, 13.0, 16.0, 24.0, 16.0, 10.0, 8.0, 5.0, 5.0, 2.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.546875, -5.369140625, -5.19140625, -5.013671875, -4.8359375, -4.658203125, -4.48046875, -4.302734375, -4.125, -3.947265625, -3.76953125, -3.591796875, -3.4140625, -3.236328125, -3.05859375, -2.880859375, -2.703125, -2.525390625, -2.34765625, -2.169921875, -1.9921875, -1.814453125, -1.63671875, -1.458984375, -1.28125, -1.103515625, -0.92578125, -0.748046875, -0.5703125, -0.392578125, -0.21484375, -0.037109375, 0.140625, 0.318359375, 0.49609375, 0.673828125, 0.8515625, 1.029296875, 1.20703125, 1.384765625, 1.5625, 1.740234375, 1.91796875, 2.095703125, 2.2734375, 2.451171875, 2.62890625, 2.806640625, 2.984375, 3.162109375, 3.33984375, 3.517578125, 3.6953125, 3.873046875, 4.05078125, 4.228515625, 4.40625, 4.583984375, 4.76171875, 4.939453125, 5.1171875, 5.294921875, 5.47265625, 5.650390625, 5.828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 7.0, 9.0, 12.0, 18.0, 26.0, 28.0, 42.0, 78.0, 106.0, 159.0, 275.0, 440.0, 702.0, 1214.0, 2505.0, 6270.0, 21068.0, 132440.0, 647862.0, 194091.0, 27470.0, 7612.0, 2872.0, 1414.0, 738.0, 413.0, 252.0, 135.0, 108.0, 43.0, 43.0, 26.0, 28.0, 17.0, 12.0, 9.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0853271484375, -0.08234214782714844, -0.07935714721679688, -0.07637214660644531, -0.07338714599609375, -0.07040214538574219, -0.06741714477539062, -0.06443214416503906, -0.0614471435546875, -0.05846214294433594, -0.055477142333984375, -0.05249214172363281, -0.04950714111328125, -0.04652214050292969, -0.043537139892578125, -0.04055213928222656, -0.037567138671875, -0.03458213806152344, -0.031597137451171875, -0.028612136840820312, -0.02562713623046875, -0.022642135620117188, -0.019657135009765625, -0.016672134399414062, -0.0136871337890625, -0.010702133178710938, -0.007717132568359375, -0.0047321319580078125, -0.00174713134765625, 0.0012378692626953125, 0.004222869873046875, 0.0072078704833984375, 0.01019287109375, 0.013177871704101562, 0.016162872314453125, 0.019147872924804688, 0.02213287353515625, 0.025117874145507812, 0.028102874755859375, 0.031087875366210938, 0.0340728759765625, 0.03705787658691406, 0.040042877197265625, 0.04302787780761719, 0.04601287841796875, 0.04899787902832031, 0.051982879638671875, 0.05496788024902344, 0.057952880859375, 0.06093788146972656, 0.06392288208007812, 0.06690788269042969, 0.06989288330078125, 0.07287788391113281, 0.07586288452148438, 0.07884788513183594, 0.0818328857421875, 0.08481788635253906, 0.08780288696289062, 0.09078788757324219, 0.09377288818359375, 0.09675788879394531, 0.09974288940429688, 0.10272789001464844, 0.105712890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 8.0, 16.0, 16.0, 21.0, 29.0, 25.0, 47.0, 68.0, 76.0, 93.0, 121.0, 75.0, 83.0, 87.0, 60.0, 53.0, 30.0, 22.0, 18.0, 13.0, 12.0, 3.0, 8.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26173210144043e-05, -4.090741276741028e-05, -3.919750452041626e-05, -3.748759627342224e-05, -3.577768802642822e-05, -3.4067779779434204e-05, -3.2357871532440186e-05, -3.064796328544617e-05, -2.893805503845215e-05, -2.722814679145813e-05, -2.551823854446411e-05, -2.3808330297470093e-05, -2.2098422050476074e-05, -2.0388513803482056e-05, -1.8678605556488037e-05, -1.696869730949402e-05, -1.52587890625e-05, -1.3548880815505981e-05, -1.1838972568511963e-05, -1.0129064321517944e-05, -8.419156074523926e-06, -6.709247827529907e-06, -4.999339580535889e-06, -3.28943133354187e-06, -1.5795230865478516e-06, 1.30385160446167e-07, 1.8402934074401855e-06, 3.550201654434204e-06, 5.260109901428223e-06, 6.970018148422241e-06, 8.67992639541626e-06, 1.0389834642410278e-05, 1.2099742889404297e-05, 1.3809651136398315e-05, 1.5519559383392334e-05, 1.7229467630386353e-05, 1.893937587738037e-05, 2.064928412437439e-05, 2.2359192371368408e-05, 2.4069100618362427e-05, 2.5779008865356445e-05, 2.7488917112350464e-05, 2.9198825359344482e-05, 3.09087336063385e-05, 3.261864185333252e-05, 3.432855010032654e-05, 3.603845834732056e-05, 3.7748366594314575e-05, 3.9458274841308594e-05, 4.116818308830261e-05, 4.287809133529663e-05, 4.458799958229065e-05, 4.629790782928467e-05, 4.8007816076278687e-05, 4.9717724323272705e-05, 5.1427632570266724e-05, 5.313754081726074e-05, 5.484744906425476e-05, 5.655735731124878e-05, 5.82672655582428e-05, 5.9977173805236816e-05, 6.168708205223083e-05, 6.339699029922485e-05, 6.510689854621887e-05, 6.681680679321289e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 13.0, 30.0, 64.0, 187.0, 532.0, 1610.0, 5887.0, 182114.0, 845639.0, 9259.0, 2100.0, 669.0, 250.0, 93.0, 43.0, 13.0, 14.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317138671875, -0.30625152587890625, -0.2953643798828125, -0.28447723388671875, -0.273590087890625, -0.26270294189453125, -0.2518157958984375, -0.24092864990234375, -0.23004150390625, -0.21915435791015625, -0.2082672119140625, -0.19738006591796875, -0.186492919921875, -0.17560577392578125, -0.1647186279296875, -0.15383148193359375, -0.1429443359375, -0.13205718994140625, -0.1211700439453125, -0.11028289794921875, -0.099395751953125, -0.08850860595703125, -0.0776214599609375, -0.06673431396484375, -0.05584716796875, -0.04496002197265625, -0.0340728759765625, -0.02318572998046875, -0.012298583984375, -0.00141143798828125, 0.0094757080078125, 0.02036285400390625, 0.03125, 0.04213714599609375, 0.0530242919921875, 0.06391143798828125, 0.074798583984375, 0.08568572998046875, 0.0965728759765625, 0.10746002197265625, 0.11834716796875, 0.12923431396484375, 0.1401214599609375, 0.15100860595703125, 0.161895751953125, 0.17278289794921875, 0.1836700439453125, 0.19455718994140625, 0.2054443359375, 0.21633148193359375, 0.2272186279296875, 0.23810577392578125, 0.248992919921875, 0.25988006591796875, 0.2707672119140625, 0.28165435791015625, 0.29254150390625, 0.30342864990234375, 0.3143157958984375, 0.32520294189453125, 0.336090087890625, 0.34697723388671875, 0.3578643798828125, 0.36875152587890625, 0.379638671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 6.0, 9.0, 13.0, 17.0, 21.0, 47.0, 59.0, 104.0, 163.0, 180.0, 144.0, 78.0, 52.0, 28.0, 16.0, 11.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.026056289672851562, -0.025135040283203125, -0.024213790893554688, -0.02329254150390625, -0.022371292114257812, -0.021450042724609375, -0.020528793334960938, -0.0196075439453125, -0.018686294555664062, -0.017765045166015625, -0.016843795776367188, -0.01592254638671875, -0.015001296997070312, -0.014080047607421875, -0.013158798217773438, -0.012237548828125, -0.011316299438476562, -0.010395050048828125, -0.009473800659179688, -0.00855255126953125, -0.0076313018798828125, -0.006710052490234375, -0.0057888031005859375, -0.0048675537109375, -0.0039463043212890625, -0.003025054931640625, -0.0021038055419921875, -0.00118255615234375, -0.0002613067626953125, 0.000659942626953125, 0.0015811920166015625, 0.00250244140625, 0.0034236907958984375, 0.004344940185546875, 0.0052661895751953125, 0.00618743896484375, 0.0071086883544921875, 0.008029937744140625, 0.008951187133789062, 0.0098724365234375, 0.010793685913085938, 0.011714935302734375, 0.012636184692382812, 0.01355743408203125, 0.014478683471679688, 0.015399932861328125, 0.016321182250976562, 0.017242431640625, 0.018163681030273438, 0.019084930419921875, 0.020006179809570312, 0.02092742919921875, 0.021848678588867188, 0.022769927978515625, 0.023691177368164062, 0.0246124267578125, 0.025533676147460938, 0.026454925537109375, 0.027376174926757812, 0.02829742431640625, 0.029218673706054688, 0.030139923095703125, 0.031061172485351562, 0.031982421875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 15.0, 19.0, 19.0, 23.0, 29.0, 55.0, 73.0, 83.0, 72.0, 83.0, 77.0, 81.0, 81.0, 65.0, 66.0, 47.0, 37.0, 18.0, 12.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0147171020507812, -2.890411615371704, -2.766105890274048, -2.6418004035949707, -2.5174946784973145, -2.3931891918182373, -2.268883466720581, -2.144577980041504, -2.0202722549438477, -1.895966649055481, -1.7716610431671143, -1.6473554372787476, -1.5230498313903809, -1.3987443447113037, -1.2744386196136475, -1.1501331329345703, -1.0258275270462036, -0.9015219211578369, -0.7772163152694702, -0.6529107093811035, -0.5286051034927368, -0.4042995572090149, -0.2799939513206482, -0.1556883454322815, -0.031382739543914795, 0.09292285889387131, 0.2172284573316574, 0.3415340483188629, 0.4658396542072296, 0.5901452302932739, 0.7144508361816406, 0.8387564420700073, 0.963062047958374, 1.0873676538467407, 1.2116732597351074, 1.3359788656234741, 1.4602844715118408, 1.584589958190918, 1.7088956832885742, 1.8332011699676514, 1.9575068950653076, 2.0818123817443848, 2.206118106842041, 2.330423593521118, 2.4547293186187744, 2.5790348052978516, 2.703340530395508, 2.827646017074585, 2.951951503753662, 3.0762569904327393, 3.2005627155303955, 3.3248682022094727, 3.449173927307129, 3.573479413986206, 3.6977851390838623, 3.8220906257629395, 3.9463963508605957, 4.070702075958252, 4.19500732421875, 4.319313049316406, 4.4436187744140625, 4.567924499511719, 4.692229747772217, 4.816535472869873, 4.940841197967529]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 6.0, 8.0, 10.0, 13.0, 11.0, 19.0, 19.0, 24.0, 23.0, 18.0, 28.0, 36.0, 30.0, 32.0, 42.0, 46.0, 49.0, 43.0, 47.0, 48.0, 58.0, 55.0, 43.0, 36.0, 33.0, 23.0, 25.0, 26.0, 26.0, 24.0, 14.0, 12.0, 9.0, 10.0, 10.0, 11.0, 9.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.269278049468994, -2.1899757385253906, -2.110673427581787, -2.0313708782196045, -1.952068567276001, -1.8727662563323975, -1.7934638261795044, -1.7141613960266113, -1.6348590850830078, -1.5555567741394043, -1.4762543439865112, -1.3969519138336182, -1.3176496028900146, -1.2383472919464111, -1.159044861793518, -1.079742431640625, -1.0004401206970215, -0.9211377501487732, -0.8418353796005249, -0.7625330090522766, -0.6832306385040283, -0.60392826795578, -0.5246258974075317, -0.44532352685928345, -0.36602115631103516, -0.28671878576278687, -0.20741641521453857, -0.12811404466629028, -0.04881167411804199, 0.0304906964302063, 0.10979306697845459, 0.18909543752670288, 0.26839780807495117, 0.34770017862319946, 0.42700254917144775, 0.506304919719696, 0.5856072902679443, 0.6649096608161926, 0.7442120313644409, 0.8235144019126892, 0.9028167724609375, 0.9821191430091858, 1.061421513557434, 1.1407239437103271, 1.2200262546539307, 1.2993285655975342, 1.3786309957504272, 1.4579334259033203, 1.5372357368469238, 1.6165380477905273, 1.6958404779434204, 1.7751429080963135, 1.854445219039917, 1.9337475299835205, 2.013050079345703, 2.0923523902893066, 2.17165470123291, 2.2509570121765137, 2.330259323120117, 2.4095618724823, 2.4888641834259033, 2.568166494369507, 2.6474690437316895, 2.726771354675293, 2.8060736656188965]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 7.0, 15.0, 19.0, 14.0, 37.0, 52.0, 66.0, 92.0, 136.0, 243.0, 411.0, 743.0, 1245.0, 2101.0, 4051.0, 7320.0, 14065.0, 29786.0, 64835.0, 137096.0, 248483.0, 255580.0, 147124.0, 69903.0, 32365.0, 15253.0, 7882.0, 4109.0, 2307.0, 1302.0, 744.0, 382.0, 275.0, 157.0, 121.0, 57.0, 39.0, 30.0, 21.0, 18.0, 17.0, 12.0, 5.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0], "bins": [-2.14453125, -2.083343505859375, -2.02215576171875, -1.960968017578125, -1.8997802734375, -1.838592529296875, -1.77740478515625, -1.716217041015625, -1.655029296875, -1.593841552734375, -1.53265380859375, -1.471466064453125, -1.4102783203125, -1.349090576171875, -1.28790283203125, -1.226715087890625, -1.16552734375, -1.104339599609375, -1.04315185546875, -0.981964111328125, -0.9207763671875, -0.859588623046875, -0.79840087890625, -0.737213134765625, -0.676025390625, -0.614837646484375, -0.55364990234375, -0.492462158203125, -0.4312744140625, -0.370086669921875, -0.30889892578125, -0.247711181640625, -0.1865234375, -0.125335693359375, -0.06414794921875, -0.002960205078125, 0.0582275390625, 0.119415283203125, 0.18060302734375, 0.241790771484375, 0.302978515625, 0.364166259765625, 0.42535400390625, 0.486541748046875, 0.5477294921875, 0.608917236328125, 0.67010498046875, 0.731292724609375, 0.79248046875, 0.853668212890625, 0.91485595703125, 0.976043701171875, 1.0372314453125, 1.098419189453125, 1.15960693359375, 1.220794677734375, 1.281982421875, 1.343170166015625, 1.40435791015625, 1.465545654296875, 1.5267333984375, 1.587921142578125, 1.64910888671875, 1.710296630859375, 1.771484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 7.0, 5.0, 18.0, 11.0, 18.0, 15.0, 20.0, 14.0, 22.0, 30.0, 35.0, 30.0, 47.0, 41.0, 38.0, 40.0, 53.0, 50.0, 57.0, 47.0, 50.0, 44.0, 35.0, 43.0, 35.0, 16.0, 24.0, 27.0, 23.0, 18.0, 10.0, 8.0, 20.0, 15.0, 6.0, 7.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0859375, -4.92730712890625, -4.7686767578125, -4.61004638671875, -4.451416015625, -4.29278564453125, -4.1341552734375, -3.97552490234375, -3.81689453125, -3.65826416015625, -3.4996337890625, -3.34100341796875, -3.182373046875, -3.02374267578125, -2.8651123046875, -2.70648193359375, -2.5478515625, -2.38922119140625, -2.2305908203125, -2.07196044921875, -1.913330078125, -1.75469970703125, -1.5960693359375, -1.43743896484375, -1.27880859375, -1.12017822265625, -0.9615478515625, -0.80291748046875, -0.644287109375, -0.48565673828125, -0.3270263671875, -0.16839599609375, -0.009765625, 0.14886474609375, 0.3074951171875, 0.46612548828125, 0.624755859375, 0.78338623046875, 0.9420166015625, 1.10064697265625, 1.25927734375, 1.41790771484375, 1.5765380859375, 1.73516845703125, 1.893798828125, 2.05242919921875, 2.2110595703125, 2.36968994140625, 2.5283203125, 2.68695068359375, 2.8455810546875, 3.00421142578125, 3.162841796875, 3.32147216796875, 3.4801025390625, 3.63873291015625, 3.79736328125, 3.95599365234375, 4.1146240234375, 4.27325439453125, 4.431884765625, 4.59051513671875, 4.7491455078125, 4.90777587890625, 5.06640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 6.0, 9.0, 10.0, 9.0, 13.0, 9.0, 10.0, 14.0, 24.0, 21.0, 30.0, 32.0, 56.0, 60.0, 98.0, 153.0, 231.0, 633.0, 26660.0, 1009278.0, 9996.0, 475.0, 206.0, 129.0, 79.0, 52.0, 57.0, 48.0, 36.0, 22.0, 26.0, 22.0, 12.0, 3.0, 10.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.078125, -18.470703125, -17.86328125, -17.255859375, -16.6484375, -16.041015625, -15.43359375, -14.826171875, -14.21875, -13.611328125, -13.00390625, -12.396484375, -11.7890625, -11.181640625, -10.57421875, -9.966796875, -9.359375, -8.751953125, -8.14453125, -7.537109375, -6.9296875, -6.322265625, -5.71484375, -5.107421875, -4.5, -3.892578125, -3.28515625, -2.677734375, -2.0703125, -1.462890625, -0.85546875, -0.248046875, 0.359375, 0.966796875, 1.57421875, 2.181640625, 2.7890625, 3.396484375, 4.00390625, 4.611328125, 5.21875, 5.826171875, 6.43359375, 7.041015625, 7.6484375, 8.255859375, 8.86328125, 9.470703125, 10.078125, 10.685546875, 11.29296875, 11.900390625, 12.5078125, 13.115234375, 13.72265625, 14.330078125, 14.9375, 15.544921875, 16.15234375, 16.759765625, 17.3671875, 17.974609375, 18.58203125, 19.189453125, 19.796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 9.0, 7.0, 15.0, 17.0, 17.0, 18.0, 15.0, 20.0, 25.0, 24.0, 28.0, 34.0, 35.0, 35.0, 41.0, 45.0, 49.0, 55.0, 46.0, 52.0, 45.0, 42.0, 40.0, 29.0, 38.0, 33.0, 32.0, 20.0, 27.0, 16.0, 20.0, 12.0, 8.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.38665771484375, -4.2342529296875, -4.08184814453125, -3.929443359375, -3.77703857421875, -3.6246337890625, -3.47222900390625, -3.31982421875, -3.16741943359375, -3.0150146484375, -2.86260986328125, -2.710205078125, -2.55780029296875, -2.4053955078125, -2.25299072265625, -2.1005859375, -1.94818115234375, -1.7957763671875, -1.64337158203125, -1.490966796875, -1.33856201171875, -1.1861572265625, -1.03375244140625, -0.88134765625, -0.72894287109375, -0.5765380859375, -0.42413330078125, -0.271728515625, -0.11932373046875, 0.0330810546875, 0.18548583984375, 0.337890625, 0.49029541015625, 0.6427001953125, 0.79510498046875, 0.947509765625, 1.09991455078125, 1.2523193359375, 1.40472412109375, 1.55712890625, 1.70953369140625, 1.8619384765625, 2.01434326171875, 2.166748046875, 2.31915283203125, 2.4715576171875, 2.62396240234375, 2.7763671875, 2.92877197265625, 3.0811767578125, 3.23358154296875, 3.385986328125, 3.53839111328125, 3.6907958984375, 3.84320068359375, 3.99560546875, 4.14801025390625, 4.3004150390625, 4.45281982421875, 4.605224609375, 4.75762939453125, 4.9100341796875, 5.06243896484375, 5.21484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 7.0, 11.0, 15.0, 17.0, 31.0, 41.0, 58.0, 127.0, 342.0, 1225.0, 9220.0, 465741.0, 558655.0, 11094.0, 1267.0, 337.0, 124.0, 65.0, 35.0, 31.0, 15.0, 16.0, 13.0, 9.0, 1.0, 6.0, 10.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.404296875, -3.298004150390625, -3.19171142578125, -3.085418701171875, -2.9791259765625, -2.872833251953125, -2.76654052734375, -2.660247802734375, -2.553955078125, -2.447662353515625, -2.34136962890625, -2.235076904296875, -2.1287841796875, -2.022491455078125, -1.91619873046875, -1.809906005859375, -1.70361328125, -1.597320556640625, -1.49102783203125, -1.384735107421875, -1.2784423828125, -1.172149658203125, -1.06585693359375, -0.959564208984375, -0.853271484375, -0.746978759765625, -0.64068603515625, -0.534393310546875, -0.4281005859375, -0.321807861328125, -0.21551513671875, -0.109222412109375, -0.0029296875, 0.103363037109375, 0.20965576171875, 0.315948486328125, 0.4222412109375, 0.528533935546875, 0.63482666015625, 0.741119384765625, 0.847412109375, 0.953704833984375, 1.05999755859375, 1.166290283203125, 1.2725830078125, 1.378875732421875, 1.48516845703125, 1.591461181640625, 1.69775390625, 1.804046630859375, 1.91033935546875, 2.016632080078125, 2.1229248046875, 2.229217529296875, 2.33551025390625, 2.441802978515625, 2.548095703125, 2.654388427734375, 2.76068115234375, 2.866973876953125, 2.9732666015625, 3.079559326171875, 3.18585205078125, 3.292144775390625, 3.3984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 9.0, 12.0, 19.0, 11.0, 34.0, 39.0, 39.0, 56.0, 80.0, 71.0, 74.0, 79.0, 81.0, 77.0, 72.0, 61.0, 42.0, 37.0, 19.0, 22.0, 19.0, 6.0, 12.0, 7.0, 6.0, 5.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002384185791015625, -0.00023208186030387878, -0.00022574514150619507, -0.00021940842270851135, -0.00021307170391082764, -0.00020673498511314392, -0.0002003982663154602, -0.0001940615475177765, -0.00018772482872009277, -0.00018138810992240906, -0.00017505139112472534, -0.00016871467232704163, -0.0001623779535293579, -0.0001560412347316742, -0.00014970451593399048, -0.00014336779713630676, -0.00013703107833862305, -0.00013069435954093933, -0.00012435764074325562, -0.0001180209219455719, -0.00011168420314788818, -0.00010534748435020447, -9.901076555252075e-05, -9.267404675483704e-05, -8.633732795715332e-05, -8.00006091594696e-05, -7.366389036178589e-05, -6.732717156410217e-05, -6.099045276641846e-05, -5.465373396873474e-05, -4.8317015171051025e-05, -4.198029637336731e-05, -3.5643577575683594e-05, -2.9306858777999878e-05, -2.2970139980316162e-05, -1.6633421182632446e-05, -1.029670238494873e-05, -3.959983587265015e-06, 2.376735210418701e-06, 8.713454008102417e-06, 1.5050172805786133e-05, 2.138689160346985e-05, 2.7723610401153564e-05, 3.406032919883728e-05, 4.0397047996520996e-05, 4.673376679420471e-05, 5.307048559188843e-05, 5.9407204389572144e-05, 6.574392318725586e-05, 7.208064198493958e-05, 7.841736078262329e-05, 8.475407958030701e-05, 9.109079837799072e-05, 9.742751717567444e-05, 0.00010376423597335815, 0.00011010095477104187, 0.00011643767356872559, 0.0001227743923664093, 0.00012911111116409302, 0.00013544782996177673, 0.00014178454875946045, 0.00014812126755714417, 0.00015445798635482788, 0.0001607947051525116, 0.0001671314239501953]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 8.0, 15.0, 23.0, 41.0, 56.0, 115.0, 266.0, 841.0, 3937.0, 70290.0, 905479.0, 62335.0, 3783.0, 818.0, 270.0, 109.0, 44.0, 51.0, 24.0, 15.0, 6.0, 3.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2265625, -3.12408447265625, -3.0216064453125, -2.91912841796875, -2.816650390625, -2.71417236328125, -2.6116943359375, -2.50921630859375, -2.40673828125, -2.30426025390625, -2.2017822265625, -2.09930419921875, -1.996826171875, -1.89434814453125, -1.7918701171875, -1.68939208984375, -1.5869140625, -1.48443603515625, -1.3819580078125, -1.27947998046875, -1.177001953125, -1.07452392578125, -0.9720458984375, -0.86956787109375, -0.76708984375, -0.66461181640625, -0.5621337890625, -0.45965576171875, -0.357177734375, -0.25469970703125, -0.1522216796875, -0.04974365234375, 0.052734375, 0.15521240234375, 0.2576904296875, 0.36016845703125, 0.462646484375, 0.56512451171875, 0.6676025390625, 0.77008056640625, 0.87255859375, 0.97503662109375, 1.0775146484375, 1.17999267578125, 1.282470703125, 1.38494873046875, 1.4874267578125, 1.58990478515625, 1.6923828125, 1.79486083984375, 1.8973388671875, 1.99981689453125, 2.102294921875, 2.20477294921875, 2.3072509765625, 2.40972900390625, 2.51220703125, 2.61468505859375, 2.7171630859375, 2.81964111328125, 2.922119140625, 3.02459716796875, 3.1270751953125, 3.22955322265625, 3.33203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 26.0, 41.0, 66.0, 96.0, 123.0, 144.0, 156.0, 105.0, 81.0, 47.0, 26.0, 23.0, 21.0, 9.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.986328125, -0.95526123046875, -0.9241943359375, -0.89312744140625, -0.862060546875, -0.83099365234375, -0.7999267578125, -0.76885986328125, -0.73779296875, -0.70672607421875, -0.6756591796875, -0.64459228515625, -0.613525390625, -0.58245849609375, -0.5513916015625, -0.52032470703125, -0.4892578125, -0.45819091796875, -0.4271240234375, -0.39605712890625, -0.364990234375, -0.33392333984375, -0.3028564453125, -0.27178955078125, -0.24072265625, -0.20965576171875, -0.1785888671875, -0.14752197265625, -0.116455078125, -0.08538818359375, -0.0543212890625, -0.02325439453125, 0.0078125, 0.03887939453125, 0.0699462890625, 0.10101318359375, 0.132080078125, 0.16314697265625, 0.1942138671875, 0.22528076171875, 0.25634765625, 0.28741455078125, 0.3184814453125, 0.34954833984375, 0.380615234375, 0.41168212890625, 0.4427490234375, 0.47381591796875, 0.5048828125, 0.53594970703125, 0.5670166015625, 0.59808349609375, 0.629150390625, 0.66021728515625, 0.6912841796875, 0.72235107421875, 0.75341796875, 0.78448486328125, 0.8155517578125, 0.84661865234375, 0.877685546875, 0.90875244140625, 0.9398193359375, 0.97088623046875, 1.001953125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 16.0, 23.0, 78.0, 162.0, 246.0, 208.0, 185.0, 65.0, 21.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.61861038208008, -35.89997863769531, -35.18135070800781, -34.46271896362305, -33.74409103393555, -33.02545928955078, -32.30683135986328, -31.588199615478516, -30.869569778442383, -30.15093994140625, -29.432310104370117, -28.713680267333984, -27.99504852294922, -27.276418685913086, -26.557788848876953, -25.83915901184082, -25.120529174804688, -24.401899337768555, -23.683269500732422, -22.964637756347656, -22.246007919311523, -21.52737808227539, -20.808748245239258, -20.090118408203125, -19.37148666381836, -18.652856826782227, -17.934226989746094, -17.215595245361328, -16.496965408325195, -15.778335571289062, -15.05970573425293, -14.341075897216797, -13.622445106506348, -12.903815269470215, -12.185184478759766, -11.466554641723633, -10.7479248046875, -10.029294967651367, -9.310664176940918, -8.592034339904785, -7.873404026031494, -7.154773712158203, -6.43614387512207, -5.717513561248779, -4.998883247375488, -4.2802534103393555, -3.5616230964660645, -2.8429932594299316, -2.1243629455566406, -1.4057328701019287, -0.6871026754379272, 0.03152751922607422, 0.7501575946807861, 1.468787670135498, 2.187417984008789, 2.906047821044922, 3.624678134918213, 4.343308448791504, 5.061938285827637, 5.780568599700928, 6.499198913574219, 7.217828750610352, 7.936459064483643, 8.655088424682617, 9.373719215393066]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 17.0, 10.0, 15.0, 16.0, 18.0, 26.0, 27.0, 29.0, 33.0, 45.0, 34.0, 54.0, 44.0, 47.0, 44.0, 47.0, 50.0, 51.0, 42.0, 45.0, 44.0, 45.0, 41.0, 31.0, 24.0, 23.0, 21.0, 16.0, 6.0, 8.0, 9.0, 7.0, 11.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.641238689422607, -6.403675556182861, -6.166112899780273, -5.928549766540527, -5.690986633300781, -5.453423976898193, -5.215860843658447, -4.978298187255859, -4.740735054016113, -4.503171920776367, -4.265609264373779, -4.028046131134033, -3.790483236312866, -3.552920341491699, -3.315357208251953, -3.077794313430786, -2.840231418609619, -2.602668523788452, -2.365105628967285, -2.127542495727539, -1.889979600906372, -1.652416706085205, -1.4148536920547485, -1.177290678024292, -0.939727783203125, -0.7021648287773132, -0.46460187435150146, -0.2270389199256897, 0.01052403450012207, 0.24808692932128906, 0.4856499433517456, 0.7232129573822021, 0.9607763290405273, 1.1983392238616943, 1.4359022378921509, 1.6734652519226074, 1.9110281467437744, 2.1485910415649414, 2.3861541748046875, 2.6237170696258545, 2.8612799644470215, 3.0988428592681885, 3.3364057540893555, 3.5739688873291016, 3.8115317821502686, 4.0490946769714355, 4.286657810211182, 4.5242204666137695, 4.761783599853516, 4.999346733093262, 5.23690938949585, 5.474472522735596, 5.712035179138184, 5.94959831237793, 6.187161445617676, 6.424724578857422, 6.66228723526001, 6.899850368499756, 7.137413024902344, 7.37497615814209, 7.612539291381836, 7.850101947784424, 8.087664604187012, 8.325227737426758, 8.562790870666504]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 19.0, 16.0, 35.0, 45.0, 48.0, 67.0, 125.0, 197.0, 258.0, 577.0, 1721.0, 9056.0, 81838.0, 870989.0, 2450739.0, 701835.0, 66051.0, 7794.0, 1552.0, 501.0, 241.0, 189.0, 115.0, 72.0, 52.0, 38.0, 24.0, 17.0, 15.0, 15.0, 6.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9453125, -7.707763671875, -7.47021484375, -7.232666015625, -6.9951171875, -6.757568359375, -6.52001953125, -6.282470703125, -6.044921875, -5.807373046875, -5.56982421875, -5.332275390625, -5.0947265625, -4.857177734375, -4.61962890625, -4.382080078125, -4.14453125, -3.906982421875, -3.66943359375, -3.431884765625, -3.1943359375, -2.956787109375, -2.71923828125, -2.481689453125, -2.244140625, -2.006591796875, -1.76904296875, -1.531494140625, -1.2939453125, -1.056396484375, -0.81884765625, -0.581298828125, -0.34375, -0.106201171875, 0.13134765625, 0.368896484375, 0.6064453125, 0.843994140625, 1.08154296875, 1.319091796875, 1.556640625, 1.794189453125, 2.03173828125, 2.269287109375, 2.5068359375, 2.744384765625, 2.98193359375, 3.219482421875, 3.45703125, 3.694580078125, 3.93212890625, 4.169677734375, 4.4072265625, 4.644775390625, 4.88232421875, 5.119873046875, 5.357421875, 5.594970703125, 5.83251953125, 6.070068359375, 6.3076171875, 6.545166015625, 6.78271484375, 7.020263671875, 7.2578125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 7.0, 4.0, 8.0, 7.0, 5.0, 10.0, 9.0, 19.0, 13.0, 18.0, 19.0, 20.0, 20.0, 40.0, 24.0, 25.0, 33.0, 51.0, 47.0, 40.0, 38.0, 55.0, 39.0, 39.0, 43.0, 42.0, 51.0, 32.0, 39.0, 28.0, 29.0, 25.0, 29.0, 18.0, 17.0, 9.0, 12.0, 8.0, 7.0, 6.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3828125, -3.272735595703125, -3.16265869140625, -3.052581787109375, -2.9425048828125, -2.832427978515625, -2.72235107421875, -2.612274169921875, -2.502197265625, -2.392120361328125, -2.28204345703125, -2.171966552734375, -2.0618896484375, -1.951812744140625, -1.84173583984375, -1.731658935546875, -1.62158203125, -1.511505126953125, -1.40142822265625, -1.291351318359375, -1.1812744140625, -1.071197509765625, -0.96112060546875, -0.851043701171875, -0.740966796875, -0.630889892578125, -0.52081298828125, -0.410736083984375, -0.3006591796875, -0.190582275390625, -0.08050537109375, 0.029571533203125, 0.1396484375, 0.249725341796875, 0.35980224609375, 0.469879150390625, 0.5799560546875, 0.690032958984375, 0.80010986328125, 0.910186767578125, 1.020263671875, 1.130340576171875, 1.24041748046875, 1.350494384765625, 1.4605712890625, 1.570648193359375, 1.68072509765625, 1.790802001953125, 1.90087890625, 2.010955810546875, 2.12103271484375, 2.231109619140625, 2.3411865234375, 2.451263427734375, 2.56134033203125, 2.671417236328125, 2.781494140625, 2.891571044921875, 3.00164794921875, 3.111724853515625, 3.2218017578125, 3.331878662109375, 3.44195556640625, 3.552032470703125, 3.662109375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 14.0, 10.0, 18.0, 24.0, 36.0, 57.0, 99.0, 163.0, 292.0, 580.0, 1585.0, 10450.0, 490817.0, 3602586.0, 81371.0, 4194.0, 975.0, 409.0, 218.0, 134.0, 69.0, 58.0, 44.0, 24.0, 14.0, 9.0, 9.0, 7.0, 11.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.6640625, -15.275390625, -14.88671875, -14.498046875, -14.109375, -13.720703125, -13.33203125, -12.943359375, -12.5546875, -12.166015625, -11.77734375, -11.388671875, -11.0, -10.611328125, -10.22265625, -9.833984375, -9.4453125, -9.056640625, -8.66796875, -8.279296875, -7.890625, -7.501953125, -7.11328125, -6.724609375, -6.3359375, -5.947265625, -5.55859375, -5.169921875, -4.78125, -4.392578125, -4.00390625, -3.615234375, -3.2265625, -2.837890625, -2.44921875, -2.060546875, -1.671875, -1.283203125, -0.89453125, -0.505859375, -0.1171875, 0.271484375, 0.66015625, 1.048828125, 1.4375, 1.826171875, 2.21484375, 2.603515625, 2.9921875, 3.380859375, 3.76953125, 4.158203125, 4.546875, 4.935546875, 5.32421875, 5.712890625, 6.1015625, 6.490234375, 6.87890625, 7.267578125, 7.65625, 8.044921875, 8.43359375, 8.822265625, 9.2109375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 10.0, 13.0, 5.0, 12.0, 20.0, 25.0, 26.0, 39.0, 43.0, 61.0, 88.0, 133.0, 160.0, 196.0, 296.0, 356.0, 371.0, 395.0, 391.0, 348.0, 245.0, 206.0, 166.0, 117.0, 97.0, 68.0, 46.0, 32.0, 35.0, 17.0, 18.0, 9.0, 3.0, 6.0, 4.0, 6.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.529296875, -1.4757843017578125, -1.422271728515625, -1.3687591552734375, -1.31524658203125, -1.2617340087890625, -1.208221435546875, -1.1547088623046875, -1.1011962890625, -1.0476837158203125, -0.994171142578125, -0.9406585693359375, -0.88714599609375, -0.8336334228515625, -0.780120849609375, -0.7266082763671875, -0.673095703125, -0.6195831298828125, -0.566070556640625, -0.5125579833984375, -0.45904541015625, -0.4055328369140625, -0.352020263671875, -0.2985076904296875, -0.2449951171875, -0.1914825439453125, -0.137969970703125, -0.0844573974609375, -0.03094482421875, 0.0225677490234375, 0.076080322265625, 0.1295928955078125, 0.18310546875, 0.2366180419921875, 0.290130615234375, 0.3436431884765625, 0.39715576171875, 0.4506683349609375, 0.504180908203125, 0.5576934814453125, 0.6112060546875, 0.6647186279296875, 0.718231201171875, 0.7717437744140625, 0.82525634765625, 0.8787689208984375, 0.932281494140625, 0.9857940673828125, 1.039306640625, 1.0928192138671875, 1.146331787109375, 1.1998443603515625, 1.25335693359375, 1.3068695068359375, 1.360382080078125, 1.4138946533203125, 1.4674072265625, 1.5209197998046875, 1.574432373046875, 1.6279449462890625, 1.68145751953125, 1.7349700927734375, 1.788482666015625, 1.8419952392578125, 1.8955078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 13.0, 39.0, 58.0, 83.0, 80.0, 139.0, 148.0, 144.0, 109.0, 83.0, 49.0, 25.0, 13.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.708285331726074, -4.360116481781006, -4.0119476318359375, -3.6637792587280273, -3.315610408782959, -2.9674415588378906, -2.6192729473114014, -2.271104335784912, -1.9229354858398438, -1.574766755104065, -1.2265980243682861, -0.8784292936325073, -0.5302605628967285, -0.1820918321609497, 0.1660768985748291, 0.5142455101013184, 0.8624143600463867, 1.2105830907821655, 1.5587518215179443, 1.9069205522537231, 2.255089282989502, 2.6032581329345703, 2.9514267444610596, 3.299595355987549, 3.647764205932617, 3.9959330558776855, 4.344101905822754, 4.692270278930664, 5.040439128875732, 5.388607978820801, 5.736776351928711, 6.084945201873779, 6.433113098144531, 6.7812819480896, 7.129450798034668, 7.477619171142578, 7.8257880210876465, 8.173956871032715, 8.522125244140625, 8.870294570922852, 9.218462944030762, 9.566631317138672, 9.914800643920898, 10.262969017028809, 10.611137390136719, 10.959306716918945, 11.307475090026855, 11.655643463134766, 12.003812789916992, 12.351981163024902, 12.700150489807129, 13.048318862915039, 13.396488189697266, 13.744656562805176, 14.092824935913086, 14.440994262695312, 14.789162635803223, 15.137331008911133, 15.48550033569336, 15.83366870880127, 16.18183708190918, 16.530006408691406, 16.878175735473633, 17.226343154907227, 17.574512481689453]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 5.0, 10.0, 11.0, 17.0, 16.0, 20.0, 18.0, 15.0, 30.0, 25.0, 27.0, 31.0, 26.0, 27.0, 38.0, 38.0, 31.0, 49.0, 33.0, 38.0, 43.0, 38.0, 40.0, 30.0, 49.0, 37.0, 34.0, 21.0, 28.0, 27.0, 18.0, 13.0, 13.0, 13.0, 17.0, 13.0, 7.0, 11.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.094571113586426, -3.9765985012054443, -3.858625650405884, -3.7406530380249023, -3.622680187225342, -3.5047075748443604, -3.3867347240448, -3.2687621116638184, -3.150789260864258, -3.0328166484832764, -2.914843797683716, -2.7968711853027344, -2.678898334503174, -2.5609257221221924, -2.442952871322632, -2.3249802589416504, -2.20700740814209, -2.0890347957611084, -1.9710619449615479, -1.8530892133712769, -1.7351164817810059, -1.6171438694000244, -1.4991710186004639, -1.3811984062194824, -1.263225793838501, -1.14525306224823, -1.027280330657959, -0.909307599067688, -0.791334867477417, -0.6733621954917908, -0.5553894639015198, -0.4374167323112488, -0.319443941116333, -0.201471209526062, -0.08349849283695221, 0.03447422385215759, 0.1524469554424286, 0.2704196572303772, 0.3883923888206482, 0.5063651204109192, 0.6243378520011902, 0.7423105835914612, 0.8602833151817322, 0.9782559871673584, 1.0962287187576294, 1.2142014503479004, 1.3321741819381714, 1.4501469135284424, 1.5681196451187134, 1.6860923767089844, 1.8040651082992554, 1.9220378398895264, 2.040010452270508, 2.1579833030700684, 2.27595591545105, 2.3939287662506104, 2.511901378631592, 2.6298739910125732, 2.747846841812134, 2.8658194541931152, 2.983792304992676, 3.1017649173736572, 3.2197377681732178, 3.337710380554199, 3.4556832313537598]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 17.0, 8.0, 31.0, 70.0, 113.0, 293.0, 817.0, 2616.0, 28090.0, 904667.0, 105867.0, 4161.0, 1130.0, 383.0, 140.0, 77.0, 30.0, 12.0, 9.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6875, -1.60577392578125, -1.5240478515625, -1.44232177734375, -1.360595703125, -1.27886962890625, -1.1971435546875, -1.11541748046875, -1.03369140625, -0.95196533203125, -0.8702392578125, -0.78851318359375, -0.706787109375, -0.62506103515625, -0.5433349609375, -0.46160888671875, -0.3798828125, -0.29815673828125, -0.2164306640625, -0.13470458984375, -0.052978515625, 0.02874755859375, 0.1104736328125, 0.19219970703125, 0.27392578125, 0.35565185546875, 0.4373779296875, 0.51910400390625, 0.600830078125, 0.68255615234375, 0.7642822265625, 0.84600830078125, 0.927734375, 1.00946044921875, 1.0911865234375, 1.17291259765625, 1.254638671875, 1.33636474609375, 1.4180908203125, 1.49981689453125, 1.58154296875, 1.66326904296875, 1.7449951171875, 1.82672119140625, 1.908447265625, 1.99017333984375, 2.0718994140625, 2.15362548828125, 2.2353515625, 2.31707763671875, 2.3988037109375, 2.48052978515625, 2.562255859375, 2.64398193359375, 2.7257080078125, 2.80743408203125, 2.88916015625, 2.97088623046875, 3.0526123046875, 3.13433837890625, 3.216064453125, 3.29779052734375, 3.3795166015625, 3.46124267578125, 3.54296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 10.0, 7.0, 21.0, 37.0, 30.0, 46.0, 57.0, 85.0, 75.0, 110.0, 100.0, 106.0, 102.0, 62.0, 60.0, 26.0, 36.0, 16.0, 8.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.72906494140625, -2.5479736328125, -2.36688232421875, -2.185791015625, -2.00469970703125, -1.8236083984375, -1.64251708984375, -1.46142578125, -1.28033447265625, -1.0992431640625, -0.91815185546875, -0.737060546875, -0.55596923828125, -0.3748779296875, -0.19378662109375, -0.0126953125, 0.16839599609375, 0.3494873046875, 0.53057861328125, 0.711669921875, 0.89276123046875, 1.0738525390625, 1.25494384765625, 1.43603515625, 1.61712646484375, 1.7982177734375, 1.97930908203125, 2.160400390625, 2.34149169921875, 2.5225830078125, 2.70367431640625, 2.884765625, 3.06585693359375, 3.2469482421875, 3.42803955078125, 3.609130859375, 3.79022216796875, 3.9713134765625, 4.15240478515625, 4.33349609375, 4.51458740234375, 4.6956787109375, 4.87677001953125, 5.057861328125, 5.23895263671875, 5.4200439453125, 5.60113525390625, 5.7822265625, 5.96331787109375, 6.1444091796875, 6.32550048828125, 6.506591796875, 6.68768310546875, 6.8687744140625, 7.04986572265625, 7.23095703125, 7.41204833984375, 7.5931396484375, 7.77423095703125, 7.955322265625, 8.13641357421875, 8.3175048828125, 8.49859619140625, 8.6796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 11.0, 17.0, 34.0, 43.0, 81.0, 174.0, 351.0, 717.0, 1593.0, 3718.0, 8812.0, 20570.0, 48460.0, 107675.0, 208792.0, 273954.0, 196187.0, 99365.0, 44586.0, 18920.0, 8165.0, 3406.0, 1532.0, 676.0, 340.0, 156.0, 98.0, 44.0, 30.0, 23.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.39208984375, -0.3816184997558594, -0.37114715576171875, -0.3606758117675781, -0.3502044677734375, -0.3397331237792969, -0.32926177978515625, -0.3187904357910156, -0.308319091796875, -0.2978477478027344, -0.28737640380859375, -0.2769050598144531, -0.2664337158203125, -0.2559623718261719, -0.24549102783203125, -0.23501968383789062, -0.22454833984375, -0.21407699584960938, -0.20360565185546875, -0.19313430786132812, -0.1826629638671875, -0.17219161987304688, -0.16172027587890625, -0.15124893188476562, -0.140777587890625, -0.13030624389648438, -0.11983489990234375, -0.10936355590820312, -0.0988922119140625, -0.08842086791992188, -0.07794952392578125, -0.06747817993164062, -0.0570068359375, -0.046535491943359375, -0.03606414794921875, -0.025592803955078125, -0.0151214599609375, -0.004650115966796875, 0.00582122802734375, 0.016292572021484375, 0.026763916015625, 0.037235260009765625, 0.04770660400390625, 0.058177947998046875, 0.0686492919921875, 0.07912063598632812, 0.08959197998046875, 0.10006332397460938, 0.11053466796875, 0.12100601196289062, 0.13147735595703125, 0.14194869995117188, 0.1524200439453125, 0.16289138793945312, 0.17336273193359375, 0.18383407592773438, 0.194305419921875, 0.20477676391601562, 0.21524810791015625, 0.22571945190429688, 0.2361907958984375, 0.24666213989257812, 0.25713348388671875, 0.2676048278808594, 0.278076171875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 12.0, 18.0, 17.0, 27.0, 41.0, 47.0, 45.0, 49.0, 75.0, 77.0, 73.0, 85.0, 69.0, 71.0, 47.0, 62.0, 29.0, 22.0, 37.0, 22.0, 18.0, 19.0, 16.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2952880859375, -8.051513671875, -7.8077392578125, -7.56396484375, -7.3201904296875, -7.076416015625, -6.8326416015625, -6.5888671875, -6.3450927734375, -6.101318359375, -5.8575439453125, -5.61376953125, -5.3699951171875, -5.126220703125, -4.8824462890625, -4.638671875, -4.3948974609375, -4.151123046875, -3.9073486328125, -3.66357421875, -3.4197998046875, -3.176025390625, -2.9322509765625, -2.6884765625, -2.4447021484375, -2.200927734375, -1.9571533203125, -1.71337890625, -1.4696044921875, -1.225830078125, -0.9820556640625, -0.73828125, -0.4945068359375, -0.250732421875, -0.0069580078125, 0.23681640625, 0.4805908203125, 0.724365234375, 0.9681396484375, 1.2119140625, 1.4556884765625, 1.699462890625, 1.9432373046875, 2.18701171875, 2.4307861328125, 2.674560546875, 2.9183349609375, 3.162109375, 3.4058837890625, 3.649658203125, 3.8934326171875, 4.13720703125, 4.3809814453125, 4.624755859375, 4.8685302734375, 5.1123046875, 5.3560791015625, 5.599853515625, 5.8436279296875, 6.08740234375, 6.3311767578125, 6.574951171875, 6.8187255859375, 7.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 7.0, 22.0, 32.0, 63.0, 73.0, 101.0, 177.0, 222.0, 330.0, 557.0, 1045.0, 1970.0, 4215.0, 9830.0, 26109.0, 78896.0, 246837.0, 411647.0, 176697.0, 55720.0, 19348.0, 7522.0, 3274.0, 1599.0, 869.0, 490.0, 301.0, 214.0, 136.0, 83.0, 36.0, 38.0, 21.0, 12.0, 10.0, 8.0, 8.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05169677734375, -0.04999351501464844, -0.048290252685546875, -0.04658699035644531, -0.04488372802734375, -0.04318046569824219, -0.041477203369140625, -0.03977394104003906, -0.0380706787109375, -0.03636741638183594, -0.034664154052734375, -0.03296089172363281, -0.03125762939453125, -0.029554367065429688, -0.027851104736328125, -0.026147842407226562, -0.024444580078125, -0.022741317749023438, -0.021038055419921875, -0.019334793090820312, -0.01763153076171875, -0.015928268432617188, -0.014225006103515625, -0.012521743774414062, -0.0108184814453125, -0.009115219116210938, -0.007411956787109375, -0.0057086944580078125, -0.00400543212890625, -0.0023021697998046875, -0.000598907470703125, 0.0011043548583984375, 0.0028076171875, 0.0045108795166015625, 0.006214141845703125, 0.007917404174804688, 0.00962066650390625, 0.011323928833007812, 0.013027191162109375, 0.014730453491210938, 0.0164337158203125, 0.018136978149414062, 0.019840240478515625, 0.021543502807617188, 0.02324676513671875, 0.024950027465820312, 0.026653289794921875, 0.028356552124023438, 0.030059814453125, 0.03176307678222656, 0.033466339111328125, 0.03516960144042969, 0.03687286376953125, 0.03857612609863281, 0.040279388427734375, 0.04198265075683594, 0.0436859130859375, 0.04538917541503906, 0.047092437744140625, 0.04879570007324219, 0.05049896240234375, 0.05220222473144531, 0.053905487060546875, 0.05560874938964844, 0.05731201171875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 1.0, 8.0, 8.0, 15.0, 20.0, 28.0, 46.0, 49.0, 72.0, 71.0, 100.0, 108.0, 85.0, 92.0, 81.0, 46.0, 44.0, 39.0, 27.0, 15.0, 13.0, 10.0, 6.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.802776336669922e-05, -3.6121346056461334e-05, -3.421492874622345e-05, -3.2308511435985565e-05, -3.040209412574768e-05, -2.8495676815509796e-05, -2.658925950527191e-05, -2.4682842195034027e-05, -2.2776424884796143e-05, -2.0870007574558258e-05, -1.8963590264320374e-05, -1.705717295408249e-05, -1.5150755643844604e-05, -1.324433833360672e-05, -1.1337921023368835e-05, -9.431503713130951e-06, -7.525086402893066e-06, -5.618669092655182e-06, -3.7122517824172974e-06, -1.8058344721794128e-06, 1.0058283805847168e-07, 2.007000148296356e-06, 3.913417458534241e-06, 5.819834768772125e-06, 7.72625207901001e-06, 9.632669389247894e-06, 1.1539086699485779e-05, 1.3445504009723663e-05, 1.5351921319961548e-05, 1.7258338630199432e-05, 1.9164755940437317e-05, 2.10711732506752e-05, 2.2977590560913086e-05, 2.488400787115097e-05, 2.6790425181388855e-05, 2.869684249162674e-05, 3.0603259801864624e-05, 3.250967711210251e-05, 3.441609442234039e-05, 3.632251173257828e-05, 3.822892904281616e-05, 4.013534635305405e-05, 4.204176366329193e-05, 4.3948180973529816e-05, 4.58545982837677e-05, 4.7761015594005585e-05, 4.966743290424347e-05, 5.1573850214481354e-05, 5.348026752471924e-05, 5.538668483495712e-05, 5.729310214519501e-05, 5.919951945543289e-05, 6.110593676567078e-05, 6.301235407590866e-05, 6.491877138614655e-05, 6.682518869638443e-05, 6.873160600662231e-05, 7.06380233168602e-05, 7.254444062709808e-05, 7.445085793733597e-05, 7.635727524757385e-05, 7.826369255781174e-05, 8.017010986804962e-05, 8.20765271782875e-05, 8.398294448852539e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 10.0, 5.0, 10.0, 13.0, 19.0, 28.0, 51.0, 90.0, 185.0, 472.0, 1119.0, 3595.0, 17202.0, 168866.0, 738138.0, 102299.0, 12152.0, 2619.0, 920.0, 354.0, 171.0, 88.0, 49.0, 26.0, 20.0, 13.0, 12.0, 5.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134765625, -0.1311626434326172, -0.12755966186523438, -0.12395668029785156, -0.12035369873046875, -0.11675071716308594, -0.11314773559570312, -0.10954475402832031, -0.1059417724609375, -0.10233879089355469, -0.09873580932617188, -0.09513282775878906, -0.09152984619140625, -0.08792686462402344, -0.08432388305664062, -0.08072090148925781, -0.077117919921875, -0.07351493835449219, -0.06991195678710938, -0.06630897521972656, -0.06270599365234375, -0.05910301208496094, -0.055500030517578125, -0.05189704895019531, -0.0482940673828125, -0.04469108581542969, -0.041088104248046875, -0.03748512268066406, -0.03388214111328125, -0.030279159545898438, -0.026676177978515625, -0.023073196411132812, -0.01947021484375, -0.015867233276367188, -0.012264251708984375, -0.008661270141601562, -0.00505828857421875, -0.0014553070068359375, 0.002147674560546875, 0.0057506561279296875, 0.0093536376953125, 0.012956619262695312, 0.016559600830078125, 0.020162582397460938, 0.02376556396484375, 0.027368545532226562, 0.030971527099609375, 0.03457450866699219, 0.038177490234375, 0.04178047180175781, 0.045383453369140625, 0.04898643493652344, 0.05258941650390625, 0.05619239807128906, 0.059795379638671875, 0.06339836120605469, 0.0670013427734375, 0.07060432434082031, 0.07420730590820312, 0.07781028747558594, 0.08141326904296875, 0.08501625061035156, 0.08861923217773438, 0.09222221374511719, 0.0958251953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 14.0, 12.0, 12.0, 30.0, 21.0, 36.0, 38.0, 73.0, 70.0, 87.0, 64.0, 63.0, 80.0, 65.0, 58.0, 66.0, 40.0, 30.0, 30.0, 16.0, 10.0, 8.0, 12.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.017303466796875, -0.01683521270751953, -0.016366958618164062, -0.015898704528808594, -0.015430450439453125, -0.014962196350097656, -0.014493942260742188, -0.014025688171386719, -0.01355743408203125, -0.013089179992675781, -0.012620925903320312, -0.012152671813964844, -0.011684417724609375, -0.011216163635253906, -0.010747909545898438, -0.010279655456542969, -0.0098114013671875, -0.009343147277832031, -0.008874893188476562, -0.008406639099121094, -0.007938385009765625, -0.007470130920410156, -0.0070018768310546875, -0.006533622741699219, -0.00606536865234375, -0.005597114562988281, -0.0051288604736328125, -0.004660606384277344, -0.004192352294921875, -0.0037240982055664062, -0.0032558441162109375, -0.0027875900268554688, -0.0023193359375, -0.0018510818481445312, -0.0013828277587890625, -0.0009145736694335938, -0.000446319580078125, 2.193450927734375e-05, 0.0004901885986328125, 0.0009584426879882812, 0.00142669677734375, 0.0018949508666992188, 0.0023632049560546875, 0.0028314590454101562, 0.003299713134765625, 0.0037679672241210938, 0.0042362213134765625, 0.004704475402832031, 0.0051727294921875, 0.005640983581542969, 0.0061092376708984375, 0.006577491760253906, 0.007045745849609375, 0.007513999938964844, 0.007982254028320312, 0.008450508117675781, 0.00891876220703125, 0.009387016296386719, 0.009855270385742188, 0.010323524475097656, 0.010791778564453125, 0.011260032653808594, 0.011728286743164062, 0.012196540832519531, 0.012664794921875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 45.0, 81.0, 169.0, 215.0, 231.0, 153.0, 61.0, 27.0, 10.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.830513000488281, -12.50902271270752, -12.187532424926758, -11.866042137145996, -11.544551849365234, -11.223062515258789, -10.901571273803711, -10.580081939697266, -10.258591651916504, -9.937101364135742, -9.61561107635498, -9.294120788574219, -8.972630500793457, -8.651140213012695, -8.32965087890625, -8.008160591125488, -7.686669826507568, -7.365179538726807, -7.043689250946045, -6.722199440002441, -6.40070915222168, -6.079218864440918, -5.757728576660156, -5.4362382888793945, -5.114748001098633, -4.793257713317871, -4.471767425537109, -4.150277137756348, -3.828787326812744, -3.5072970390319824, -3.1858067512512207, -2.864316701889038, -2.5428271293640137, -2.221336841583252, -1.8998467922210693, -1.5783565044403076, -1.2568663358688354, -0.9353761672973633, -0.6138858795166016, -0.29239583015441895, 0.029094457626342773, 0.35058465600013733, 0.6720748543739319, 0.9935650825500488, 1.315055251121521, 1.6365454196929932, 1.9580357074737549, 2.2795257568359375, 2.601016044616699, 2.922506332397461, 3.2439963817596436, 3.5654866695404053, 3.886976718902588, 4.20846700668335, 4.529957294464111, 4.851447105407715, 5.172937393188477, 5.494427680969238, 5.81591796875, 6.137408256530762, 6.458898067474365, 6.780388355255127, 7.101878643035889, 7.423368453979492, 7.744859218597412]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 15.0, 21.0, 36.0, 46.0, 65.0, 84.0, 84.0, 97.0, 106.0, 102.0, 110.0, 60.0, 64.0, 39.0, 33.0, 16.0, 9.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646125316619873, -2.4611449241638184, -2.2761645317077637, -2.091184139251709, -1.9062037467956543, -1.7212233543395996, -1.536242961883545, -1.3512625694274902, -1.1662821769714355, -0.9813017845153809, -0.7963213920593262, -0.6113409996032715, -0.4263606071472168, -0.2413802146911621, -0.05639982223510742, 0.12858057022094727, 0.31356096267700195, 0.49854135513305664, 0.6835217475891113, 0.868502140045166, 1.0534825325012207, 1.2384629249572754, 1.42344331741333, 1.6084237098693848, 1.7934041023254395, 1.9783844947814941, 2.163364887237549, 2.3483452796936035, 2.533325672149658, 2.718306064605713, 2.9032864570617676, 3.0882668495178223, 3.273247718811035, 3.45822811126709, 3.6432085037231445, 3.828188896179199, 4.013169288635254, 4.198149681091309, 4.383130073547363, 4.568110466003418, 4.753090858459473, 4.938071250915527, 5.123051643371582, 5.308032035827637, 5.493012428283691, 5.677992820739746, 5.862973213195801, 6.0479536056518555, 6.23293399810791, 6.417914390563965, 6.6028947830200195, 6.787875175476074, 6.972855567932129, 7.157835960388184, 7.342816352844238, 7.527796745300293, 7.712777137756348, 7.897757530212402, 8.082737922668457, 8.267718315124512, 8.452698707580566, 8.637679100036621, 8.822659492492676, 9.00763988494873, 9.192620277404785]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 13.0, 22.0, 56.0, 126.0, 290.0, 856.0, 3460.0, 17119.0, 96817.0, 401822.0, 406692.0, 99025.0, 17410.0, 3447.0, 871.0, 297.0, 119.0, 50.0, 32.0, 15.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.24530029296875, -6.0765380859375, -5.90777587890625, -5.739013671875, -5.57025146484375, -5.4014892578125, -5.23272705078125, -5.06396484375, -4.89520263671875, -4.7264404296875, -4.55767822265625, -4.388916015625, -4.22015380859375, -4.0513916015625, -3.88262939453125, -3.7138671875, -3.54510498046875, -3.3763427734375, -3.20758056640625, -3.038818359375, -2.87005615234375, -2.7012939453125, -2.53253173828125, -2.36376953125, -2.19500732421875, -2.0262451171875, -1.85748291015625, -1.688720703125, -1.51995849609375, -1.3511962890625, -1.18243408203125, -1.013671875, -0.84490966796875, -0.6761474609375, -0.50738525390625, -0.338623046875, -0.16986083984375, -0.0010986328125, 0.16766357421875, 0.33642578125, 0.50518798828125, 0.6739501953125, 0.84271240234375, 1.011474609375, 1.18023681640625, 1.3489990234375, 1.51776123046875, 1.6865234375, 1.85528564453125, 2.0240478515625, 2.19281005859375, 2.361572265625, 2.53033447265625, 2.6990966796875, 2.86785888671875, 3.03662109375, 3.20538330078125, 3.3741455078125, 3.54290771484375, 3.711669921875, 3.88043212890625, 4.0491943359375, 4.21795654296875, 4.38671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 6.0, 11.0, 16.0, 12.0, 34.0, 38.0, 60.0, 61.0, 73.0, 75.0, 91.0, 85.0, 88.0, 80.0, 75.0, 61.0, 42.0, 37.0, 17.0, 21.0, 14.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.78289794921875, -3.4993896484375, -3.21588134765625, -2.932373046875, -2.64886474609375, -2.3653564453125, -2.08184814453125, -1.79833984375, -1.51483154296875, -1.2313232421875, -0.94781494140625, -0.664306640625, -0.38079833984375, -0.0972900390625, 0.18621826171875, 0.4697265625, 0.75323486328125, 1.0367431640625, 1.32025146484375, 1.603759765625, 1.88726806640625, 2.1707763671875, 2.45428466796875, 2.73779296875, 3.02130126953125, 3.3048095703125, 3.58831787109375, 3.871826171875, 4.15533447265625, 4.4388427734375, 4.72235107421875, 5.005859375, 5.28936767578125, 5.5728759765625, 5.85638427734375, 6.139892578125, 6.42340087890625, 6.7069091796875, 6.99041748046875, 7.27392578125, 7.55743408203125, 7.8409423828125, 8.12445068359375, 8.407958984375, 8.69146728515625, 8.9749755859375, 9.25848388671875, 9.5419921875, 9.82550048828125, 10.1090087890625, 10.39251708984375, 10.676025390625, 10.95953369140625, 11.2430419921875, 11.52655029296875, 11.81005859375, 12.09356689453125, 12.3770751953125, 12.66058349609375, 12.944091796875, 13.22760009765625, 13.5111083984375, 13.79461669921875, 14.078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 1.0, 7.0, 10.0, 6.0, 11.0, 14.0, 7.0, 24.0, 26.0, 41.0, 41.0, 52.0, 72.0, 78.0, 93.0, 128.0, 155.0, 180.0, 327.0, 642.0, 9142.0, 467108.0, 556577.0, 11726.0, 768.0, 321.0, 220.0, 151.0, 118.0, 91.0, 74.0, 62.0, 49.0, 44.0, 32.0, 35.0, 21.0, 27.0, 14.0, 15.0, 7.0, 6.0, 3.0, 4.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.2109375, -10.837646484375, -10.46435546875, -10.091064453125, -9.7177734375, -9.344482421875, -8.97119140625, -8.597900390625, -8.224609375, -7.851318359375, -7.47802734375, -7.104736328125, -6.7314453125, -6.358154296875, -5.98486328125, -5.611572265625, -5.23828125, -4.864990234375, -4.49169921875, -4.118408203125, -3.7451171875, -3.371826171875, -2.99853515625, -2.625244140625, -2.251953125, -1.878662109375, -1.50537109375, -1.132080078125, -0.7587890625, -0.385498046875, -0.01220703125, 0.361083984375, 0.734375, 1.107666015625, 1.48095703125, 1.854248046875, 2.2275390625, 2.600830078125, 2.97412109375, 3.347412109375, 3.720703125, 4.093994140625, 4.46728515625, 4.840576171875, 5.2138671875, 5.587158203125, 5.96044921875, 6.333740234375, 6.70703125, 7.080322265625, 7.45361328125, 7.826904296875, 8.2001953125, 8.573486328125, 8.94677734375, 9.320068359375, 9.693359375, 10.066650390625, 10.43994140625, 10.813232421875, 11.1865234375, 11.559814453125, 11.93310546875, 12.306396484375, 12.6796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 5.0, 5.0, 5.0, 3.0, 2.0, 10.0, 7.0, 10.0, 15.0, 13.0, 16.0, 20.0, 22.0, 17.0, 29.0, 30.0, 36.0, 33.0, 32.0, 26.0, 41.0, 31.0, 45.0, 38.0, 45.0, 42.0, 45.0, 31.0, 38.0, 26.0, 31.0, 34.0, 33.0, 31.0, 20.0, 13.0, 24.0, 18.0, 9.0, 8.0, 11.0, 8.0, 11.0, 5.0, 5.0, 4.0, 4.0, 7.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-3.9765625, -3.84600830078125, -3.7154541015625, -3.58489990234375, -3.454345703125, -3.32379150390625, -3.1932373046875, -3.06268310546875, -2.93212890625, -2.80157470703125, -2.6710205078125, -2.54046630859375, -2.409912109375, -2.27935791015625, -2.1488037109375, -2.01824951171875, -1.8876953125, -1.75714111328125, -1.6265869140625, -1.49603271484375, -1.365478515625, -1.23492431640625, -1.1043701171875, -0.97381591796875, -0.84326171875, -0.71270751953125, -0.5821533203125, -0.45159912109375, -0.321044921875, -0.19049072265625, -0.0599365234375, 0.07061767578125, 0.201171875, 0.33172607421875, 0.4622802734375, 0.59283447265625, 0.723388671875, 0.85394287109375, 0.9844970703125, 1.11505126953125, 1.24560546875, 1.37615966796875, 1.5067138671875, 1.63726806640625, 1.767822265625, 1.89837646484375, 2.0289306640625, 2.15948486328125, 2.2900390625, 2.42059326171875, 2.5511474609375, 2.68170166015625, 2.812255859375, 2.94281005859375, 3.0733642578125, 3.20391845703125, 3.33447265625, 3.46502685546875, 3.5955810546875, 3.72613525390625, 3.856689453125, 3.98724365234375, 4.1177978515625, 4.24835205078125, 4.37890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 7.0, 18.0, 28.0, 32.0, 57.0, 133.0, 208.0, 468.0, 1879.0, 18322.0, 618599.0, 395138.0, 11337.0, 1443.0, 411.0, 189.0, 108.0, 55.0, 45.0, 21.0, 15.0, 3.0, 9.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.67578125, -2.572540283203125, -2.46929931640625, -2.366058349609375, -2.2628173828125, -2.159576416015625, -2.05633544921875, -1.953094482421875, -1.849853515625, -1.746612548828125, -1.64337158203125, -1.540130615234375, -1.4368896484375, -1.333648681640625, -1.23040771484375, -1.127166748046875, -1.02392578125, -0.920684814453125, -0.81744384765625, -0.714202880859375, -0.6109619140625, -0.507720947265625, -0.40447998046875, -0.301239013671875, -0.197998046875, -0.094757080078125, 0.00848388671875, 0.111724853515625, 0.2149658203125, 0.318206787109375, 0.42144775390625, 0.524688720703125, 0.6279296875, 0.731170654296875, 0.83441162109375, 0.937652587890625, 1.0408935546875, 1.144134521484375, 1.24737548828125, 1.350616455078125, 1.453857421875, 1.557098388671875, 1.66033935546875, 1.763580322265625, 1.8668212890625, 1.970062255859375, 2.07330322265625, 2.176544189453125, 2.27978515625, 2.383026123046875, 2.48626708984375, 2.589508056640625, 2.6927490234375, 2.795989990234375, 2.89923095703125, 3.002471923828125, 3.105712890625, 3.208953857421875, 3.31219482421875, 3.415435791015625, 3.5186767578125, 3.621917724609375, 3.72515869140625, 3.828399658203125, 3.931640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 7.0, 4.0, 3.0, 9.0, 10.0, 16.0, 9.0, 16.0, 37.0, 32.0, 54.0, 44.0, 68.0, 57.0, 93.0, 92.0, 69.0, 64.0, 56.0, 61.0, 44.0, 32.0, 29.0, 22.0, 21.0, 6.0, 12.0, 7.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016260147094726562, -0.00015597790479660034, -0.00014935433864593506, -0.00014273077249526978, -0.0001361072063446045, -0.0001294836401939392, -0.00012286007404327393, -0.00011623650789260864, -0.00010961294174194336, -0.00010298937559127808, -9.636580944061279e-05, -8.974224328994751e-05, -8.311867713928223e-05, -7.649511098861694e-05, -6.987154483795166e-05, -6.324797868728638e-05, -5.6624412536621094e-05, -5.000084638595581e-05, -4.337728023529053e-05, -3.6753714084625244e-05, -3.013014793395996e-05, -2.3506581783294678e-05, -1.6883015632629395e-05, -1.0259449481964111e-05, -3.635883331298828e-06, 2.987682819366455e-06, 9.611248970031738e-06, 1.623481512069702e-05, 2.2858381271362305e-05, 2.9481947422027588e-05, 3.610551357269287e-05, 4.2729079723358154e-05, 4.935264587402344e-05, 5.597621202468872e-05, 6.2599778175354e-05, 6.922334432601929e-05, 7.584691047668457e-05, 8.247047662734985e-05, 8.909404277801514e-05, 9.571760892868042e-05, 0.0001023411750793457, 0.00010896474123001099, 0.00011558830738067627, 0.00012221187353134155, 0.00012883543968200684, 0.00013545900583267212, 0.0001420825719833374, 0.00014870613813400269, 0.00015532970428466797, 0.00016195327043533325, 0.00016857683658599854, 0.00017520040273666382, 0.0001818239688873291, 0.00018844753503799438, 0.00019507110118865967, 0.00020169466733932495, 0.00020831823348999023, 0.00021494179964065552, 0.0002215653657913208, 0.00022818893194198608, 0.00023481249809265137, 0.00024143606424331665, 0.00024805963039398193, 0.0002546831965446472, 0.0002613067626953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 9.0, 4.0, 8.0, 9.0, 13.0, 15.0, 25.0, 37.0, 50.0, 83.0, 114.0, 167.0, 429.0, 1408.0, 8125.0, 161767.0, 807209.0, 62546.0, 4748.0, 971.0, 324.0, 163.0, 97.0, 61.0, 40.0, 29.0, 25.0, 23.0, 11.0, 6.0, 5.0, 8.0, 1.0, 5.0, 1.0, 2.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.091796875, -3.0018310546875, -2.911865234375, -2.8218994140625, -2.73193359375, -2.6419677734375, -2.552001953125, -2.4620361328125, -2.3720703125, -2.2821044921875, -2.192138671875, -2.1021728515625, -2.01220703125, -1.9222412109375, -1.832275390625, -1.7423095703125, -1.65234375, -1.5623779296875, -1.472412109375, -1.3824462890625, -1.29248046875, -1.2025146484375, -1.112548828125, -1.0225830078125, -0.9326171875, -0.8426513671875, -0.752685546875, -0.6627197265625, -0.57275390625, -0.4827880859375, -0.392822265625, -0.3028564453125, -0.212890625, -0.1229248046875, -0.032958984375, 0.0570068359375, 0.14697265625, 0.2369384765625, 0.326904296875, 0.4168701171875, 0.5068359375, 0.5968017578125, 0.686767578125, 0.7767333984375, 0.86669921875, 0.9566650390625, 1.046630859375, 1.1365966796875, 1.2265625, 1.3165283203125, 1.406494140625, 1.4964599609375, 1.58642578125, 1.6763916015625, 1.766357421875, 1.8563232421875, 1.9462890625, 2.0362548828125, 2.126220703125, 2.2161865234375, 2.30615234375, 2.3961181640625, 2.486083984375, 2.5760498046875, 2.666015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 11.0, 10.0, 7.0, 15.0, 24.0, 28.0, 34.0, 48.0, 54.0, 66.0, 74.0, 71.0, 85.0, 83.0, 78.0, 69.0, 48.0, 46.0, 32.0, 25.0, 24.0, 11.0, 9.0, 7.0, 15.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66162109375, -0.641815185546875, -0.62200927734375, -0.602203369140625, -0.5823974609375, -0.562591552734375, -0.54278564453125, -0.522979736328125, -0.503173828125, -0.483367919921875, -0.46356201171875, -0.443756103515625, -0.4239501953125, -0.404144287109375, -0.38433837890625, -0.364532470703125, -0.3447265625, -0.324920654296875, -0.30511474609375, -0.285308837890625, -0.2655029296875, -0.245697021484375, -0.22589111328125, -0.206085205078125, -0.186279296875, -0.166473388671875, -0.14666748046875, -0.126861572265625, -0.1070556640625, -0.087249755859375, -0.06744384765625, -0.047637939453125, -0.02783203125, -0.008026123046875, 0.01177978515625, 0.031585693359375, 0.0513916015625, 0.071197509765625, 0.09100341796875, 0.110809326171875, 0.130615234375, 0.150421142578125, 0.17022705078125, 0.190032958984375, 0.2098388671875, 0.229644775390625, 0.24945068359375, 0.269256591796875, 0.2890625, 0.308868408203125, 0.32867431640625, 0.348480224609375, 0.3682861328125, 0.388092041015625, 0.40789794921875, 0.427703857421875, 0.447509765625, 0.467315673828125, 0.48712158203125, 0.506927490234375, 0.5267333984375, 0.546539306640625, 0.56634521484375, 0.586151123046875, 0.60595703125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 18.0, 41.0, 58.0, 105.0, 117.0, 171.0, 175.0, 129.0, 81.0, 55.0, 32.0, 18.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.838399410247803, -4.357330322265625, -3.8762612342834473, -3.3951919078826904, -2.9141228199005127, -2.433053731918335, -1.9519844055175781, -1.4709153175354004, -0.9898462295532227, -0.5087770819664001, -0.027707934379577637, 0.45336127281188965, 0.9344303607940674, 1.4154994487762451, 1.896568775177002, 2.3776378631591797, 2.8587069511413574, 3.339776039123535, 3.820845127105713, 4.301914215087891, 4.782983779907227, 5.264052391052246, 5.745121955871582, 6.22619104385376, 6.7072601318359375, 7.188329219818115, 7.669398307800293, 8.150467872619629, 8.631536483764648, 9.112606048583984, 9.59367561340332, 10.07474422454834, 10.55581283569336, 11.036882400512695, 11.517951011657715, 11.99902057647705, 12.48008918762207, 12.961158752441406, 13.442228317260742, 13.923296928405762, 14.404365539550781, 14.885435104370117, 15.366503715515137, 15.847573280334473, 16.328641891479492, 16.809711456298828, 17.290781021118164, 17.7718505859375, 18.252918243408203, 18.73398780822754, 19.215057373046875, 19.696125030517578, 20.177194595336914, 20.65826416015625, 21.139333724975586, 21.620403289794922, 22.101472854614258, 22.582542419433594, 23.06361198425293, 23.544679641723633, 24.02574920654297, 24.506818771362305, 24.98788833618164, 25.468955993652344, 25.95002555847168]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 10.0, 9.0, 8.0, 15.0, 18.0, 24.0, 20.0, 31.0, 40.0, 30.0, 40.0, 39.0, 43.0, 63.0, 60.0, 58.0, 56.0, 51.0, 44.0, 65.0, 38.0, 47.0, 36.0, 35.0, 34.0, 15.0, 16.0, 14.0, 14.0, 6.0, 13.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.641651153564453, -6.327957630157471, -6.014264106750488, -5.700570583343506, -5.386877059936523, -5.073183536529541, -4.759490013122559, -4.445796489715576, -4.132102966308594, -3.8184094429016113, -3.504715919494629, -3.1910223960876465, -2.877328872680664, -2.5636353492736816, -2.249941825866699, -1.9362483024597168, -1.6225547790527344, -1.308861255645752, -0.9951677322387695, -0.6814742088317871, -0.3677806854248047, -0.054087162017822266, 0.25960636138916016, 0.5732998847961426, 0.886993408203125, 1.2006869316101074, 1.5143804550170898, 1.8280739784240723, 2.1417675018310547, 2.455461025238037, 2.7691545486450195, 3.082848072052002, 3.3965415954589844, 3.710235118865967, 4.023928642272949, 4.337622165679932, 4.651315689086914, 4.9650092124938965, 5.278702735900879, 5.592396259307861, 5.906089782714844, 6.219783306121826, 6.533476829528809, 6.847170352935791, 7.160863876342773, 7.474557399749756, 7.788250923156738, 8.101943969726562, 8.415637969970703, 8.729331970214844, 9.043025016784668, 9.356718063354492, 9.670412063598633, 9.984106063842773, 10.297799110412598, 10.611492156982422, 10.925186157226562, 11.238880157470703, 11.552573204040527, 11.866266250610352, 12.179960250854492, 12.493654251098633, 12.807347297668457, 13.121040344238281, 13.434734344482422]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 5.0, 20.0, 40.0, 46.0, 83.0, 127.0, 150.0, 272.0, 515.0, 1453.0, 10023.0, 178537.0, 2205923.0, 1683057.0, 105000.0, 6636.0, 1109.0, 492.0, 266.0, 169.0, 122.0, 87.0, 57.0, 38.0, 14.0, 15.0, 10.0, 6.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.528076171875, -5.23583984375, -4.943603515625, -4.6513671875, -4.359130859375, -4.06689453125, -3.774658203125, -3.482421875, -3.190185546875, -2.89794921875, -2.605712890625, -2.3134765625, -2.021240234375, -1.72900390625, -1.436767578125, -1.14453125, -0.852294921875, -0.56005859375, -0.267822265625, 0.0244140625, 0.316650390625, 0.60888671875, 0.901123046875, 1.193359375, 1.485595703125, 1.77783203125, 2.070068359375, 2.3623046875, 2.654541015625, 2.94677734375, 3.239013671875, 3.53125, 3.823486328125, 4.11572265625, 4.407958984375, 4.7001953125, 4.992431640625, 5.28466796875, 5.576904296875, 5.869140625, 6.161376953125, 6.45361328125, 6.745849609375, 7.0380859375, 7.330322265625, 7.62255859375, 7.914794921875, 8.20703125, 8.499267578125, 8.79150390625, 9.083740234375, 9.3759765625, 9.668212890625, 9.96044921875, 10.252685546875, 10.544921875, 10.837158203125, 11.12939453125, 11.421630859375, 11.7138671875, 12.006103515625, 12.29833984375, 12.590576171875, 12.8828125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 6.0, 3.0, 2.0, 7.0, 9.0, 10.0, 12.0, 17.0, 17.0, 16.0, 15.0, 22.0, 29.0, 22.0, 40.0, 32.0, 37.0, 29.0, 31.0, 40.0, 34.0, 38.0, 43.0, 38.0, 43.0, 41.0, 50.0, 43.0, 33.0, 38.0, 27.0, 22.0, 25.0, 21.0, 14.0, 19.0, 16.0, 6.0, 8.0, 9.0, 9.0, 5.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.28125, -3.173004150390625, -3.06475830078125, -2.956512451171875, -2.8482666015625, -2.740020751953125, -2.63177490234375, -2.523529052734375, -2.415283203125, -2.307037353515625, -2.19879150390625, -2.090545654296875, -1.9822998046875, -1.874053955078125, -1.76580810546875, -1.657562255859375, -1.54931640625, -1.441070556640625, -1.33282470703125, -1.224578857421875, -1.1163330078125, -1.008087158203125, -0.89984130859375, -0.791595458984375, -0.683349609375, -0.575103759765625, -0.46685791015625, -0.358612060546875, -0.2503662109375, -0.142120361328125, -0.03387451171875, 0.074371337890625, 0.1826171875, 0.290863037109375, 0.39910888671875, 0.507354736328125, 0.6156005859375, 0.723846435546875, 0.83209228515625, 0.940338134765625, 1.048583984375, 1.156829833984375, 1.26507568359375, 1.373321533203125, 1.4815673828125, 1.589813232421875, 1.69805908203125, 1.806304931640625, 1.91455078125, 2.022796630859375, 2.13104248046875, 2.239288330078125, 2.3475341796875, 2.455780029296875, 2.56402587890625, 2.672271728515625, 2.780517578125, 2.888763427734375, 2.99700927734375, 3.105255126953125, 3.2135009765625, 3.321746826171875, 3.42999267578125, 3.538238525390625, 3.646484375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 9.0, 10.0, 19.0, 12.0, 28.0, 32.0, 38.0, 84.0, 135.0, 224.0, 531.0, 1574.0, 22504.0, 4022832.0, 142668.0, 2254.0, 650.0, 265.0, 151.0, 76.0, 60.0, 35.0, 14.0, 19.0, 15.0, 12.0, 10.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-24.515625, -23.927001953125, -23.33837890625, -22.749755859375, -22.1611328125, -21.572509765625, -20.98388671875, -20.395263671875, -19.806640625, -19.218017578125, -18.62939453125, -18.040771484375, -17.4521484375, -16.863525390625, -16.27490234375, -15.686279296875, -15.09765625, -14.509033203125, -13.92041015625, -13.331787109375, -12.7431640625, -12.154541015625, -11.56591796875, -10.977294921875, -10.388671875, -9.800048828125, -9.21142578125, -8.622802734375, -8.0341796875, -7.445556640625, -6.85693359375, -6.268310546875, -5.6796875, -5.091064453125, -4.50244140625, -3.913818359375, -3.3251953125, -2.736572265625, -2.14794921875, -1.559326171875, -0.970703125, -0.382080078125, 0.20654296875, 0.795166015625, 1.3837890625, 1.972412109375, 2.56103515625, 3.149658203125, 3.73828125, 4.326904296875, 4.91552734375, 5.504150390625, 6.0927734375, 6.681396484375, 7.27001953125, 7.858642578125, 8.447265625, 9.035888671875, 9.62451171875, 10.213134765625, 10.8017578125, 11.390380859375, 11.97900390625, 12.567626953125, 13.15625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 10.0, 15.0, 20.0, 51.0, 61.0, 119.0, 205.0, 359.0, 598.0, 770.0, 695.0, 465.0, 288.0, 187.0, 95.0, 50.0, 32.0, 25.0, 13.0, 12.0, 6.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.498046875, -1.403289794921875, -1.30853271484375, -1.213775634765625, -1.1190185546875, -1.024261474609375, -0.92950439453125, -0.834747314453125, -0.739990234375, -0.645233154296875, -0.55047607421875, -0.455718994140625, -0.3609619140625, -0.266204833984375, -0.17144775390625, -0.076690673828125, 0.01806640625, 0.112823486328125, 0.20758056640625, 0.302337646484375, 0.3970947265625, 0.491851806640625, 0.58660888671875, 0.681365966796875, 0.776123046875, 0.870880126953125, 0.96563720703125, 1.060394287109375, 1.1551513671875, 1.249908447265625, 1.34466552734375, 1.439422607421875, 1.5341796875, 1.628936767578125, 1.72369384765625, 1.818450927734375, 1.9132080078125, 2.007965087890625, 2.10272216796875, 2.197479248046875, 2.292236328125, 2.386993408203125, 2.48175048828125, 2.576507568359375, 2.6712646484375, 2.766021728515625, 2.86077880859375, 2.955535888671875, 3.05029296875, 3.145050048828125, 3.23980712890625, 3.334564208984375, 3.4293212890625, 3.524078369140625, 3.61883544921875, 3.713592529296875, 3.808349609375, 3.903106689453125, 3.99786376953125, 4.092620849609375, 4.1873779296875, 4.282135009765625, 4.37689208984375, 4.471649169921875, 4.56640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 8.0, 11.0, 21.0, 32.0, 36.0, 40.0, 61.0, 71.0, 83.0, 103.0, 94.0, 81.0, 75.0, 73.0, 67.0, 45.0, 39.0, 21.0, 20.0, 12.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.012707233428955, -3.792933702468872, -3.573160171508789, -3.353386402130127, -3.133613109588623, -2.913839340209961, -2.694065809249878, -2.474292278289795, -2.254518747329712, -2.034745216369629, -1.814971685409546, -1.5951980352401733, -1.3754245042800903, -1.1556509733200073, -0.9358773231506348, -0.7161037921905518, -0.49633026123046875, -0.27655670046806335, -0.05678313970565796, 0.16299045085906982, 0.38276398181915283, 0.6025375127792358, 0.8223111629486084, 1.0420846939086914, 1.2618582248687744, 1.4816317558288574, 1.7014052867889404, 1.921178936958313, 2.1409525871276855, 2.3607258796691895, 2.5804996490478516, 2.8002731800079346, 3.020047187805176, 3.239820718765259, 3.459594249725342, 3.679368019104004, 3.899141311645508, 4.11891508102417, 4.338688850402832, 4.558462142944336, 4.77823543548584, 4.998009204864502, 5.217782497406006, 5.437556266784668, 5.657329559326172, 5.877103328704834, 6.096877098083496, 6.316650390625, 6.536424160003662, 6.756197929382324, 6.975971221923828, 7.19574499130249, 7.415518283843994, 7.635292053222656, 7.85506534576416, 8.074838638305664, 8.294612884521484, 8.514386177062988, 8.734160423278809, 8.953933715820312, 9.173707008361816, 9.39348030090332, 9.61325454711914, 9.833027839660645, 10.052801132202148]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 10.0, 11.0, 12.0, 14.0, 18.0, 18.0, 8.0, 21.0, 25.0, 21.0, 20.0, 22.0, 27.0, 23.0, 29.0, 29.0, 34.0, 44.0, 40.0, 39.0, 43.0, 39.0, 33.0, 45.0, 46.0, 32.0, 34.0, 37.0, 34.0, 21.0, 23.0, 18.0, 19.0, 17.0, 14.0, 11.0, 10.0, 11.0, 9.0, 4.0, 6.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.9131927490234375, -3.800863027572632, -3.688533306121826, -3.5762035846710205, -3.463873863220215, -3.351544141769409, -3.2392144203186035, -3.126884698867798, -3.014554977416992, -2.9022252559661865, -2.789895534515381, -2.677565813064575, -2.5652360916137695, -2.452906370162964, -2.340576648712158, -2.2282469272613525, -2.115917205810547, -2.003587484359741, -1.8912577629089355, -1.7789280414581299, -1.6665983200073242, -1.5542685985565186, -1.441938877105713, -1.3296091556549072, -1.2172791957855225, -1.1049494743347168, -0.9926197528839111, -0.8802900314331055, -0.7679603099822998, -0.6556305289268494, -0.5433008074760437, -0.43097108602523804, -0.31864142417907715, -0.20631170272827148, -0.09398196637630463, 0.01834776997566223, 0.1306774914264679, 0.24300724267959595, 0.3553369641304016, 0.4676666855812073, 0.5799964070320129, 0.6923261284828186, 0.8046558499336243, 0.9169856309890747, 1.0293153524398804, 1.141645073890686, 1.2539747953414917, 1.3663045167922974, 1.478634238243103, 1.5909639596939087, 1.7032936811447144, 1.81562340259552, 1.9279531240463257, 2.040282964706421, 2.1526126861572266, 2.2649424076080322, 2.377272129058838, 2.4896018505096436, 2.601931571960449, 2.714261293411255, 2.8265910148620605, 2.938920736312866, 3.051250457763672, 3.1635801792144775, 3.275909900665283]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 22.0, 22.0, 25.0, 32.0, 44.0, 69.0, 105.0, 150.0, 192.0, 259.0, 451.0, 822.0, 1790.0, 4943.0, 17049.0, 67077.0, 241275.0, 425730.0, 209385.0, 56270.0, 14697.0, 4423.0, 1676.0, 753.0, 428.0, 262.0, 172.0, 107.0, 86.0, 74.0, 49.0, 25.0, 18.0, 22.0, 6.0, 9.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6591796875, -0.6367874145507812, -0.6143951416015625, -0.5920028686523438, -0.569610595703125, -0.5472183227539062, -0.5248260498046875, -0.5024337768554688, -0.48004150390625, -0.45764923095703125, -0.4352569580078125, -0.41286468505859375, -0.390472412109375, -0.36808013916015625, -0.3456878662109375, -0.32329559326171875, -0.3009033203125, -0.27851104736328125, -0.2561187744140625, -0.23372650146484375, -0.211334228515625, -0.18894195556640625, -0.1665496826171875, -0.14415740966796875, -0.12176513671875, -0.09937286376953125, -0.0769805908203125, -0.05458831787109375, -0.032196044921875, -0.00980377197265625, 0.0125885009765625, 0.03498077392578125, 0.057373046875, 0.07976531982421875, 0.1021575927734375, 0.12454986572265625, 0.146942138671875, 0.16933441162109375, 0.1917266845703125, 0.21411895751953125, 0.23651123046875, 0.25890350341796875, 0.2812957763671875, 0.30368804931640625, 0.326080322265625, 0.34847259521484375, 0.3708648681640625, 0.39325714111328125, 0.4156494140625, 0.43804168701171875, 0.4604339599609375, 0.48282623291015625, 0.505218505859375, 0.5276107788085938, 0.5500030517578125, 0.5723953247070312, 0.59478759765625, 0.6171798706054688, 0.6395721435546875, 0.6619644165039062, 0.684356689453125, 0.7067489624023438, 0.7291412353515625, 0.7515335083007812, 0.77392578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 5.0, 4.0, 5.0, 6.0, 18.0, 12.0, 21.0, 20.0, 19.0, 22.0, 26.0, 32.0, 35.0, 32.0, 46.0, 45.0, 41.0, 43.0, 53.0, 62.0, 44.0, 49.0, 44.0, 41.0, 34.0, 47.0, 30.0, 32.0, 27.0, 25.0, 19.0, 15.0, 10.0, 7.0, 9.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.486328125, -3.39398193359375, -3.3016357421875, -3.20928955078125, -3.116943359375, -3.02459716796875, -2.9322509765625, -2.83990478515625, -2.74755859375, -2.65521240234375, -2.5628662109375, -2.47052001953125, -2.378173828125, -2.28582763671875, -2.1934814453125, -2.10113525390625, -2.0087890625, -1.91644287109375, -1.8240966796875, -1.73175048828125, -1.639404296875, -1.54705810546875, -1.4547119140625, -1.36236572265625, -1.27001953125, -1.17767333984375, -1.0853271484375, -0.99298095703125, -0.900634765625, -0.80828857421875, -0.7159423828125, -0.62359619140625, -0.53125, -0.43890380859375, -0.3465576171875, -0.25421142578125, -0.161865234375, -0.06951904296875, 0.0228271484375, 0.11517333984375, 0.20751953125, 0.29986572265625, 0.3922119140625, 0.48455810546875, 0.576904296875, 0.66925048828125, 0.7615966796875, 0.85394287109375, 0.9462890625, 1.03863525390625, 1.1309814453125, 1.22332763671875, 1.315673828125, 1.40802001953125, 1.5003662109375, 1.59271240234375, 1.68505859375, 1.77740478515625, 1.8697509765625, 1.96209716796875, 2.054443359375, 2.14678955078125, 2.2391357421875, 2.33148193359375, 2.423828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 13.0, 25.0, 31.0, 43.0, 77.0, 151.0, 301.0, 623.0, 1415.0, 2884.0, 6109.0, 13227.0, 28220.0, 58832.0, 115219.0, 192442.0, 233742.0, 183379.0, 107140.0, 54753.0, 26394.0, 12384.0, 5718.0, 2790.0, 1302.0, 617.0, 320.0, 156.0, 91.0, 43.0, 34.0, 21.0, 8.0, 10.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.34423828125, -0.3342437744140625, -0.324249267578125, -0.3142547607421875, -0.30426025390625, -0.2942657470703125, -0.284271240234375, -0.2742767333984375, -0.2642822265625, -0.2542877197265625, -0.244293212890625, -0.2342987060546875, -0.22430419921875, -0.2143096923828125, -0.204315185546875, -0.1943206787109375, -0.184326171875, -0.1743316650390625, -0.164337158203125, -0.1543426513671875, -0.14434814453125, -0.1343536376953125, -0.124359130859375, -0.1143646240234375, -0.1043701171875, -0.0943756103515625, -0.084381103515625, -0.0743865966796875, -0.06439208984375, -0.0543975830078125, -0.044403076171875, -0.0344085693359375, -0.0244140625, -0.0144195556640625, -0.004425048828125, 0.0055694580078125, 0.01556396484375, 0.0255584716796875, 0.035552978515625, 0.0455474853515625, 0.0555419921875, 0.0655364990234375, 0.075531005859375, 0.0855255126953125, 0.09552001953125, 0.1055145263671875, 0.115509033203125, 0.1255035400390625, 0.135498046875, 0.1454925537109375, 0.155487060546875, 0.1654815673828125, 0.17547607421875, 0.1854705810546875, 0.195465087890625, 0.2054595947265625, 0.2154541015625, 0.2254486083984375, 0.235443115234375, 0.2454376220703125, 0.25543212890625, 0.2654266357421875, 0.275421142578125, 0.2854156494140625, 0.29541015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 6.0, 2.0, 5.0, 7.0, 7.0, 5.0, 12.0, 11.0, 18.0, 22.0, 28.0, 30.0, 32.0, 26.0, 25.0, 45.0, 39.0, 25.0, 34.0, 47.0, 41.0, 47.0, 32.0, 50.0, 29.0, 44.0, 37.0, 22.0, 40.0, 35.0, 33.0, 32.0, 19.0, 18.0, 15.0, 14.0, 7.0, 13.0, 7.0, 7.0, 5.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.6171875, -4.46002197265625, -4.3028564453125, -4.14569091796875, -3.988525390625, -3.83135986328125, -3.6741943359375, -3.51702880859375, -3.35986328125, -3.20269775390625, -3.0455322265625, -2.88836669921875, -2.731201171875, -2.57403564453125, -2.4168701171875, -2.25970458984375, -2.1025390625, -1.94537353515625, -1.7882080078125, -1.63104248046875, -1.473876953125, -1.31671142578125, -1.1595458984375, -1.00238037109375, -0.84521484375, -0.68804931640625, -0.5308837890625, -0.37371826171875, -0.216552734375, -0.05938720703125, 0.0977783203125, 0.25494384765625, 0.412109375, 0.56927490234375, 0.7264404296875, 0.88360595703125, 1.040771484375, 1.19793701171875, 1.3551025390625, 1.51226806640625, 1.66943359375, 1.82659912109375, 1.9837646484375, 2.14093017578125, 2.298095703125, 2.45526123046875, 2.6124267578125, 2.76959228515625, 2.9267578125, 3.08392333984375, 3.2410888671875, 3.39825439453125, 3.555419921875, 3.71258544921875, 3.8697509765625, 4.02691650390625, 4.18408203125, 4.34124755859375, 4.4984130859375, 4.65557861328125, 4.812744140625, 4.96990966796875, 5.1270751953125, 5.28424072265625, 5.44140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 9.0, 3.0, 9.0, 8.0, 17.0, 30.0, 44.0, 76.0, 111.0, 178.0, 287.0, 497.0, 815.0, 1613.0, 2979.0, 5959.0, 13825.0, 36361.0, 108812.0, 296404.0, 350445.0, 147977.0, 48731.0, 17778.0, 7648.0, 3568.0, 1834.0, 990.0, 583.0, 328.0, 224.0, 147.0, 93.0, 58.0, 32.0, 27.0, 17.0, 7.0, 5.0, 4.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0611572265625, -0.059416770935058594, -0.05767631530761719, -0.05593585968017578, -0.054195404052734375, -0.05245494842529297, -0.05071449279785156, -0.048974037170410156, -0.04723358154296875, -0.045493125915527344, -0.04375267028808594, -0.04201221466064453, -0.040271759033203125, -0.03853130340576172, -0.03679084777832031, -0.035050392150878906, -0.0333099365234375, -0.031569480895996094, -0.029829025268554688, -0.02808856964111328, -0.026348114013671875, -0.02460765838623047, -0.022867202758789062, -0.021126747131347656, -0.01938629150390625, -0.017645835876464844, -0.015905380249023438, -0.014164924621582031, -0.012424468994140625, -0.010684013366699219, -0.008943557739257812, -0.007203102111816406, -0.005462646484375, -0.0037221908569335938, -0.0019817352294921875, -0.00024127960205078125, 0.001499176025390625, 0.0032396316528320312, 0.0049800872802734375, 0.006720542907714844, 0.00846099853515625, 0.010201454162597656, 0.011941909790039062, 0.013682365417480469, 0.015422821044921875, 0.01716327667236328, 0.018903732299804688, 0.020644187927246094, 0.0223846435546875, 0.024125099182128906, 0.025865554809570312, 0.02760601043701172, 0.029346466064453125, 0.03108692169189453, 0.03282737731933594, 0.034567832946777344, 0.03630828857421875, 0.038048744201660156, 0.03978919982910156, 0.04152965545654297, 0.043270111083984375, 0.04501056671142578, 0.04675102233886719, 0.048491477966308594, 0.05023193359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 2.0, 13.0, 18.0, 18.0, 24.0, 29.0, 37.0, 71.0, 105.0, 111.0, 118.0, 124.0, 89.0, 68.0, 50.0, 27.0, 26.0, 18.0, 16.0, 9.0, 9.0, 2.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010859966278076172, -0.00010605063289403915, -0.00010350160300731659, -0.00010095257312059402, -9.840354323387146e-05, -9.58545133471489e-05, -9.330548346042633e-05, -9.075645357370377e-05, -8.82074236869812e-05, -8.565839380025864e-05, -8.310936391353607e-05, -8.056033402681351e-05, -7.801130414009094e-05, -7.546227425336838e-05, -7.291324436664581e-05, -7.036421447992325e-05, -6.781518459320068e-05, -6.526615470647812e-05, -6.271712481975555e-05, -6.016809493303299e-05, -5.7619065046310425e-05, -5.507003515958786e-05, -5.2521005272865295e-05, -4.997197538614273e-05, -4.7422945499420166e-05, -4.48739156126976e-05, -4.232488572597504e-05, -3.977585583925247e-05, -3.722682595252991e-05, -3.467779606580734e-05, -3.212876617908478e-05, -2.9579736292362213e-05, -2.703070640563965e-05, -2.4481676518917084e-05, -2.193264663219452e-05, -1.9383616745471954e-05, -1.683458685874939e-05, -1.4285556972026825e-05, -1.173652708530426e-05, -9.187497198581696e-06, -6.638467311859131e-06, -4.089437425136566e-06, -1.5404075384140015e-06, 1.0086223483085632e-06, 3.557652235031128e-06, 6.106682121753693e-06, 8.655712008476257e-06, 1.1204741895198822e-05, 1.3753771781921387e-05, 1.630280166864395e-05, 1.8851831555366516e-05, 2.140086144208908e-05, 2.3949891328811646e-05, 2.649892121553421e-05, 2.9047951102256775e-05, 3.159698098897934e-05, 3.4146010875701904e-05, 3.669504076242447e-05, 3.9244070649147034e-05, 4.17931005358696e-05, 4.434213042259216e-05, 4.689116030931473e-05, 4.944019019603729e-05, 5.198922008275986e-05, 5.453824996948242e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 24.0, 11.0, 17.0, 31.0, 50.0, 93.0, 221.0, 687.0, 3211.0, 25030.0, 370956.0, 599088.0, 42810.0, 4749.0, 980.0, 286.0, 116.0, 56.0, 29.0, 24.0, 18.0, 13.0, 15.0, 10.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1195068359375, -0.11509895324707031, -0.11069107055664062, -0.10628318786621094, -0.10187530517578125, -0.09746742248535156, -0.09305953979492188, -0.08865165710449219, -0.0842437744140625, -0.07983589172363281, -0.07542800903320312, -0.07102012634277344, -0.06661224365234375, -0.06220436096191406, -0.057796478271484375, -0.05338859558105469, -0.048980712890625, -0.04457283020019531, -0.040164947509765625, -0.03575706481933594, -0.03134918212890625, -0.026941299438476562, -0.022533416748046875, -0.018125534057617188, -0.0137176513671875, -0.009309768676757812, -0.004901885986328125, -0.0004940032958984375, 0.00391387939453125, 0.008321762084960938, 0.012729644775390625, 0.017137527465820312, 0.02154541015625, 0.025953292846679688, 0.030361175537109375, 0.03476905822753906, 0.03917694091796875, 0.04358482360839844, 0.047992706298828125, 0.05240058898925781, 0.0568084716796875, 0.06121635437011719, 0.06562423706054688, 0.07003211975097656, 0.07444000244140625, 0.07884788513183594, 0.08325576782226562, 0.08766365051269531, 0.092071533203125, 0.09647941589355469, 0.10088729858398438, 0.10529518127441406, 0.10970306396484375, 0.11411094665527344, 0.11851882934570312, 0.12292671203613281, 0.1273345947265625, 0.1317424774169922, 0.13615036010742188, 0.14055824279785156, 0.14496612548828125, 0.14937400817871094, 0.15378189086914062, 0.1581897735595703, 0.16259765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 21.0, 12.0, 35.0, 53.0, 48.0, 60.0, 76.0, 88.0, 76.0, 91.0, 86.0, 72.0, 40.0, 48.0, 40.0, 30.0, 20.0, 15.0, 18.0, 12.0, 4.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0156402587890625, -0.015057086944580078, -0.014473915100097656, -0.013890743255615234, -0.013307571411132812, -0.01272439956665039, -0.012141227722167969, -0.011558055877685547, -0.010974884033203125, -0.010391712188720703, -0.009808540344238281, -0.00922536849975586, -0.008642196655273438, -0.008059024810791016, -0.007475852966308594, -0.006892681121826172, -0.00630950927734375, -0.005726337432861328, -0.005143165588378906, -0.004559993743896484, -0.0039768218994140625, -0.0033936500549316406, -0.0028104782104492188, -0.002227306365966797, -0.001644134521484375, -0.0010609626770019531, -0.00047779083251953125, 0.00010538101196289062, 0.0006885528564453125, 0.0012717247009277344, 0.0018548965454101562, 0.002438068389892578, 0.003021240234375, 0.003604412078857422, 0.004187583923339844, 0.004770755767822266, 0.0053539276123046875, 0.005937099456787109, 0.006520271301269531, 0.007103443145751953, 0.007686614990234375, 0.008269786834716797, 0.008852958679199219, 0.00943613052368164, 0.010019302368164062, 0.010602474212646484, 0.011185646057128906, 0.011768817901611328, 0.01235198974609375, 0.012935161590576172, 0.013518333435058594, 0.014101505279541016, 0.014684677124023438, 0.01526784896850586, 0.01585102081298828, 0.016434192657470703, 0.017017364501953125, 0.017600536346435547, 0.01818370819091797, 0.01876688003540039, 0.019350051879882812, 0.019933223724365234, 0.020516395568847656, 0.021099567413330078, 0.0216827392578125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 16.0, 30.0, 42.0, 86.0, 122.0, 153.0, 144.0, 132.0, 114.0, 92.0, 39.0, 21.0, 3.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.160707473754883, -9.941709518432617, -9.722711563110352, -9.50371265411377, -9.284714698791504, -9.065716743469238, -8.846718788146973, -8.627720832824707, -8.408721923828125, -8.18972396850586, -7.9707255363464355, -7.75172758102417, -7.532729148864746, -7.3137311935424805, -7.094733238220215, -6.875734806060791, -6.656737327575684, -6.437739372253418, -6.218740940093994, -5.9997429847717285, -5.780744552612305, -5.561746597290039, -5.342748641967773, -5.12375020980835, -4.904751777648926, -4.68575382232666, -4.466755390167236, -4.247757434844971, -4.028759002685547, -3.8097610473632812, -3.5907628536224365, -3.371764659881592, -3.152766704559326, -2.9337685108184814, -2.7147703170776367, -2.495772361755371, -2.2767741680145264, -2.0577759742736816, -1.838777780532837, -1.6197797060012817, -1.400781512260437, -1.1817833185195923, -0.9627852439880371, -0.7437870502471924, -0.5247889161109924, -0.3057907819747925, -0.08679258823394775, 0.13220548629760742, 0.35120368003845215, 0.5702018141746521, 0.789199948310852, 1.0081981420516968, 1.227196216583252, 1.4461944103240967, 1.6651926040649414, 1.8841906785964966, 2.103188991546631, 2.3221871852874756, 2.5411853790283203, 2.760183334350586, 2.9791815280914307, 3.1981797218322754, 3.41717791557312, 3.636176109313965, 3.8551740646362305]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 17.0, 9.0, 17.0, 24.0, 19.0, 28.0, 28.0, 31.0, 29.0, 40.0, 35.0, 52.0, 52.0, 50.0, 67.0, 60.0, 57.0, 59.0, 49.0, 53.0, 45.0, 40.0, 27.0, 27.0, 18.0, 14.0, 18.0, 10.0, 4.0, 8.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.067600250244141, -3.964730739593506, -3.861861228942871, -3.7589914798736572, -3.6561219692230225, -3.5532524585723877, -3.450382709503174, -3.347513198852539, -3.2446436882019043, -3.1417741775512695, -3.0389046669006348, -2.936034917831421, -2.833165407180786, -2.7302958965301514, -2.6274261474609375, -2.5245566368103027, -2.421687126159668, -2.318817615509033, -2.2159481048583984, -2.1130783557891846, -2.01020884513855, -1.907339334487915, -1.8044697046279907, -1.7016000747680664, -1.5987305641174316, -1.4958610534667969, -1.3929914236068726, -1.2901217937469482, -1.1872522830963135, -1.0843827724456787, -0.9815131425857544, -0.8786435723304749, -0.7757737636566162, -0.6729041934013367, -0.5700346231460571, -0.4671650528907776, -0.36429548263549805, -0.2614259123802185, -0.15855634212493896, -0.055686771869659424, 0.04718279838562012, 0.15005236864089966, 0.2529219388961792, 0.35579150915145874, 0.4586610794067383, 0.5615306496620178, 0.6644002199172974, 0.7672697901725769, 0.8701393604278564, 0.973008930683136, 1.0758785009384155, 1.1787481307983398, 1.2816176414489746, 1.3844871520996094, 1.4873567819595337, 1.590226411819458, 1.6930959224700928, 1.7959654331207275, 1.8988350629806519, 2.001704692840576, 2.104574203491211, 2.2074437141418457, 2.3103132247924805, 2.4131829738616943, 2.516052484512329]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 3.0, 10.0, 7.0, 11.0, 21.0, 24.0, 30.0, 47.0, 64.0, 157.0, 662.0, 4649.0, 58897.0, 504056.0, 431860.0, 43327.0, 3703.0, 583.0, 177.0, 70.0, 47.0, 28.0, 21.0, 25.0, 15.0, 12.0, 7.0, 7.0, 7.0, 8.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4921875, -8.25592041015625, -8.0196533203125, -7.78338623046875, -7.547119140625, -7.31085205078125, -7.0745849609375, -6.83831787109375, -6.60205078125, -6.36578369140625, -6.1295166015625, -5.89324951171875, -5.656982421875, -5.42071533203125, -5.1844482421875, -4.94818115234375, -4.7119140625, -4.47564697265625, -4.2393798828125, -4.00311279296875, -3.766845703125, -3.53057861328125, -3.2943115234375, -3.05804443359375, -2.82177734375, -2.58551025390625, -2.3492431640625, -2.11297607421875, -1.876708984375, -1.64044189453125, -1.4041748046875, -1.16790771484375, -0.931640625, -0.69537353515625, -0.4591064453125, -0.22283935546875, 0.013427734375, 0.24969482421875, 0.4859619140625, 0.72222900390625, 0.95849609375, 1.19476318359375, 1.4310302734375, 1.66729736328125, 1.903564453125, 2.13983154296875, 2.3760986328125, 2.61236572265625, 2.8486328125, 3.08489990234375, 3.3211669921875, 3.55743408203125, 3.793701171875, 4.02996826171875, 4.2662353515625, 4.50250244140625, 4.73876953125, 4.97503662109375, 5.2113037109375, 5.44757080078125, 5.683837890625, 5.92010498046875, 6.1563720703125, 6.39263916015625, 6.62890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 13.0, 11.0, 12.0, 21.0, 27.0, 27.0, 26.0, 25.0, 21.0, 34.0, 37.0, 42.0, 44.0, 47.0, 47.0, 47.0, 46.0, 46.0, 57.0, 54.0, 38.0, 39.0, 29.0, 35.0, 27.0, 25.0, 24.0, 17.0, 15.0, 12.0, 4.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.18359375, -5.02825927734375, -4.8729248046875, -4.71759033203125, -4.562255859375, -4.40692138671875, -4.2515869140625, -4.09625244140625, -3.94091796875, -3.78558349609375, -3.6302490234375, -3.47491455078125, -3.319580078125, -3.16424560546875, -3.0089111328125, -2.85357666015625, -2.6982421875, -2.54290771484375, -2.3875732421875, -2.23223876953125, -2.076904296875, -1.92156982421875, -1.7662353515625, -1.61090087890625, -1.45556640625, -1.30023193359375, -1.1448974609375, -0.98956298828125, -0.834228515625, -0.67889404296875, -0.5235595703125, -0.36822509765625, -0.212890625, -0.05755615234375, 0.0977783203125, 0.25311279296875, 0.408447265625, 0.56378173828125, 0.7191162109375, 0.87445068359375, 1.02978515625, 1.18511962890625, 1.3404541015625, 1.49578857421875, 1.651123046875, 1.80645751953125, 1.9617919921875, 2.11712646484375, 2.2724609375, 2.42779541015625, 2.5831298828125, 2.73846435546875, 2.893798828125, 3.04913330078125, 3.2044677734375, 3.35980224609375, 3.51513671875, 3.67047119140625, 3.8258056640625, 3.98114013671875, 4.136474609375, 4.29180908203125, 4.4471435546875, 4.60247802734375, 4.7578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 6.0, 10.0, 9.0, 9.0, 10.0, 21.0, 20.0, 34.0, 45.0, 57.0, 82.0, 92.0, 142.0, 150.0, 228.0, 288.0, 570.0, 3701.0, 209477.0, 801207.0, 29750.0, 1144.0, 439.0, 292.0, 177.0, 147.0, 111.0, 63.0, 68.0, 55.0, 45.0, 38.0, 23.0, 10.0, 10.0, 9.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6171875, -11.2572021484375, -10.897216796875, -10.5372314453125, -10.17724609375, -9.8172607421875, -9.457275390625, -9.0972900390625, -8.7373046875, -8.3773193359375, -8.017333984375, -7.6573486328125, -7.29736328125, -6.9373779296875, -6.577392578125, -6.2174072265625, -5.857421875, -5.4974365234375, -5.137451171875, -4.7774658203125, -4.41748046875, -4.0574951171875, -3.697509765625, -3.3375244140625, -2.9775390625, -2.6175537109375, -2.257568359375, -1.8975830078125, -1.53759765625, -1.1776123046875, -0.817626953125, -0.4576416015625, -0.09765625, 0.2623291015625, 0.622314453125, 0.9822998046875, 1.34228515625, 1.7022705078125, 2.062255859375, 2.4222412109375, 2.7822265625, 3.1422119140625, 3.502197265625, 3.8621826171875, 4.22216796875, 4.5821533203125, 4.942138671875, 5.3021240234375, 5.662109375, 6.0220947265625, 6.382080078125, 6.7420654296875, 7.10205078125, 7.4620361328125, 7.822021484375, 8.1820068359375, 8.5419921875, 8.9019775390625, 9.261962890625, 9.6219482421875, 9.98193359375, 10.3419189453125, 10.701904296875, 11.0618896484375, 11.421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 8.0, 13.0, 7.0, 7.0, 14.0, 11.0, 9.0, 18.0, 18.0, 21.0, 16.0, 28.0, 21.0, 36.0, 42.0, 31.0, 45.0, 37.0, 41.0, 48.0, 44.0, 53.0, 27.0, 42.0, 42.0, 33.0, 45.0, 37.0, 31.0, 28.0, 30.0, 18.0, 19.0, 18.0, 13.0, 13.0, 8.0, 5.0, 3.0, 6.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.578125, -4.42706298828125, -4.2760009765625, -4.12493896484375, -3.973876953125, -3.82281494140625, -3.6717529296875, -3.52069091796875, -3.36962890625, -3.21856689453125, -3.0675048828125, -2.91644287109375, -2.765380859375, -2.61431884765625, -2.4632568359375, -2.31219482421875, -2.1611328125, -2.01007080078125, -1.8590087890625, -1.70794677734375, -1.556884765625, -1.40582275390625, -1.2547607421875, -1.10369873046875, -0.95263671875, -0.80157470703125, -0.6505126953125, -0.49945068359375, -0.348388671875, -0.19732666015625, -0.0462646484375, 0.10479736328125, 0.255859375, 0.40692138671875, 0.5579833984375, 0.70904541015625, 0.860107421875, 1.01116943359375, 1.1622314453125, 1.31329345703125, 1.46435546875, 1.61541748046875, 1.7664794921875, 1.91754150390625, 2.068603515625, 2.21966552734375, 2.3707275390625, 2.52178955078125, 2.6728515625, 2.82391357421875, 2.9749755859375, 3.12603759765625, 3.277099609375, 3.42816162109375, 3.5792236328125, 3.73028564453125, 3.88134765625, 4.03240966796875, 4.1834716796875, 4.33453369140625, 4.485595703125, 4.63665771484375, 4.7877197265625, 4.93878173828125, 5.08984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 13.0, 15.0, 23.0, 44.0, 100.0, 233.0, 373.0, 1159.0, 9158.0, 488528.0, 537224.0, 9615.0, 1294.0, 374.0, 177.0, 89.0, 48.0, 30.0, 15.0, 8.0, 7.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.76953125, -4.62506103515625, -4.4805908203125, -4.33612060546875, -4.191650390625, -4.04718017578125, -3.9027099609375, -3.75823974609375, -3.61376953125, -3.46929931640625, -3.3248291015625, -3.18035888671875, -3.035888671875, -2.89141845703125, -2.7469482421875, -2.60247802734375, -2.4580078125, -2.31353759765625, -2.1690673828125, -2.02459716796875, -1.880126953125, -1.73565673828125, -1.5911865234375, -1.44671630859375, -1.30224609375, -1.15777587890625, -1.0133056640625, -0.86883544921875, -0.724365234375, -0.57989501953125, -0.4354248046875, -0.29095458984375, -0.146484375, -0.00201416015625, 0.1424560546875, 0.28692626953125, 0.431396484375, 0.57586669921875, 0.7203369140625, 0.86480712890625, 1.00927734375, 1.15374755859375, 1.2982177734375, 1.44268798828125, 1.587158203125, 1.73162841796875, 1.8760986328125, 2.02056884765625, 2.1650390625, 2.30950927734375, 2.4539794921875, 2.59844970703125, 2.742919921875, 2.88739013671875, 3.0318603515625, 3.17633056640625, 3.32080078125, 3.46527099609375, 3.6097412109375, 3.75421142578125, 3.898681640625, 4.04315185546875, 4.1876220703125, 4.33209228515625, 4.4765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 11.0, 19.0, 30.0, 54.0, 107.0, 152.0, 167.0, 168.0, 104.0, 88.0, 44.0, 18.0, 19.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034332275390625, -0.00032749027013778687, -0.00031165778636932373, -0.0002958253026008606, -0.00027999281883239746, -0.0002641603350639343, -0.0002483278512954712, -0.00023249536752700806, -0.00021666288375854492, -0.0002008303999900818, -0.00018499791622161865, -0.00016916543245315552, -0.00015333294868469238, -0.00013750046491622925, -0.00012166798114776611, -0.00010583549737930298, -9.000301361083984e-05, -7.417052984237671e-05, -5.8338046073913574e-05, -4.250556230545044e-05, -2.6673078536987305e-05, -1.084059476852417e-05, 4.991888999938965e-06, 2.08243727684021e-05, 3.6656856536865234e-05, 5.248934030532837e-05, 6.83218240737915e-05, 8.415430784225464e-05, 9.998679161071777e-05, 0.00011581927537918091, 0.00013165175914764404, 0.00014748424291610718, 0.0001633167266845703, 0.00017914921045303345, 0.00019498169422149658, 0.00021081417798995972, 0.00022664666175842285, 0.00024247914552688599, 0.0002583116292953491, 0.00027414411306381226, 0.0002899765968322754, 0.0003058090806007385, 0.00032164156436920166, 0.0003374740481376648, 0.00035330653190612793, 0.00036913901567459106, 0.0003849714994430542, 0.00040080398321151733, 0.00041663646697998047, 0.0004324689507484436, 0.00044830143451690674, 0.0004641339182853699, 0.000479966402053833, 0.0004957988858222961, 0.0005116313695907593, 0.0005274638533592224, 0.0005432963371276855, 0.0005591288208961487, 0.0005749613046646118, 0.000590793788433075, 0.0006066262722015381, 0.0006224587559700012, 0.0006382912397384644, 0.0006541237235069275, 0.0006699562072753906]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 5.0, 6.0, 9.0, 13.0, 14.0, 18.0, 42.0, 77.0, 108.0, 195.0, 583.0, 4027.0, 144940.0, 882042.0, 14351.0, 1375.0, 351.0, 146.0, 90.0, 45.0, 28.0, 26.0, 13.0, 11.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.27642822265625, -5.1075439453125, -4.93865966796875, -4.769775390625, -4.60089111328125, -4.4320068359375, -4.26312255859375, -4.09423828125, -3.92535400390625, -3.7564697265625, -3.58758544921875, -3.418701171875, -3.24981689453125, -3.0809326171875, -2.91204833984375, -2.7431640625, -2.57427978515625, -2.4053955078125, -2.23651123046875, -2.067626953125, -1.89874267578125, -1.7298583984375, -1.56097412109375, -1.39208984375, -1.22320556640625, -1.0543212890625, -0.88543701171875, -0.716552734375, -0.54766845703125, -0.3787841796875, -0.20989990234375, -0.041015625, 0.12786865234375, 0.2967529296875, 0.46563720703125, 0.634521484375, 0.80340576171875, 0.9722900390625, 1.14117431640625, 1.31005859375, 1.47894287109375, 1.6478271484375, 1.81671142578125, 1.985595703125, 2.15447998046875, 2.3233642578125, 2.49224853515625, 2.6611328125, 2.83001708984375, 2.9989013671875, 3.16778564453125, 3.336669921875, 3.50555419921875, 3.6744384765625, 3.84332275390625, 4.01220703125, 4.18109130859375, 4.3499755859375, 4.51885986328125, 4.687744140625, 4.85662841796875, 5.0255126953125, 5.19439697265625, 5.36328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 15.0, 16.0, 35.0, 41.0, 61.0, 75.0, 102.0, 112.0, 120.0, 111.0, 89.0, 66.0, 48.0, 25.0, 17.0, 10.0, 11.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99365234375, -0.9593582153320312, -0.9250640869140625, -0.8907699584960938, -0.856475830078125, -0.8221817016601562, -0.7878875732421875, -0.7535934448242188, -0.71929931640625, -0.6850051879882812, -0.6507110595703125, -0.6164169311523438, -0.582122802734375, -0.5478286743164062, -0.5135345458984375, -0.47924041748046875, -0.4449462890625, -0.41065216064453125, -0.3763580322265625, -0.34206390380859375, -0.307769775390625, -0.27347564697265625, -0.2391815185546875, -0.20488739013671875, -0.17059326171875, -0.13629913330078125, -0.1020050048828125, -0.06771087646484375, -0.033416748046875, 0.00087738037109375, 0.0351715087890625, 0.06946563720703125, 0.103759765625, 0.13805389404296875, 0.1723480224609375, 0.20664215087890625, 0.240936279296875, 0.27523040771484375, 0.3095245361328125, 0.34381866455078125, 0.37811279296875, 0.41240692138671875, 0.4467010498046875, 0.48099517822265625, 0.515289306640625, 0.5495834350585938, 0.5838775634765625, 0.6181716918945312, 0.6524658203125, 0.6867599487304688, 0.7210540771484375, 0.7553482055664062, 0.789642333984375, 0.8239364624023438, 0.8582305908203125, 0.8925247192382812, 0.92681884765625, 0.9611129760742188, 0.9954071044921875, 1.0297012329101562, 1.063995361328125, 1.0982894897460938, 1.1325836181640625, 1.1668777465820312, 1.201171875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 16.0, 14.0, 11.0, 16.0, 30.0, 38.0, 50.0, 66.0, 59.0, 76.0, 86.0, 94.0, 86.0, 82.0, 69.0, 51.0, 44.0, 38.0, 25.0, 9.0, 11.0, 12.0, 5.0, 6.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.144302368164062, -9.90947437286377, -9.674646377563477, -9.439818382263184, -9.20499038696289, -8.970162391662598, -8.735334396362305, -8.500506401062012, -8.265678405761719, -8.030850410461426, -7.796022415161133, -7.56119441986084, -7.326366424560547, -7.091538429260254, -6.856710433959961, -6.621882915496826, -6.387055397033691, -6.152227401733398, -5.9173994064331055, -5.6825714111328125, -5.4477434158325195, -5.212915420532227, -4.978087425231934, -4.743259906768799, -4.508431434631348, -4.273603439331055, -4.038775444030762, -3.8039474487304688, -3.569119691848755, -3.334291696548462, -3.099463701248169, -2.864635944366455, -2.629807949066162, -2.394979953765869, -2.160151958465576, -1.9253240823745728, -1.6904962062835693, -1.4556682109832764, -1.2208402156829834, -0.98601233959198, -0.751184344291687, -0.5163564085960388, -0.28152844309806824, -0.046700477600097656, 0.18812745809555054, 0.42295539379119873, 0.6577833890914917, 0.8926112651824951, 1.127439260482788, 1.362267255783081, 1.5970951318740845, 1.8319231271743774, 2.066751003265381, 2.301578998565674, 2.536406993865967, 2.7712349891662598, 3.0060629844665527, 3.2408909797668457, 3.4757189750671387, 3.7105469703674316, 3.9453747272491455, 4.180202484130859, 4.415030479431152, 4.649858474731445, 4.884686470031738]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 5.0, 4.0, 3.0, 8.0, 9.0, 9.0, 9.0, 17.0, 12.0, 14.0, 15.0, 16.0, 24.0, 24.0, 19.0, 23.0, 30.0, 30.0, 28.0, 36.0, 35.0, 30.0, 37.0, 37.0, 48.0, 38.0, 36.0, 45.0, 37.0, 34.0, 48.0, 32.0, 21.0, 27.0, 34.0, 24.0, 22.0, 14.0, 15.0, 10.0, 12.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.59603214263916, -7.35667085647583, -7.117309093475342, -6.877947807312012, -6.638586044311523, -6.399224758148193, -6.159863471984863, -5.920501708984375, -5.681139945983887, -5.441778659820557, -5.202416896820068, -4.963055610656738, -4.72369384765625, -4.48433256149292, -4.24497127532959, -4.005609512329102, -3.7662482261657715, -3.5268867015838623, -3.287525177001953, -3.048163890838623, -2.8088021278381348, -2.5694408416748047, -2.3300793170928955, -2.0907177925109863, -1.8513562679290771, -1.611994743347168, -1.3726332187652588, -1.1332718133926392, -0.89391028881073, -0.6545487642288208, -0.41518735885620117, -0.175825834274292, 0.06353569030761719, 0.302897185087204, 0.5422586798667908, 0.7816201448440552, 1.0209816694259644, 1.2603431940078735, 1.4997045993804932, 1.7390661239624023, 1.9784276485443115, 2.2177891731262207, 2.45715069770813, 2.696512222290039, 2.935873508453369, 3.1752352714538574, 3.4145965576171875, 3.6539580821990967, 3.893319606781006, 4.132680892944336, 4.372042655944824, 4.611403942108154, 4.850765705108643, 5.090126991271973, 5.329488754272461, 5.568850040435791, 5.808211326599121, 6.047572612762451, 6.2869343757629395, 6.5262956619262695, 6.765657424926758, 7.005018711090088, 7.244379997253418, 7.483741760253906, 7.7231035232543945]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 5.0, 9.0, 12.0, 13.0, 22.0, 27.0, 44.0, 41.0, 67.0, 96.0, 114.0, 159.0, 235.0, 364.0, 897.0, 4041.0, 36543.0, 520048.0, 2663959.0, 891779.0, 66961.0, 6225.0, 1182.0, 450.0, 258.0, 199.0, 131.0, 88.0, 72.0, 56.0, 35.0, 22.0, 26.0, 13.0, 23.0, 14.0, 11.0, 8.0, 5.0, 7.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.1328125, -7.89080810546875, -7.6488037109375, -7.40679931640625, -7.164794921875, -6.92279052734375, -6.6807861328125, -6.43878173828125, -6.19677734375, -5.95477294921875, -5.7127685546875, -5.47076416015625, -5.228759765625, -4.98675537109375, -4.7447509765625, -4.50274658203125, -4.2607421875, -4.01873779296875, -3.7767333984375, -3.53472900390625, -3.292724609375, -3.05072021484375, -2.8087158203125, -2.56671142578125, -2.32470703125, -2.08270263671875, -1.8406982421875, -1.59869384765625, -1.356689453125, -1.11468505859375, -0.8726806640625, -0.63067626953125, -0.388671875, -0.14666748046875, 0.0953369140625, 0.33734130859375, 0.579345703125, 0.82135009765625, 1.0633544921875, 1.30535888671875, 1.54736328125, 1.78936767578125, 2.0313720703125, 2.27337646484375, 2.515380859375, 2.75738525390625, 2.9993896484375, 3.24139404296875, 3.4833984375, 3.72540283203125, 3.9674072265625, 4.20941162109375, 4.451416015625, 4.69342041015625, 4.9354248046875, 5.17742919921875, 5.41943359375, 5.66143798828125, 5.9034423828125, 6.14544677734375, 6.387451171875, 6.62945556640625, 6.8714599609375, 7.11346435546875, 7.35546875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 9.0, 6.0, 13.0, 13.0, 9.0, 17.0, 16.0, 16.0, 30.0, 25.0, 28.0, 22.0, 32.0, 29.0, 37.0, 30.0, 27.0, 48.0, 41.0, 42.0, 38.0, 56.0, 45.0, 49.0, 54.0, 36.0, 39.0, 30.0, 31.0, 23.0, 21.0, 20.0, 15.0, 10.0, 13.0, 5.0, 9.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.507537841796875, -3.38812255859375, -3.268707275390625, -3.1492919921875, -3.029876708984375, -2.91046142578125, -2.791046142578125, -2.671630859375, -2.552215576171875, -2.43280029296875, -2.313385009765625, -2.1939697265625, -2.074554443359375, -1.95513916015625, -1.835723876953125, -1.71630859375, -1.596893310546875, -1.47747802734375, -1.358062744140625, -1.2386474609375, -1.119232177734375, -0.99981689453125, -0.880401611328125, -0.760986328125, -0.641571044921875, -0.52215576171875, -0.402740478515625, -0.2833251953125, -0.163909912109375, -0.04449462890625, 0.074920654296875, 0.1943359375, 0.313751220703125, 0.43316650390625, 0.552581787109375, 0.6719970703125, 0.791412353515625, 0.91082763671875, 1.030242919921875, 1.149658203125, 1.269073486328125, 1.38848876953125, 1.507904052734375, 1.6273193359375, 1.746734619140625, 1.86614990234375, 1.985565185546875, 2.10498046875, 2.224395751953125, 2.34381103515625, 2.463226318359375, 2.5826416015625, 2.702056884765625, 2.82147216796875, 2.940887451171875, 3.060302734375, 3.179718017578125, 3.29913330078125, 3.418548583984375, 3.5379638671875, 3.657379150390625, 3.77679443359375, 3.896209716796875, 4.015625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 14.0, 16.0, 29.0, 39.0, 70.0, 102.0, 269.0, 490.0, 1132.0, 3714.0, 107628.0, 3957419.0, 117314.0, 3872.0, 1122.0, 471.0, 221.0, 147.0, 69.0, 45.0, 27.0, 17.0, 20.0, 11.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.544677734375, -9.12060546875, -8.696533203125, -8.2724609375, -7.848388671875, -7.42431640625, -7.000244140625, -6.576171875, -6.152099609375, -5.72802734375, -5.303955078125, -4.8798828125, -4.455810546875, -4.03173828125, -3.607666015625, -3.18359375, -2.759521484375, -2.33544921875, -1.911376953125, -1.4873046875, -1.063232421875, -0.63916015625, -0.215087890625, 0.208984375, 0.633056640625, 1.05712890625, 1.481201171875, 1.9052734375, 2.329345703125, 2.75341796875, 3.177490234375, 3.6015625, 4.025634765625, 4.44970703125, 4.873779296875, 5.2978515625, 5.721923828125, 6.14599609375, 6.570068359375, 6.994140625, 7.418212890625, 7.84228515625, 8.266357421875, 8.6904296875, 9.114501953125, 9.53857421875, 9.962646484375, 10.38671875, 10.810791015625, 11.23486328125, 11.658935546875, 12.0830078125, 12.507080078125, 12.93115234375, 13.355224609375, 13.779296875, 14.203369140625, 14.62744140625, 15.051513671875, 15.4755859375, 15.899658203125, 16.32373046875, 16.747802734375, 17.171875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 9.0, 16.0, 24.0, 22.0, 39.0, 58.0, 83.0, 130.0, 178.0, 284.0, 385.0, 461.0, 555.0, 472.0, 430.0, 290.0, 220.0, 141.0, 97.0, 55.0, 31.0, 28.0, 19.0, 13.0, 6.0, 4.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.66796875, -2.606658935546875, -2.54534912109375, -2.484039306640625, -2.4227294921875, -2.361419677734375, -2.30010986328125, -2.238800048828125, -2.177490234375, -2.116180419921875, -2.05487060546875, -1.993560791015625, -1.9322509765625, -1.870941162109375, -1.80963134765625, -1.748321533203125, -1.68701171875, -1.625701904296875, -1.56439208984375, -1.503082275390625, -1.4417724609375, -1.380462646484375, -1.31915283203125, -1.257843017578125, -1.196533203125, -1.135223388671875, -1.07391357421875, -1.012603759765625, -0.9512939453125, -0.889984130859375, -0.82867431640625, -0.767364501953125, -0.7060546875, -0.644744873046875, -0.58343505859375, -0.522125244140625, -0.4608154296875, -0.399505615234375, -0.33819580078125, -0.276885986328125, -0.215576171875, -0.154266357421875, -0.09295654296875, -0.031646728515625, 0.0296630859375, 0.090972900390625, 0.15228271484375, 0.213592529296875, 0.27490234375, 0.336212158203125, 0.39752197265625, 0.458831787109375, 0.5201416015625, 0.581451416015625, 0.64276123046875, 0.704071044921875, 0.765380859375, 0.826690673828125, 0.88800048828125, 0.949310302734375, 1.0106201171875, 1.071929931640625, 1.13323974609375, 1.194549560546875, 1.255859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 6.0, 15.0, 37.0, 55.0, 116.0, 163.0, 180.0, 173.0, 119.0, 72.0, 45.0, 13.0, 13.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.672292709350586, -13.251670837402344, -12.831049919128418, -12.410428047180176, -11.989806175231934, -11.569185256958008, -11.148563385009766, -10.727941513061523, -10.307319641113281, -9.886697769165039, -9.466076850891113, -9.045454978942871, -8.624833106994629, -8.204212188720703, -7.783590316772461, -7.362968444824219, -6.942347049713135, -6.521725654602051, -6.101103782653809, -5.680482387542725, -5.259860515594482, -4.839239120483398, -4.418617248535156, -3.9979958534240723, -3.577374219894409, -3.156752586364746, -2.736130952835083, -2.31550931930542, -1.8948878049850464, -1.4742662906646729, -1.0536446571350098, -0.6330230236053467, -0.2124013900756836, 0.2082202136516571, 0.6288418173789978, 1.0494633913040161, 1.4700850248336792, 1.8907065391540527, 2.311328172683716, 2.731949806213379, 3.152571439743042, 3.573193073272705, 3.993814706802368, 4.414436340332031, 4.835057735443115, 5.255679130554199, 5.676301002502441, 6.096922874450684, 6.517544269561768, 6.938165664672852, 7.358787536621094, 7.779408931732178, 8.200030326843262, 8.620652198791504, 9.041274070739746, 9.461894989013672, 9.882516860961914, 10.303138732910156, 10.723759651184082, 11.144381523132324, 11.565003395080566, 11.985624313354492, 12.406246185302734, 12.826868057250977, 13.247489929199219]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 5.0, 4.0, 11.0, 17.0, 22.0, 17.0, 18.0, 24.0, 29.0, 20.0, 23.0, 29.0, 36.0, 36.0, 29.0, 40.0, 37.0, 49.0, 46.0, 56.0, 42.0, 40.0, 46.0, 36.0, 49.0, 28.0, 36.0, 23.0, 30.0, 20.0, 19.0, 18.0, 16.0, 7.0, 5.0, 10.0, 10.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.525993824005127, -3.3983798027038574, -3.270765781402588, -3.1431517601013184, -3.015537738800049, -2.8879237174987793, -2.7603094577789307, -2.632695436477661, -2.5050814151763916, -2.377467393875122, -2.2498533725738525, -2.122239351272583, -1.994625210762024, -1.8670111894607544, -1.7393970489501953, -1.6117830276489258, -1.4841690063476562, -1.3565549850463867, -1.2289409637451172, -1.101326823234558, -0.9737128019332886, -0.846098780632019, -0.7184846997261047, -0.5908706188201904, -0.4632565975189209, -0.335642546415329, -0.20802849531173706, -0.08041444420814514, 0.04719960689544678, 0.1748136281967163, 0.3024277091026306, 0.4300417900085449, 0.5576558113098145, 0.685269832611084, 0.8128839135169983, 0.9404979944229126, 1.0681120157241821, 1.1957260370254517, 1.3233401775360107, 1.4509541988372803, 1.5785682201385498, 1.7061822414398193, 1.8337962627410889, 1.961410403251648, 2.089024543762207, 2.2166385650634766, 2.344252586364746, 2.4718666076660156, 2.599480628967285, 2.7270946502685547, 2.854708671569824, 2.9823226928710938, 3.1099367141723633, 3.237550735473633, 3.3651649951934814, 3.492779016494751, 3.6203930377960205, 3.74800705909729, 3.8756210803985596, 4.003235340118408, 4.130849361419678, 4.258463382720947, 4.386077404022217, 4.513691425323486, 4.641305446624756]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 10.0, 11.0, 12.0, 21.0, 30.0, 47.0, 73.0, 118.0, 172.0, 323.0, 532.0, 1059.0, 2108.0, 4655.0, 11643.0, 30944.0, 83954.0, 208795.0, 329231.0, 225459.0, 92658.0, 33966.0, 12675.0, 5124.0, 2335.0, 1112.0, 596.0, 342.0, 197.0, 123.0, 70.0, 62.0, 35.0, 18.0, 14.0, 11.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61328125, -0.595001220703125, -0.57672119140625, -0.558441162109375, -0.5401611328125, -0.521881103515625, -0.50360107421875, -0.485321044921875, -0.467041015625, -0.448760986328125, -0.43048095703125, -0.412200927734375, -0.3939208984375, -0.375640869140625, -0.35736083984375, -0.339080810546875, -0.32080078125, -0.302520751953125, -0.28424072265625, -0.265960693359375, -0.2476806640625, -0.229400634765625, -0.21112060546875, -0.192840576171875, -0.174560546875, -0.156280517578125, -0.13800048828125, -0.119720458984375, -0.1014404296875, -0.083160400390625, -0.06488037109375, -0.046600341796875, -0.0283203125, -0.010040283203125, 0.00823974609375, 0.026519775390625, 0.0447998046875, 0.063079833984375, 0.08135986328125, 0.099639892578125, 0.117919921875, 0.136199951171875, 0.15447998046875, 0.172760009765625, 0.1910400390625, 0.209320068359375, 0.22760009765625, 0.245880126953125, 0.26416015625, 0.282440185546875, 0.30072021484375, 0.319000244140625, 0.3372802734375, 0.355560302734375, 0.37384033203125, 0.392120361328125, 0.410400390625, 0.428680419921875, 0.44696044921875, 0.465240478515625, 0.4835205078125, 0.501800537109375, 0.52008056640625, 0.538360595703125, 0.556640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 13.0, 13.0, 21.0, 20.0, 29.0, 19.0, 30.0, 39.0, 34.0, 36.0, 42.0, 50.0, 54.0, 41.0, 61.0, 53.0, 61.0, 58.0, 48.0, 49.0, 40.0, 42.0, 29.0, 17.0, 15.0, 15.0, 17.0, 16.0, 10.0, 9.0, 1.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.57379150390625, -2.4639892578125, -2.35418701171875, -2.244384765625, -2.13458251953125, -2.0247802734375, -1.91497802734375, -1.80517578125, -1.69537353515625, -1.5855712890625, -1.47576904296875, -1.365966796875, -1.25616455078125, -1.1463623046875, -1.03656005859375, -0.9267578125, -0.81695556640625, -0.7071533203125, -0.59735107421875, -0.487548828125, -0.37774658203125, -0.2679443359375, -0.15814208984375, -0.04833984375, 0.06146240234375, 0.1712646484375, 0.28106689453125, 0.390869140625, 0.50067138671875, 0.6104736328125, 0.72027587890625, 0.830078125, 0.93988037109375, 1.0496826171875, 1.15948486328125, 1.269287109375, 1.37908935546875, 1.4888916015625, 1.59869384765625, 1.70849609375, 1.81829833984375, 1.9281005859375, 2.03790283203125, 2.147705078125, 2.25750732421875, 2.3673095703125, 2.47711181640625, 2.5869140625, 2.69671630859375, 2.8065185546875, 2.91632080078125, 3.026123046875, 3.13592529296875, 3.2457275390625, 3.35552978515625, 3.46533203125, 3.57513427734375, 3.6849365234375, 3.79473876953125, 3.904541015625, 4.01434326171875, 4.1241455078125, 4.23394775390625, 4.34375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 13.0, 20.0, 31.0, 50.0, 100.0, 185.0, 440.0, 934.0, 2126.0, 4938.0, 10851.0, 23727.0, 51615.0, 103441.0, 178520.0, 233081.0, 200045.0, 122063.0, 62455.0, 29608.0, 13504.0, 5959.0, 2700.0, 1161.0, 494.0, 237.0, 100.0, 65.0, 28.0, 17.0, 10.0, 7.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.319091796875, -0.3079490661621094, -0.29680633544921875, -0.2856636047363281, -0.2745208740234375, -0.2633781433105469, -0.25223541259765625, -0.24109268188476562, -0.229949951171875, -0.21880722045898438, -0.20766448974609375, -0.19652175903320312, -0.1853790283203125, -0.17423629760742188, -0.16309356689453125, -0.15195083618164062, -0.14080810546875, -0.12966537475585938, -0.11852264404296875, -0.10737991333007812, -0.0962371826171875, -0.08509445190429688, -0.07395172119140625, -0.06280899047851562, -0.051666259765625, -0.040523529052734375, -0.02938079833984375, -0.018238067626953125, -0.0070953369140625, 0.004047393798828125, 0.01519012451171875, 0.026332855224609375, 0.0374755859375, 0.048618316650390625, 0.05976104736328125, 0.07090377807617188, 0.0820465087890625, 0.09318923950195312, 0.10433197021484375, 0.11547470092773438, 0.126617431640625, 0.13776016235351562, 0.14890289306640625, 0.16004562377929688, 0.1711883544921875, 0.18233108520507812, 0.19347381591796875, 0.20461654663085938, 0.21575927734375, 0.22690200805664062, 0.23804473876953125, 0.24918746948242188, 0.2603302001953125, 0.2714729309082031, 0.28261566162109375, 0.2937583923339844, 0.304901123046875, 0.3160438537597656, 0.32718658447265625, 0.3383293151855469, 0.3494720458984375, 0.3606147766113281, 0.37175750732421875, 0.3829002380371094, 0.39404296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 10.0, 4.0, 10.0, 11.0, 11.0, 17.0, 18.0, 22.0, 20.0, 27.0, 32.0, 34.0, 54.0, 61.0, 34.0, 37.0, 46.0, 46.0, 47.0, 57.0, 50.0, 39.0, 36.0, 49.0, 39.0, 31.0, 26.0, 25.0, 11.0, 22.0, 10.0, 13.0, 12.0, 12.0, 7.0, 2.0, 2.0, 8.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.22265625, -6.0350341796875, -5.847412109375, -5.6597900390625, -5.47216796875, -5.2845458984375, -5.096923828125, -4.9093017578125, -4.7216796875, -4.5340576171875, -4.346435546875, -4.1588134765625, -3.97119140625, -3.7835693359375, -3.595947265625, -3.4083251953125, -3.220703125, -3.0330810546875, -2.845458984375, -2.6578369140625, -2.47021484375, -2.2825927734375, -2.094970703125, -1.9073486328125, -1.7197265625, -1.5321044921875, -1.344482421875, -1.1568603515625, -0.96923828125, -0.7816162109375, -0.593994140625, -0.4063720703125, -0.21875, -0.0311279296875, 0.156494140625, 0.3441162109375, 0.53173828125, 0.7193603515625, 0.906982421875, 1.0946044921875, 1.2822265625, 1.4698486328125, 1.657470703125, 1.8450927734375, 2.03271484375, 2.2203369140625, 2.407958984375, 2.5955810546875, 2.783203125, 2.9708251953125, 3.158447265625, 3.3460693359375, 3.53369140625, 3.7213134765625, 3.908935546875, 4.0965576171875, 4.2841796875, 4.4718017578125, 4.659423828125, 4.8470458984375, 5.03466796875, 5.2222900390625, 5.409912109375, 5.5975341796875, 5.78515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 12.0, 13.0, 28.0, 30.0, 58.0, 112.0, 172.0, 251.0, 441.0, 597.0, 1071.0, 2083.0, 4085.0, 8684.0, 21257.0, 62843.0, 215208.0, 444229.0, 194137.0, 56897.0, 19597.0, 8229.0, 3901.0, 1929.0, 1113.0, 556.0, 353.0, 236.0, 147.0, 96.0, 58.0, 45.0, 25.0, 17.0, 13.0, 13.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08587646484375, -0.08323097229003906, -0.08058547973632812, -0.07793998718261719, -0.07529449462890625, -0.07264900207519531, -0.07000350952148438, -0.06735801696777344, -0.0647125244140625, -0.06206703186035156, -0.059421539306640625, -0.05677604675292969, -0.05413055419921875, -0.05148506164550781, -0.048839569091796875, -0.04619407653808594, -0.043548583984375, -0.04090309143066406, -0.038257598876953125, -0.03561210632324219, -0.03296661376953125, -0.030321121215820312, -0.027675628662109375, -0.025030136108398438, -0.0223846435546875, -0.019739151000976562, -0.017093658447265625, -0.014448165893554688, -0.01180267333984375, -0.009157180786132812, -0.006511688232421875, -0.0038661956787109375, -0.001220703125, 0.0014247894287109375, 0.004070281982421875, 0.0067157745361328125, 0.00936126708984375, 0.012006759643554688, 0.014652252197265625, 0.017297744750976562, 0.0199432373046875, 0.022588729858398438, 0.025234222412109375, 0.027879714965820312, 0.03052520751953125, 0.03317070007324219, 0.035816192626953125, 0.03846168518066406, 0.041107177734375, 0.04375267028808594, 0.046398162841796875, 0.04904365539550781, 0.05168914794921875, 0.05433464050292969, 0.056980133056640625, 0.05962562561035156, 0.0622711181640625, 0.06491661071777344, 0.06756210327148438, 0.07020759582519531, 0.07285308837890625, 0.07549858093261719, 0.07814407348632812, 0.08078956604003906, 0.08343505859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 11.0, 11.0, 20.0, 33.0, 41.0, 59.0, 81.0, 154.0, 134.0, 126.0, 93.0, 72.0, 48.0, 31.0, 16.0, 19.0, 13.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001087188720703125, -0.00010549649596214294, -0.00010227411985397339, -9.905174374580383e-05, -9.582936763763428e-05, -9.260699152946472e-05, -8.938461542129517e-05, -8.616223931312561e-05, -8.293986320495605e-05, -7.97174870967865e-05, -7.649511098861694e-05, -7.327273488044739e-05, -7.005035877227783e-05, -6.682798266410828e-05, -6.360560655593872e-05, -6.0383230447769165e-05, -5.716085433959961e-05, -5.3938478231430054e-05, -5.07161021232605e-05, -4.749372601509094e-05, -4.427134990692139e-05, -4.104897379875183e-05, -3.7826597690582275e-05, -3.460422158241272e-05, -3.1381845474243164e-05, -2.815946936607361e-05, -2.4937093257904053e-05, -2.1714717149734497e-05, -1.849234104156494e-05, -1.5269964933395386e-05, -1.204758882522583e-05, -8.825212717056274e-06, -5.602836608886719e-06, -2.380460500717163e-06, 8.419156074523926e-07, 4.064291715621948e-06, 7.286667823791504e-06, 1.050904393196106e-05, 1.3731420040130615e-05, 1.695379614830017e-05, 2.0176172256469727e-05, 2.3398548364639282e-05, 2.6620924472808838e-05, 2.9843300580978394e-05, 3.306567668914795e-05, 3.6288052797317505e-05, 3.951042890548706e-05, 4.2732805013656616e-05, 4.595518112182617e-05, 4.917755722999573e-05, 5.239993333816528e-05, 5.562230944633484e-05, 5.8844685554504395e-05, 6.206706166267395e-05, 6.52894377708435e-05, 6.851181387901306e-05, 7.173418998718262e-05, 7.495656609535217e-05, 7.817894220352173e-05, 8.140131831169128e-05, 8.462369441986084e-05, 8.78460705280304e-05, 9.106844663619995e-05, 9.429082274436951e-05, 9.751319885253906e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 5.0, 7.0, 7.0, 15.0, 10.0, 16.0, 33.0, 32.0, 51.0, 86.0, 155.0, 361.0, 816.0, 2411.0, 7835.0, 35408.0, 291620.0, 615082.0, 75236.0, 13468.0, 3643.0, 1285.0, 447.0, 202.0, 109.0, 52.0, 40.0, 34.0, 23.0, 15.0, 11.0, 6.0, 10.0, 1.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1688232421875, -0.16415977478027344, -0.15949630737304688, -0.1548328399658203, -0.15016937255859375, -0.1455059051513672, -0.14084243774414062, -0.13617897033691406, -0.1315155029296875, -0.12685203552246094, -0.12218856811523438, -0.11752510070800781, -0.11286163330078125, -0.10819816589355469, -0.10353469848632812, -0.09887123107910156, -0.094207763671875, -0.08954429626464844, -0.08488082885742188, -0.08021736145019531, -0.07555389404296875, -0.07089042663574219, -0.06622695922851562, -0.06156349182128906, -0.0569000244140625, -0.05223655700683594, -0.047573089599609375, -0.04290962219238281, -0.03824615478515625, -0.03358268737792969, -0.028919219970703125, -0.024255752563476562, -0.01959228515625, -0.014928817749023438, -0.010265350341796875, -0.0056018829345703125, -0.00093841552734375, 0.0037250518798828125, 0.008388519287109375, 0.013051986694335938, 0.0177154541015625, 0.022378921508789062, 0.027042388916015625, 0.03170585632324219, 0.03636932373046875, 0.04103279113769531, 0.045696258544921875, 0.05035972595214844, 0.055023193359375, 0.05968666076660156, 0.06435012817382812, 0.06901359558105469, 0.07367706298828125, 0.07834053039550781, 0.08300399780273438, 0.08766746520996094, 0.0923309326171875, 0.09699440002441406, 0.10165786743164062, 0.10632133483886719, 0.11098480224609375, 0.11564826965332031, 0.12031173706054688, 0.12497520446777344, 0.129638671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 3.0, 9.0, 10.0, 8.0, 18.0, 9.0, 9.0, 25.0, 27.0, 32.0, 38.0, 57.0, 55.0, 51.0, 82.0, 81.0, 84.0, 67.0, 69.0, 49.0, 47.0, 46.0, 27.0, 26.0, 17.0, 11.0, 1.0, 12.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.030487060546875, -0.029604673385620117, -0.028722286224365234, -0.02783989906311035, -0.02695751190185547, -0.026075124740600586, -0.025192737579345703, -0.02431035041809082, -0.023427963256835938, -0.022545576095581055, -0.021663188934326172, -0.02078080177307129, -0.019898414611816406, -0.019016027450561523, -0.01813364028930664, -0.017251253128051758, -0.016368865966796875, -0.015486478805541992, -0.01460409164428711, -0.013721704483032227, -0.012839317321777344, -0.011956930160522461, -0.011074542999267578, -0.010192155838012695, -0.009309768676757812, -0.00842738151550293, -0.007544994354248047, -0.006662607192993164, -0.005780220031738281, -0.0048978328704833984, -0.004015445709228516, -0.003133058547973633, -0.00225067138671875, -0.0013682842254638672, -0.0004858970642089844, 0.00039649009704589844, 0.0012788772583007812, 0.002161264419555664, 0.003043651580810547, 0.00392603874206543, 0.0048084259033203125, 0.005690813064575195, 0.006573200225830078, 0.007455587387084961, 0.008337974548339844, 0.009220361709594727, 0.01010274887084961, 0.010985136032104492, 0.011867523193359375, 0.012749910354614258, 0.01363229751586914, 0.014514684677124023, 0.015397071838378906, 0.01627945899963379, 0.017161846160888672, 0.018044233322143555, 0.018926620483398438, 0.01980900764465332, 0.020691394805908203, 0.021573781967163086, 0.02245616912841797, 0.02333855628967285, 0.024220943450927734, 0.025103330612182617, 0.0259857177734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 9.0, 45.0, 219.0, 450.0, 238.0, 49.0, 7.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.95737838745117, -35.32083511352539, -34.68429183959961, -34.04774475097656, -33.41120147705078, -32.774658203125, -32.13811492919922, -31.501569747924805, -30.865026473999023, -30.228483200073242, -29.591938018798828, -28.955394744873047, -28.318849563598633, -27.68230628967285, -27.045761108398438, -26.409217834472656, -25.772674560546875, -25.136131286621094, -24.49958610534668, -23.8630428314209, -23.226497650146484, -22.589954376220703, -21.953411102294922, -21.316865921020508, -20.680320739746094, -20.043777465820312, -19.4072322845459, -18.770689010620117, -18.134143829345703, -17.497600555419922, -16.86105728149414, -16.224512100219727, -15.587968826293945, -14.951424598693848, -14.31488037109375, -13.678337097167969, -13.041792869567871, -12.405248641967773, -11.768704414367676, -11.132160186767578, -10.495616912841797, -9.8590726852417, -9.222528457641602, -8.58598518371582, -7.949440956115723, -7.312896728515625, -6.676352500915527, -6.039808750152588, -5.40326452255249, -4.766720294952393, -4.130176544189453, -3.4936323165893555, -2.857088327407837, -2.2205443382263184, -1.5840001106262207, -0.9474563598632812, -0.3109121322631836, 0.32563191652297974, 0.9621759653091431, 1.5987200736999512, 2.2352640628814697, 2.8718080520629883, 3.508352279663086, 4.144896030426025, 4.781440258026123]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 8.0, 7.0, 8.0, 9.0, 21.0, 16.0, 20.0, 25.0, 26.0, 24.0, 24.0, 29.0, 37.0, 38.0, 30.0, 34.0, 41.0, 50.0, 48.0, 60.0, 45.0, 42.0, 49.0, 37.0, 43.0, 31.0, 33.0, 20.0, 28.0, 24.0, 22.0, 16.0, 11.0, 9.0, 9.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.5625016689300537, -2.472991943359375, -2.3834822177886963, -2.2939724922180176, -2.204462766647339, -2.11495304107666, -2.0254435539245605, -1.9359337091445923, -1.8464239835739136, -1.7569142580032349, -1.6674045324325562, -1.577894926071167, -1.4883852005004883, -1.3988754749298096, -1.3093657493591309, -1.2198560237884521, -1.1303462982177734, -1.0408365726470947, -0.951326847076416, -0.8618171811103821, -0.7723074555397034, -0.6827977299690247, -0.5932880640029907, -0.503778338432312, -0.4142686128616333, -0.3247588872909546, -0.23524919152259827, -0.14573949575424194, -0.05622977018356323, 0.03327995538711548, 0.12278962135314941, 0.21229934692382812, 0.30180931091308594, 0.39131903648376465, 0.48082873225212097, 0.5703384280204773, 0.659848153591156, 0.7493578791618347, 0.8388675451278687, 0.9283772706985474, 1.017886996269226, 1.1073967218399048, 1.1969064474105835, 1.2864160537719727, 1.3759257793426514, 1.46543550491333, 1.5549452304840088, 1.6444549560546875, 1.7339646816253662, 1.823474407196045, 1.9129841327667236, 2.0024938583374023, 2.092003583908081, 2.1815133094787598, 2.2710227966308594, 2.360532760620117, 2.450042247772217, 2.5395519733428955, 2.629061698913574, 2.718571424484253, 2.8080811500549316, 2.8975908756256104, 2.987100601196289, 3.0766100883483887, 3.1661200523376465]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 8.0, 9.0, 17.0, 12.0, 14.0, 19.0, 15.0, 25.0, 52.0, 86.0, 124.0, 309.0, 900.0, 3274.0, 17087.0, 104966.0, 432315.0, 387381.0, 84145.0, 13590.0, 2783.0, 761.0, 267.0, 134.0, 82.0, 37.0, 26.0, 23.0, 9.0, 7.0, 13.0, 14.0, 13.0, 7.0, 6.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.08984375, -4.93048095703125, -4.7711181640625, -4.61175537109375, -4.452392578125, -4.29302978515625, -4.1336669921875, -3.97430419921875, -3.81494140625, -3.65557861328125, -3.4962158203125, -3.33685302734375, -3.177490234375, -3.01812744140625, -2.8587646484375, -2.69940185546875, -2.5400390625, -2.38067626953125, -2.2213134765625, -2.06195068359375, -1.902587890625, -1.74322509765625, -1.5838623046875, -1.42449951171875, -1.26513671875, -1.10577392578125, -0.9464111328125, -0.78704833984375, -0.627685546875, -0.46832275390625, -0.3089599609375, -0.14959716796875, 0.009765625, 0.16912841796875, 0.3284912109375, 0.48785400390625, 0.647216796875, 0.80657958984375, 0.9659423828125, 1.12530517578125, 1.28466796875, 1.44403076171875, 1.6033935546875, 1.76275634765625, 1.922119140625, 2.08148193359375, 2.2408447265625, 2.40020751953125, 2.5595703125, 2.71893310546875, 2.8782958984375, 3.03765869140625, 3.197021484375, 3.35638427734375, 3.5157470703125, 3.67510986328125, 3.83447265625, 3.99383544921875, 4.1531982421875, 4.31256103515625, 4.471923828125, 4.63128662109375, 4.7906494140625, 4.95001220703125, 5.109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 4.0, 3.0, 12.0, 6.0, 1.0, 6.0, 15.0, 16.0, 19.0, 20.0, 22.0, 21.0, 22.0, 31.0, 27.0, 29.0, 34.0, 48.0, 42.0, 38.0, 46.0, 55.0, 40.0, 51.0, 47.0, 40.0, 36.0, 30.0, 24.0, 32.0, 33.0, 34.0, 18.0, 22.0, 12.0, 12.0, 12.0, 12.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.265625, -4.116455078125, -3.96728515625, -3.818115234375, -3.6689453125, -3.519775390625, -3.37060546875, -3.221435546875, -3.072265625, -2.923095703125, -2.77392578125, -2.624755859375, -2.4755859375, -2.326416015625, -2.17724609375, -2.028076171875, -1.87890625, -1.729736328125, -1.58056640625, -1.431396484375, -1.2822265625, -1.133056640625, -0.98388671875, -0.834716796875, -0.685546875, -0.536376953125, -0.38720703125, -0.238037109375, -0.0888671875, 0.060302734375, 0.20947265625, 0.358642578125, 0.5078125, 0.656982421875, 0.80615234375, 0.955322265625, 1.1044921875, 1.253662109375, 1.40283203125, 1.552001953125, 1.701171875, 1.850341796875, 1.99951171875, 2.148681640625, 2.2978515625, 2.447021484375, 2.59619140625, 2.745361328125, 2.89453125, 3.043701171875, 3.19287109375, 3.342041015625, 3.4912109375, 3.640380859375, 3.78955078125, 3.938720703125, 4.087890625, 4.237060546875, 4.38623046875, 4.535400390625, 4.6845703125, 4.833740234375, 4.98291015625, 5.132080078125, 5.28125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 7.0, 13.0, 16.0, 12.0, 12.0, 15.0, 17.0, 21.0, 27.0, 38.0, 54.0, 66.0, 86.0, 131.0, 231.0, 307.0, 589.0, 3251.0, 136368.0, 845836.0, 58041.0, 1884.0, 520.0, 271.0, 163.0, 132.0, 119.0, 68.0, 60.0, 33.0, 33.0, 21.0, 16.0, 21.0, 13.0, 7.0, 12.0, 6.0, 4.0, 4.0, 9.0, 3.0, 0.0, 2.0, 5.0, 3.0, 0.0, 1.0], "bins": [-11.1171875, -10.8031005859375, -10.489013671875, -10.1749267578125, -9.86083984375, -9.5467529296875, -9.232666015625, -8.9185791015625, -8.6044921875, -8.2904052734375, -7.976318359375, -7.6622314453125, -7.34814453125, -7.0340576171875, -6.719970703125, -6.4058837890625, -6.091796875, -5.7777099609375, -5.463623046875, -5.1495361328125, -4.83544921875, -4.5213623046875, -4.207275390625, -3.8931884765625, -3.5791015625, -3.2650146484375, -2.950927734375, -2.6368408203125, -2.32275390625, -2.0086669921875, -1.694580078125, -1.3804931640625, -1.06640625, -0.7523193359375, -0.438232421875, -0.1241455078125, 0.18994140625, 0.5040283203125, 0.818115234375, 1.1322021484375, 1.4462890625, 1.7603759765625, 2.074462890625, 2.3885498046875, 2.70263671875, 3.0167236328125, 3.330810546875, 3.6448974609375, 3.958984375, 4.2730712890625, 4.587158203125, 4.9012451171875, 5.21533203125, 5.5294189453125, 5.843505859375, 6.1575927734375, 6.4716796875, 6.7857666015625, 7.099853515625, 7.4139404296875, 7.72802734375, 8.0421142578125, 8.356201171875, 8.6702880859375, 8.984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 11.0, 5.0, 12.0, 4.0, 11.0, 21.0, 23.0, 31.0, 30.0, 27.0, 44.0, 52.0, 41.0, 55.0, 40.0, 50.0, 43.0, 45.0, 39.0, 43.0, 43.0, 43.0, 33.0, 35.0, 24.0, 34.0, 19.0, 13.0, 13.0, 18.0, 14.0, 10.0, 9.0, 6.0, 10.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-5.8828125, -5.71270751953125, -5.5426025390625, -5.37249755859375, -5.202392578125, -5.03228759765625, -4.8621826171875, -4.69207763671875, -4.52197265625, -4.35186767578125, -4.1817626953125, -4.01165771484375, -3.841552734375, -3.67144775390625, -3.5013427734375, -3.33123779296875, -3.1611328125, -2.99102783203125, -2.8209228515625, -2.65081787109375, -2.480712890625, -2.31060791015625, -2.1405029296875, -1.97039794921875, -1.80029296875, -1.63018798828125, -1.4600830078125, -1.28997802734375, -1.119873046875, -0.94976806640625, -0.7796630859375, -0.60955810546875, -0.439453125, -0.26934814453125, -0.0992431640625, 0.07086181640625, 0.240966796875, 0.41107177734375, 0.5811767578125, 0.75128173828125, 0.92138671875, 1.09149169921875, 1.2615966796875, 1.43170166015625, 1.601806640625, 1.77191162109375, 1.9420166015625, 2.11212158203125, 2.2822265625, 2.45233154296875, 2.6224365234375, 2.79254150390625, 2.962646484375, 3.13275146484375, 3.3028564453125, 3.47296142578125, 3.64306640625, 3.81317138671875, 3.9832763671875, 4.15338134765625, 4.323486328125, 4.49359130859375, 4.6636962890625, 4.83380126953125, 5.00390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 4.0, 9.0, 9.0, 9.0, 22.0, 49.0, 101.0, 270.0, 946.0, 7025.0, 631672.0, 401533.0, 5591.0, 860.0, 214.0, 100.0, 48.0, 34.0, 16.0, 10.0, 5.0, 7.0, 2.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.77734375, -6.60333251953125, -6.4293212890625, -6.25531005859375, -6.081298828125, -5.90728759765625, -5.7332763671875, -5.55926513671875, -5.38525390625, -5.21124267578125, -5.0372314453125, -4.86322021484375, -4.689208984375, -4.51519775390625, -4.3411865234375, -4.16717529296875, -3.9931640625, -3.81915283203125, -3.6451416015625, -3.47113037109375, -3.297119140625, -3.12310791015625, -2.9490966796875, -2.77508544921875, -2.60107421875, -2.42706298828125, -2.2530517578125, -2.07904052734375, -1.905029296875, -1.73101806640625, -1.5570068359375, -1.38299560546875, -1.208984375, -1.03497314453125, -0.8609619140625, -0.68695068359375, -0.512939453125, -0.33892822265625, -0.1649169921875, 0.00909423828125, 0.18310546875, 0.35711669921875, 0.5311279296875, 0.70513916015625, 0.879150390625, 1.05316162109375, 1.2271728515625, 1.40118408203125, 1.5751953125, 1.74920654296875, 1.9232177734375, 2.09722900390625, 2.271240234375, 2.44525146484375, 2.6192626953125, 2.79327392578125, 2.96728515625, 3.14129638671875, 3.3153076171875, 3.48931884765625, 3.663330078125, 3.83734130859375, 4.0113525390625, 4.18536376953125, 4.359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 13.0, 15.0, 19.0, 40.0, 53.0, 95.0, 112.0, 133.0, 140.0, 123.0, 85.0, 60.0, 39.0, 23.0, 17.0, 10.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004935264587402344, -0.00047988444566726685, -0.0004662424325942993, -0.0004526004195213318, -0.00043895840644836426, -0.00042531639337539673, -0.0004116743803024292, -0.00039803236722946167, -0.00038439035415649414, -0.0003707483410835266, -0.0003571063280105591, -0.00034346431493759155, -0.000329822301864624, -0.0003161802887916565, -0.00030253827571868896, -0.00028889626264572144, -0.0002752542495727539, -0.0002616122364997864, -0.00024797022342681885, -0.00023432821035385132, -0.0002206861972808838, -0.00020704418420791626, -0.00019340217113494873, -0.0001797601580619812, -0.00016611814498901367, -0.00015247613191604614, -0.0001388341188430786, -0.00012519210577011108, -0.00011155009269714355, -9.790807962417603e-05, -8.42660665512085e-05, -7.062405347824097e-05, -5.698204040527344e-05, -4.334002733230591e-05, -2.969801425933838e-05, -1.605600118637085e-05, -2.4139881134033203e-06, 1.1228024959564209e-05, 2.4870038032531738e-05, 3.851205110549927e-05, 5.21540641784668e-05, 6.579607725143433e-05, 7.943809032440186e-05, 9.308010339736938e-05, 0.00010672211647033691, 0.00012036412954330444, 0.00013400614261627197, 0.0001476481556892395, 0.00016129016876220703, 0.00017493218183517456, 0.0001885741949081421, 0.00020221620798110962, 0.00021585822105407715, 0.00022950023412704468, 0.0002431422472000122, 0.00025678426027297974, 0.00027042627334594727, 0.0002840682864189148, 0.0002977102994918823, 0.00031135231256484985, 0.0003249943256378174, 0.0003386363387107849, 0.00035227835178375244, 0.00036592036485671997, 0.0003795623779296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 10.0, 10.0, 20.0, 24.0, 54.0, 96.0, 174.0, 590.0, 3552.0, 199169.0, 836393.0, 7009.0, 943.0, 273.0, 98.0, 50.0, 27.0, 24.0, 13.0, 7.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.752227783203125, -3.54547119140625, -3.338714599609375, -3.1319580078125, -2.925201416015625, -2.71844482421875, -2.511688232421875, -2.304931640625, -2.098175048828125, -1.89141845703125, -1.684661865234375, -1.4779052734375, -1.271148681640625, -1.06439208984375, -0.857635498046875, -0.65087890625, -0.444122314453125, -0.23736572265625, -0.030609130859375, 0.1761474609375, 0.382904052734375, 0.58966064453125, 0.796417236328125, 1.003173828125, 1.209930419921875, 1.41668701171875, 1.623443603515625, 1.8302001953125, 2.036956787109375, 2.24371337890625, 2.450469970703125, 2.6572265625, 2.863983154296875, 3.07073974609375, 3.277496337890625, 3.4842529296875, 3.691009521484375, 3.89776611328125, 4.104522705078125, 4.311279296875, 4.518035888671875, 4.72479248046875, 4.931549072265625, 5.1383056640625, 5.345062255859375, 5.55181884765625, 5.758575439453125, 5.96533203125, 6.172088623046875, 6.37884521484375, 6.585601806640625, 6.7923583984375, 6.999114990234375, 7.20587158203125, 7.412628173828125, 7.619384765625, 7.826141357421875, 8.03289794921875, 8.239654541015625, 8.4464111328125, 8.653167724609375, 8.85992431640625, 9.066680908203125, 9.2734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 8.0, 14.0, 27.0, 41.0, 60.0, 108.0, 109.0, 158.0, 151.0, 109.0, 73.0, 50.0, 34.0, 15.0, 17.0, 9.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.6135177612304688, -1.5766448974609375, -1.5397720336914062, -1.502899169921875, -1.4660263061523438, -1.4291534423828125, -1.3922805786132812, -1.35540771484375, -1.3185348510742188, -1.2816619873046875, -1.2447891235351562, -1.207916259765625, -1.1710433959960938, -1.1341705322265625, -1.0972976684570312, -1.0604248046875, -1.0235519409179688, -0.9866790771484375, -0.9498062133789062, -0.912933349609375, -0.8760604858398438, -0.8391876220703125, -0.8023147583007812, -0.76544189453125, -0.7285690307617188, -0.6916961669921875, -0.6548233032226562, -0.617950439453125, -0.5810775756835938, -0.5442047119140625, -0.5073318481445312, -0.470458984375, -0.43358612060546875, -0.3967132568359375, -0.35984039306640625, -0.322967529296875, -0.28609466552734375, -0.2492218017578125, -0.21234893798828125, -0.17547607421875, -0.13860321044921875, -0.1017303466796875, -0.06485748291015625, -0.027984619140625, 0.00888824462890625, 0.0457611083984375, 0.08263397216796875, 0.1195068359375, 0.15637969970703125, 0.1932525634765625, 0.23012542724609375, 0.266998291015625, 0.30387115478515625, 0.3407440185546875, 0.37761688232421875, 0.41448974609375, 0.45136260986328125, 0.4882354736328125, 0.5251083374023438, 0.561981201171875, 0.5988540649414062, 0.6357269287109375, 0.6725997924804688, 0.70947265625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 15.0, 22.0, 35.0, 44.0, 73.0, 79.0, 92.0, 110.0, 114.0, 95.0, 104.0, 73.0, 52.0, 33.0, 33.0, 14.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.735433578491211, -10.41178035736084, -10.088127136230469, -9.764473915100098, -9.440820693969727, -9.117166519165039, -8.793513298034668, -8.469860076904297, -8.146206855773926, -7.822553634643555, -7.498900413513184, -7.175246715545654, -6.851593494415283, -6.527940273284912, -6.204286575317383, -5.880633354187012, -5.556980133056641, -5.2333269119262695, -4.909673690795898, -4.586019992828369, -4.262366771697998, -3.938713550567627, -3.6150600910186768, -3.2914066314697266, -2.9677534103393555, -2.6441001892089844, -2.320446729660034, -1.9967933893203735, -1.673140048980713, -1.3494867086410522, -1.0258333683013916, -0.7021799087524414, -0.3785257339477539, -0.05487239360809326, 0.2687809467315674, 0.592434287071228, 0.9160876274108887, 1.2397409677505493, 1.56339430809021, 1.8870477676391602, 2.2107009887695312, 2.5343542098999023, 2.8580076694488525, 3.1816611289978027, 3.505314350128174, 3.828967571258545, 4.152621269226074, 4.476274490356445, 4.799927711486816, 5.1235809326171875, 5.447234153747559, 5.770887851715088, 6.094541072845459, 6.41819429397583, 6.741847991943359, 7.0655012130737305, 7.389154434204102, 7.712807655334473, 8.036460876464844, 8.360114097595215, 8.683767318725586, 9.007421493530273, 9.331074714660645, 9.654727935791016, 9.978381156921387]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 6.0, 7.0, 8.0, 19.0, 19.0, 19.0, 24.0, 26.0, 23.0, 30.0, 39.0, 29.0, 36.0, 41.0, 53.0, 39.0, 39.0, 40.0, 46.0, 52.0, 41.0, 41.0, 43.0, 28.0, 42.0, 31.0, 37.0, 20.0, 19.0, 19.0, 11.0, 13.0, 12.0, 11.0, 14.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.183972358703613, -8.88526725769043, -8.586563110351562, -8.287858009338379, -7.989152908325195, -7.69044828414917, -7.3917436599731445, -7.093038558959961, -6.7943339347839355, -6.49562931060791, -6.196924209594727, -5.898219585418701, -5.599514961242676, -5.300809860229492, -5.002105236053467, -4.703400611877441, -4.404695510864258, -4.105990886688232, -3.807285785675049, -3.5085811614990234, -3.209876298904419, -2.9111714363098145, -2.612466812133789, -2.3137619495391846, -2.01505708694458, -1.7163522243499756, -1.4176474809646606, -1.1189427375793457, -0.8202378749847412, -0.5215330123901367, -0.22282826900482178, 0.07587647438049316, 0.37458133697509766, 0.6732861399650574, 0.9719909429550171, 1.270695686340332, 1.5694005489349365, 1.868105411529541, 2.1668100357055664, 2.465514898300171, 2.7642197608947754, 3.06292462348938, 3.3616294860839844, 3.6603341102600098, 3.9590389728546143, 4.257743835449219, 4.556448459625244, 4.8551530838012695, 5.153858184814453, 5.4525628089904785, 5.751267910003662, 6.0499725341796875, 6.348677635192871, 6.6473822593688965, 6.946086883544922, 7.2447919845581055, 7.543496608734131, 7.842201232910156, 8.14090633392334, 8.439611434936523, 8.73831558227539, 9.037020683288574, 9.335725784301758, 9.634429931640625, 9.933135032653809]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 9.0, 5.0, 11.0, 21.0, 16.0, 29.0, 33.0, 38.0, 91.0, 107.0, 170.0, 266.0, 498.0, 1570.0, 12236.0, 248084.0, 2983694.0, 907572.0, 35005.0, 3103.0, 725.0, 342.0, 213.0, 138.0, 92.0, 43.0, 44.0, 38.0, 20.0, 12.0, 11.0, 10.0, 6.0, 4.0, 11.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9453125, -8.6539306640625, -8.362548828125, -8.0711669921875, -7.77978515625, -7.4884033203125, -7.197021484375, -6.9056396484375, -6.6142578125, -6.3228759765625, -6.031494140625, -5.7401123046875, -5.44873046875, -5.1573486328125, -4.865966796875, -4.5745849609375, -4.283203125, -3.9918212890625, -3.700439453125, -3.4090576171875, -3.11767578125, -2.8262939453125, -2.534912109375, -2.2435302734375, -1.9521484375, -1.6607666015625, -1.369384765625, -1.0780029296875, -0.78662109375, -0.4952392578125, -0.203857421875, 0.0875244140625, 0.37890625, 0.6702880859375, 0.961669921875, 1.2530517578125, 1.54443359375, 1.8358154296875, 2.127197265625, 2.4185791015625, 2.7099609375, 3.0013427734375, 3.292724609375, 3.5841064453125, 3.87548828125, 4.1668701171875, 4.458251953125, 4.7496337890625, 5.041015625, 5.3323974609375, 5.623779296875, 5.9151611328125, 6.20654296875, 6.4979248046875, 6.789306640625, 7.0806884765625, 7.3720703125, 7.6634521484375, 7.954833984375, 8.2462158203125, 8.53759765625, 8.8289794921875, 9.120361328125, 9.4117431640625, 9.703125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 10.0, 11.0, 7.0, 13.0, 13.0, 21.0, 21.0, 22.0, 22.0, 35.0, 25.0, 34.0, 50.0, 37.0, 42.0, 43.0, 41.0, 47.0, 41.0, 45.0, 42.0, 49.0, 39.0, 34.0, 34.0, 41.0, 18.0, 27.0, 26.0, 18.0, 16.0, 17.0, 11.0, 7.0, 3.0, 7.0, 9.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.083984375, -2.972320556640625, -2.86065673828125, -2.748992919921875, -2.6373291015625, -2.525665283203125, -2.41400146484375, -2.302337646484375, -2.190673828125, -2.079010009765625, -1.96734619140625, -1.855682373046875, -1.7440185546875, -1.632354736328125, -1.52069091796875, -1.409027099609375, -1.29736328125, -1.185699462890625, -1.07403564453125, -0.962371826171875, -0.8507080078125, -0.739044189453125, -0.62738037109375, -0.515716552734375, -0.404052734375, -0.292388916015625, -0.18072509765625, -0.069061279296875, 0.0426025390625, 0.154266357421875, 0.26593017578125, 0.377593994140625, 0.4892578125, 0.600921630859375, 0.71258544921875, 0.824249267578125, 0.9359130859375, 1.047576904296875, 1.15924072265625, 1.270904541015625, 1.382568359375, 1.494232177734375, 1.60589599609375, 1.717559814453125, 1.8292236328125, 1.940887451171875, 2.05255126953125, 2.164215087890625, 2.27587890625, 2.387542724609375, 2.49920654296875, 2.610870361328125, 2.7225341796875, 2.834197998046875, 2.94586181640625, 3.057525634765625, 3.169189453125, 3.280853271484375, 3.39251708984375, 3.504180908203125, 3.6158447265625, 3.727508544921875, 3.83917236328125, 3.950836181640625, 4.0625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 21.0, 14.0, 21.0, 26.0, 61.0, 84.0, 113.0, 186.0, 268.0, 424.0, 805.0, 1611.0, 4853.0, 34645.0, 888766.0, 3108825.0, 137163.0, 11226.0, 2553.0, 1059.0, 543.0, 339.0, 207.0, 111.0, 82.0, 80.0, 42.0, 43.0, 27.0, 16.0, 11.0, 11.0, 5.0, 5.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.7734375, -6.5335693359375, -6.293701171875, -6.0538330078125, -5.81396484375, -5.5740966796875, -5.334228515625, -5.0943603515625, -4.8544921875, -4.6146240234375, -4.374755859375, -4.1348876953125, -3.89501953125, -3.6551513671875, -3.415283203125, -3.1754150390625, -2.935546875, -2.6956787109375, -2.455810546875, -2.2159423828125, -1.97607421875, -1.7362060546875, -1.496337890625, -1.2564697265625, -1.0166015625, -0.7767333984375, -0.536865234375, -0.2969970703125, -0.05712890625, 0.1827392578125, 0.422607421875, 0.6624755859375, 0.90234375, 1.1422119140625, 1.382080078125, 1.6219482421875, 1.86181640625, 2.1016845703125, 2.341552734375, 2.5814208984375, 2.8212890625, 3.0611572265625, 3.301025390625, 3.5408935546875, 3.78076171875, 4.0206298828125, 4.260498046875, 4.5003662109375, 4.740234375, 4.9801025390625, 5.219970703125, 5.4598388671875, 5.69970703125, 5.9395751953125, 6.179443359375, 6.4193115234375, 6.6591796875, 6.8990478515625, 7.138916015625, 7.3787841796875, 7.61865234375, 7.8585205078125, 8.098388671875, 8.3382568359375, 8.578125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 12.0, 14.0, 13.0, 22.0, 24.0, 21.0, 36.0, 66.0, 79.0, 123.0, 154.0, 226.0, 275.0, 379.0, 444.0, 440.0, 417.0, 306.0, 275.0, 200.0, 147.0, 103.0, 85.0, 49.0, 45.0, 25.0, 27.0, 19.0, 14.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.822265625, -1.7746124267578125, -1.726959228515625, -1.6793060302734375, -1.63165283203125, -1.5839996337890625, -1.536346435546875, -1.4886932373046875, -1.4410400390625, -1.3933868408203125, -1.345733642578125, -1.2980804443359375, -1.25042724609375, -1.2027740478515625, -1.155120849609375, -1.1074676513671875, -1.059814453125, -1.0121612548828125, -0.964508056640625, -0.9168548583984375, -0.86920166015625, -0.8215484619140625, -0.773895263671875, -0.7262420654296875, -0.6785888671875, -0.6309356689453125, -0.583282470703125, -0.5356292724609375, -0.48797607421875, -0.4403228759765625, -0.392669677734375, -0.3450164794921875, -0.29736328125, -0.2497100830078125, -0.202056884765625, -0.1544036865234375, -0.10675048828125, -0.0590972900390625, -0.011444091796875, 0.0362091064453125, 0.0838623046875, 0.1315155029296875, 0.179168701171875, 0.2268218994140625, 0.27447509765625, 0.3221282958984375, 0.369781494140625, 0.4174346923828125, 0.465087890625, 0.5127410888671875, 0.560394287109375, 0.6080474853515625, 0.65570068359375, 0.7033538818359375, 0.751007080078125, 0.7986602783203125, 0.8463134765625, 0.8939666748046875, 0.941619873046875, 0.9892730712890625, 1.03692626953125, 1.0845794677734375, 1.132232666015625, 1.1798858642578125, 1.2275390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 13.0, 29.0, 52.0, 75.0, 101.0, 139.0, 142.0, 118.0, 122.0, 87.0, 56.0, 30.0, 19.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.18076229095459, -14.85482406616211, -14.528885841369629, -14.202947616577148, -13.877009391784668, -13.551071166992188, -13.225132942199707, -12.899194717407227, -12.573257446289062, -12.247319221496582, -11.921380996704102, -11.595442771911621, -11.26950454711914, -10.94356632232666, -10.61762809753418, -10.291690826416016, -9.965751647949219, -9.639813423156738, -9.313875198364258, -8.987936973571777, -8.661998748779297, -8.336060523986816, -8.010122299194336, -7.684184551239014, -7.358246326446533, -7.032308101654053, -6.706369876861572, -6.380431652069092, -6.0544939041137695, -5.728555679321289, -5.402617454528809, -5.076679229736328, -4.7507405281066895, -4.424802303314209, -4.0988640785217285, -3.772926092147827, -3.4469878673553467, -3.121049642562866, -2.795111656188965, -2.4691734313964844, -2.143235206604004, -1.8172969818115234, -1.4913588762283325, -1.1654207706451416, -0.8394825458526611, -0.5135443210601807, -0.18760621547698975, 0.13833189010620117, 0.46427011489868164, 0.7902082800865173, 1.116146445274353, 1.442084550857544, 1.7680227756500244, 2.093961000442505, 2.4198989868164062, 2.7458372116088867, 3.071775436401367, 3.3977136611938477, 3.723651885986328, 4.049590110778809, 4.375528335571289, 4.7014665603637695, 5.027404308319092, 5.353342533111572, 5.679280757904053]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 14.0, 10.0, 15.0, 15.0, 20.0, 26.0, 18.0, 28.0, 32.0, 39.0, 37.0, 25.0, 35.0, 47.0, 42.0, 37.0, 42.0, 47.0, 43.0, 40.0, 36.0, 39.0, 36.0, 38.0, 30.0, 29.0, 29.0, 30.0, 15.0, 14.0, 18.0, 14.0, 12.0, 11.0, 6.0, 3.0, 6.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.415496587753296, -3.293851613998413, -3.1722066402435303, -3.0505619049072266, -2.9289169311523438, -2.807271957397461, -2.685626983642578, -2.5639820098876953, -2.4423370361328125, -2.3206920623779297, -2.199047088623047, -2.077402114868164, -1.9557573795318604, -1.8341124057769775, -1.7124674320220947, -1.590822458267212, -1.4691777229309082, -1.3475327491760254, -1.2258878946304321, -1.1042429208755493, -0.9825980067253113, -0.8609530925750732, -0.7393081188201904, -0.6176632046699524, -0.49601829051971436, -0.3743733763694763, -0.2527284324169159, -0.13108348846435547, -0.009438574314117432, 0.1122063398361206, 0.23385131359100342, 0.35549622774124146, 0.4771413803100586, 0.5987862944602966, 0.7204312086105347, 0.8420761823654175, 0.9637210965156555, 1.0853660106658936, 1.2070109844207764, 1.3286559581756592, 1.4503008127212524, 1.5719457864761353, 1.6935906410217285, 1.8152356147766113, 1.9368805885314941, 2.058525562286377, 2.1801705360412598, 2.3018152713775635, 2.4234602451324463, 2.545105218887329, 2.666750192642212, 2.7883949279785156, 2.9100399017333984, 3.0316848754882812, 3.153329849243164, 3.274974822998047, 3.3966197967529297, 3.5182647705078125, 3.6399097442626953, 3.761554718017578, 3.883199453353882, 4.004844665527344, 4.126489639282227, 4.248134136199951, 4.369779109954834]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 12.0, 16.0, 22.0, 36.0, 47.0, 100.0, 146.0, 255.0, 477.0, 994.0, 2314.0, 6057.0, 17894.0, 57628.0, 174003.0, 348675.0, 278862.0, 108480.0, 34658.0, 11013.0, 3775.0, 1489.0, 665.0, 355.0, 210.0, 111.0, 88.0, 48.0, 38.0, 15.0, 18.0, 12.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.558868408203125, -0.54010009765625, -0.521331787109375, -0.5025634765625, -0.483795166015625, -0.46502685546875, -0.446258544921875, -0.427490234375, -0.408721923828125, -0.38995361328125, -0.371185302734375, -0.3524169921875, -0.333648681640625, -0.31488037109375, -0.296112060546875, -0.27734375, -0.258575439453125, -0.23980712890625, -0.221038818359375, -0.2022705078125, -0.183502197265625, -0.16473388671875, -0.145965576171875, -0.127197265625, -0.108428955078125, -0.08966064453125, -0.070892333984375, -0.0521240234375, -0.033355712890625, -0.01458740234375, 0.004180908203125, 0.02294921875, 0.041717529296875, 0.06048583984375, 0.079254150390625, 0.0980224609375, 0.116790771484375, 0.13555908203125, 0.154327392578125, 0.173095703125, 0.191864013671875, 0.21063232421875, 0.229400634765625, 0.2481689453125, 0.266937255859375, 0.28570556640625, 0.304473876953125, 0.3232421875, 0.342010498046875, 0.36077880859375, 0.379547119140625, 0.3983154296875, 0.417083740234375, 0.43585205078125, 0.454620361328125, 0.473388671875, 0.492156982421875, 0.51092529296875, 0.529693603515625, 0.5484619140625, 0.567230224609375, 0.58599853515625, 0.604766845703125, 0.62353515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 9.0, 12.0, 16.0, 18.0, 36.0, 38.0, 26.0, 47.0, 60.0, 53.0, 46.0, 51.0, 55.0, 60.0, 57.0, 61.0, 55.0, 58.0, 43.0, 48.0, 31.0, 34.0, 17.0, 17.0, 13.0, 17.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.6470947265625, -2.528564453125, -2.4100341796875, -2.29150390625, -2.1729736328125, -2.054443359375, -1.9359130859375, -1.8173828125, -1.6988525390625, -1.580322265625, -1.4617919921875, -1.34326171875, -1.2247314453125, -1.106201171875, -0.9876708984375, -0.869140625, -0.7506103515625, -0.632080078125, -0.5135498046875, -0.39501953125, -0.2764892578125, -0.157958984375, -0.0394287109375, 0.0791015625, 0.1976318359375, 0.316162109375, 0.4346923828125, 0.55322265625, 0.6717529296875, 0.790283203125, 0.9088134765625, 1.02734375, 1.1458740234375, 1.264404296875, 1.3829345703125, 1.50146484375, 1.6199951171875, 1.738525390625, 1.8570556640625, 1.9755859375, 2.0941162109375, 2.212646484375, 2.3311767578125, 2.44970703125, 2.5682373046875, 2.686767578125, 2.8052978515625, 2.923828125, 3.0423583984375, 3.160888671875, 3.2794189453125, 3.39794921875, 3.5164794921875, 3.635009765625, 3.7535400390625, 3.8720703125, 3.9906005859375, 4.109130859375, 4.2276611328125, 4.34619140625, 4.4647216796875, 4.583251953125, 4.7017822265625, 4.8203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 22.0, 35.0, 60.0, 136.0, 221.0, 529.0, 1121.0, 2805.0, 6754.0, 16337.0, 39558.0, 93155.0, 196871.0, 287455.0, 217219.0, 107800.0, 46204.0, 18931.0, 7681.0, 3194.0, 1293.0, 583.0, 300.0, 145.0, 71.0, 22.0, 15.0, 10.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.457763671875, -0.44525146484375, -0.4327392578125, -0.42022705078125, -0.40771484375, -0.39520263671875, -0.3826904296875, -0.37017822265625, -0.357666015625, -0.34515380859375, -0.3326416015625, -0.32012939453125, -0.3076171875, -0.29510498046875, -0.2825927734375, -0.27008056640625, -0.257568359375, -0.24505615234375, -0.2325439453125, -0.22003173828125, -0.20751953125, -0.19500732421875, -0.1824951171875, -0.16998291015625, -0.157470703125, -0.14495849609375, -0.1324462890625, -0.11993408203125, -0.107421875, -0.09490966796875, -0.0823974609375, -0.06988525390625, -0.057373046875, -0.04486083984375, -0.0323486328125, -0.01983642578125, -0.00732421875, 0.00518798828125, 0.0177001953125, 0.03021240234375, 0.042724609375, 0.05523681640625, 0.0677490234375, 0.08026123046875, 0.0927734375, 0.10528564453125, 0.1177978515625, 0.13031005859375, 0.142822265625, 0.15533447265625, 0.1678466796875, 0.18035888671875, 0.19287109375, 0.20538330078125, 0.2178955078125, 0.23040771484375, 0.242919921875, 0.25543212890625, 0.2679443359375, 0.28045654296875, 0.29296875, 0.30548095703125, 0.3179931640625, 0.33050537109375, 0.343017578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 5.0, 3.0, 8.0, 12.0, 14.0, 16.0, 17.0, 18.0, 24.0, 24.0, 26.0, 33.0, 37.0, 46.0, 41.0, 60.0, 59.0, 60.0, 54.0, 56.0, 46.0, 48.0, 52.0, 35.0, 41.0, 24.0, 25.0, 24.0, 17.0, 10.0, 6.0, 18.0, 7.0, 7.0, 8.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-7.3203125, -7.121826171875, -6.92333984375, -6.724853515625, -6.5263671875, -6.327880859375, -6.12939453125, -5.930908203125, -5.732421875, -5.533935546875, -5.33544921875, -5.136962890625, -4.9384765625, -4.739990234375, -4.54150390625, -4.343017578125, -4.14453125, -3.946044921875, -3.74755859375, -3.549072265625, -3.3505859375, -3.152099609375, -2.95361328125, -2.755126953125, -2.556640625, -2.358154296875, -2.15966796875, -1.961181640625, -1.7626953125, -1.564208984375, -1.36572265625, -1.167236328125, -0.96875, -0.770263671875, -0.57177734375, -0.373291015625, -0.1748046875, 0.023681640625, 0.22216796875, 0.420654296875, 0.619140625, 0.817626953125, 1.01611328125, 1.214599609375, 1.4130859375, 1.611572265625, 1.81005859375, 2.008544921875, 2.20703125, 2.405517578125, 2.60400390625, 2.802490234375, 3.0009765625, 3.199462890625, 3.39794921875, 3.596435546875, 3.794921875, 3.993408203125, 4.19189453125, 4.390380859375, 4.5888671875, 4.787353515625, 4.98583984375, 5.184326171875, 5.3828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 11.0, 8.0, 14.0, 26.0, 45.0, 64.0, 92.0, 137.0, 211.0, 388.0, 723.0, 1496.0, 3764.0, 11310.0, 48583.0, 305514.0, 548075.0, 98573.0, 19480.0, 5823.0, 2095.0, 917.0, 473.0, 277.0, 165.0, 99.0, 60.0, 46.0, 28.0, 22.0, 9.0, 4.0, 8.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.10186767578125, -0.09888935089111328, -0.09591102600097656, -0.09293270111083984, -0.08995437622070312, -0.0869760513305664, -0.08399772644042969, -0.08101940155029297, -0.07804107666015625, -0.07506275177001953, -0.07208442687988281, -0.0691061019897461, -0.06612777709960938, -0.06314945220947266, -0.06017112731933594, -0.05719280242919922, -0.0542144775390625, -0.05123615264892578, -0.04825782775878906, -0.045279502868652344, -0.042301177978515625, -0.039322853088378906, -0.03634452819824219, -0.03336620330810547, -0.03038787841796875, -0.02740955352783203, -0.024431228637695312, -0.021452903747558594, -0.018474578857421875, -0.015496253967285156, -0.012517929077148438, -0.009539604187011719, -0.006561279296875, -0.0035829544067382812, -0.0006046295166015625, 0.0023736953735351562, 0.005352020263671875, 0.008330345153808594, 0.011308670043945312, 0.014286994934082031, 0.01726531982421875, 0.02024364471435547, 0.023221969604492188, 0.026200294494628906, 0.029178619384765625, 0.032156944274902344, 0.03513526916503906, 0.03811359405517578, 0.0410919189453125, 0.04407024383544922, 0.04704856872558594, 0.050026893615722656, 0.053005218505859375, 0.055983543395996094, 0.05896186828613281, 0.06194019317626953, 0.06491851806640625, 0.06789684295654297, 0.07087516784667969, 0.0738534927368164, 0.07683181762695312, 0.07981014251708984, 0.08278846740722656, 0.08576679229736328, 0.0887451171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 5.0, 17.0, 18.0, 30.0, 40.0, 46.0, 77.0, 112.0, 116.0, 138.0, 110.0, 91.0, 62.0, 39.0, 34.0, 20.0, 10.0, 14.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.432699203491211e-05, -7.178634405136108e-05, -6.924569606781006e-05, -6.670504808425903e-05, -6.416440010070801e-05, -6.162375211715698e-05, -5.908310413360596e-05, -5.654245615005493e-05, -5.4001808166503906e-05, -5.146116018295288e-05, -4.8920512199401855e-05, -4.637986421585083e-05, -4.3839216232299805e-05, -4.129856824874878e-05, -3.8757920265197754e-05, -3.621727228164673e-05, -3.36766242980957e-05, -3.113597631454468e-05, -2.8595328330993652e-05, -2.6054680347442627e-05, -2.35140323638916e-05, -2.0973384380340576e-05, -1.843273639678955e-05, -1.5892088413238525e-05, -1.33514404296875e-05, -1.0810792446136475e-05, -8.27014446258545e-06, -5.729496479034424e-06, -3.1888484954833984e-06, -6.48200511932373e-07, 1.8924474716186523e-06, 4.433095455169678e-06, 6.973743438720703e-06, 9.514391422271729e-06, 1.2055039405822754e-05, 1.459568738937378e-05, 1.7136335372924805e-05, 1.967698335647583e-05, 2.2217631340026855e-05, 2.475827932357788e-05, 2.7298927307128906e-05, 2.983957529067993e-05, 3.238022327423096e-05, 3.492087125778198e-05, 3.746151924133301e-05, 4.000216722488403e-05, 4.254281520843506e-05, 4.5083463191986084e-05, 4.762411117553711e-05, 5.0164759159088135e-05, 5.270540714263916e-05, 5.5246055126190186e-05, 5.778670310974121e-05, 6.0327351093292236e-05, 6.286799907684326e-05, 6.540864706039429e-05, 6.794929504394531e-05, 7.048994302749634e-05, 7.303059101104736e-05, 7.557123899459839e-05, 7.811188697814941e-05, 8.065253496170044e-05, 8.319318294525146e-05, 8.573383092880249e-05, 8.827447891235352e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 4.0, 2.0, 8.0, 7.0, 3.0, 14.0, 7.0, 14.0, 25.0, 24.0, 58.0, 124.0, 218.0, 415.0, 1105.0, 3000.0, 11061.0, 65413.0, 623256.0, 302879.0, 30645.0, 6711.0, 1970.0, 788.0, 338.0, 187.0, 87.0, 51.0, 27.0, 21.0, 10.0, 13.0, 7.0, 4.0, 7.0, 7.0, 3.0, 5.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.11977005004882812, -0.11588287353515625, -0.11199569702148438, -0.1081085205078125, -0.10422134399414062, -0.10033416748046875, -0.09644699096679688, -0.092559814453125, -0.08867263793945312, -0.08478546142578125, -0.08089828491210938, -0.0770111083984375, -0.07312393188476562, -0.06923675537109375, -0.06534957885742188, -0.06146240234375, -0.057575225830078125, -0.05368804931640625, -0.049800872802734375, -0.0459136962890625, -0.042026519775390625, -0.03813934326171875, -0.034252166748046875, -0.030364990234375, -0.026477813720703125, -0.02259063720703125, -0.018703460693359375, -0.0148162841796875, -0.010929107666015625, -0.00704193115234375, -0.003154754638671875, 0.000732421875, 0.004619598388671875, 0.00850677490234375, 0.012393951416015625, 0.0162811279296875, 0.020168304443359375, 0.02405548095703125, 0.027942657470703125, 0.031829833984375, 0.035717010498046875, 0.03960418701171875, 0.043491363525390625, 0.0473785400390625, 0.051265716552734375, 0.05515289306640625, 0.059040069580078125, 0.06292724609375, 0.06681442260742188, 0.07070159912109375, 0.07458877563476562, 0.0784759521484375, 0.08236312866210938, 0.08625030517578125, 0.09013748168945312, 0.094024658203125, 0.09791183471679688, 0.10179901123046875, 0.10568618774414062, 0.1095733642578125, 0.11346054077148438, 0.11734771728515625, 0.12123489379882812, 0.1251220703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 14.0, 16.0, 11.0, 25.0, 38.0, 46.0, 59.0, 80.0, 103.0, 100.0, 111.0, 87.0, 77.0, 44.0, 43.0, 43.0, 27.0, 14.0, 11.0, 11.0, 4.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0254974365234375, -0.02469491958618164, -0.02389240264892578, -0.023089885711669922, -0.022287368774414062, -0.021484851837158203, -0.020682334899902344, -0.019879817962646484, -0.019077301025390625, -0.018274784088134766, -0.017472267150878906, -0.016669750213623047, -0.015867233276367188, -0.015064716339111328, -0.014262199401855469, -0.01345968246459961, -0.01265716552734375, -0.01185464859008789, -0.011052131652832031, -0.010249614715576172, -0.009447097778320312, -0.008644580841064453, -0.007842063903808594, -0.007039546966552734, -0.006237030029296875, -0.005434513092041016, -0.004631996154785156, -0.003829479217529297, -0.0030269622802734375, -0.002224445343017578, -0.0014219284057617188, -0.0006194114685058594, 0.00018310546875, 0.0009856224060058594, 0.0017881393432617188, 0.002590656280517578, 0.0033931732177734375, 0.004195690155029297, 0.004998207092285156, 0.005800724029541016, 0.006603240966796875, 0.007405757904052734, 0.008208274841308594, 0.009010791778564453, 0.009813308715820312, 0.010615825653076172, 0.011418342590332031, 0.01222085952758789, 0.01302337646484375, 0.01382589340209961, 0.014628410339355469, 0.015430927276611328, 0.016233444213867188, 0.017035961151123047, 0.017838478088378906, 0.018640995025634766, 0.019443511962890625, 0.020246028900146484, 0.021048545837402344, 0.021851062774658203, 0.022653579711914062, 0.023456096649169922, 0.02425861358642578, 0.02506113052368164, 0.0258636474609375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 15.0, 91.0, 304.0, 380.0, 181.0, 31.0, 7.0, 5.0, 0.0, 3.0], "bins": [-31.23577880859375, -30.69000816345215, -30.144237518310547, -29.598466873168945, -29.052696228027344, -28.506925582885742, -27.96115493774414, -27.415386199951172, -26.869613647460938, -26.323843002319336, -25.778072357177734, -25.232301712036133, -24.68653106689453, -24.14076042175293, -23.594989776611328, -23.04922103881836, -22.503450393676758, -21.957679748535156, -21.411909103393555, -20.866138458251953, -20.32036781311035, -19.77459716796875, -19.22882652282715, -18.683055877685547, -18.137287139892578, -17.591516494750977, -17.045745849609375, -16.499975204467773, -15.954204559326172, -15.40843391418457, -14.862664222717285, -14.316893577575684, -13.77112102508545, -13.225350379943848, -12.679579734802246, -12.133809089660645, -11.58803939819336, -11.042268753051758, -10.496498107910156, -9.950727462768555, -9.404956817626953, -8.859186172485352, -8.31341552734375, -7.767645359039307, -7.221874713897705, -6.6761040687561035, -6.13033390045166, -5.584563255310059, -5.038792610168457, -4.4930219650268555, -3.947251558303833, -3.4014811515808105, -2.855710506439209, -2.3099398612976074, -1.764169454574585, -1.2183990478515625, -0.6726281642913818, -0.12685763835906982, 0.4189128875732422, 0.9646834135055542, 1.5104539394378662, 2.0562245845794678, 2.6019949913024902, 3.1477653980255127, 3.6935360431671143]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 12.0, 14.0, 15.0, 17.0, 23.0, 22.0, 30.0, 31.0, 43.0, 41.0, 42.0, 27.0, 49.0, 54.0, 41.0, 48.0, 52.0, 46.0, 36.0, 49.0, 33.0, 47.0, 30.0, 29.0, 31.0, 26.0, 20.0, 15.0, 10.0, 14.0, 12.0, 11.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4967775344848633, -2.408999443054199, -2.321221113204956, -2.233443021774292, -2.145664930343628, -2.0578866004943848, -1.9701085090637207, -1.8823304176330566, -1.794552206993103, -1.7067739963531494, -1.6189959049224854, -1.5312176942825317, -1.4434394836425781, -1.355661392211914, -1.2678831815719604, -1.1801049709320068, -1.0923268795013428, -1.0045486688613892, -0.9167705774307251, -0.8289923667907715, -0.7412142157554626, -0.6534360647201538, -0.5656578540802002, -0.47787970304489136, -0.3901015520095825, -0.3023234009742737, -0.21454522013664246, -0.12676703929901123, -0.03898888826370239, 0.048789262771606445, 0.13656747341156006, 0.2243456244468689, 0.31212353706359863, 0.39990168809890747, 0.4876798689365387, 0.5754580497741699, 0.6632362008094788, 0.7510143518447876, 0.8387925624847412, 0.92657071352005, 1.0143488645553589, 1.1021270751953125, 1.1899051666259766, 1.2776833772659302, 1.3654615879058838, 1.4532396793365479, 1.5410178899765015, 1.628796100616455, 1.7165741920471191, 1.8043524026870728, 1.8921304941177368, 1.9799087047576904, 2.0676867961883545, 2.1554651260375977, 2.2432432174682617, 2.331021308898926, 2.41879940032959, 2.506577491760254, 2.594355821609497, 2.682133913040161, 2.769912004470825, 2.8576903343200684, 2.9454684257507324, 3.0332465171813965, 3.1210248470306396]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 11.0, 16.0, 15.0, 30.0, 79.0, 178.0, 349.0, 933.0, 3179.0, 11469.0, 47552.0, 197092.0, 489506.0, 224982.0, 54401.0, 13276.0, 3624.0, 1047.0, 426.0, 177.0, 85.0, 39.0, 23.0, 22.0, 9.0, 4.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94140625, -3.8203125, -3.69921875, -3.578125, -3.45703125, -3.3359375, -3.21484375, -3.09375, -2.97265625, -2.8515625, -2.73046875, -2.609375, -2.48828125, -2.3671875, -2.24609375, -2.125, -2.00390625, -1.8828125, -1.76171875, -1.640625, -1.51953125, -1.3984375, -1.27734375, -1.15625, -1.03515625, -0.9140625, -0.79296875, -0.671875, -0.55078125, -0.4296875, -0.30859375, -0.1875, -0.06640625, 0.0546875, 0.17578125, 0.296875, 0.41796875, 0.5390625, 0.66015625, 0.78125, 0.90234375, 1.0234375, 1.14453125, 1.265625, 1.38671875, 1.5078125, 1.62890625, 1.75, 1.87109375, 1.9921875, 2.11328125, 2.234375, 2.35546875, 2.4765625, 2.59765625, 2.71875, 2.83984375, 2.9609375, 3.08203125, 3.203125, 3.32421875, 3.4453125, 3.56640625, 3.6875, 3.80859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 11.0, 10.0, 12.0, 23.0, 22.0, 24.0, 24.0, 25.0, 36.0, 42.0, 40.0, 39.0, 50.0, 43.0, 44.0, 44.0, 52.0, 47.0, 47.0, 41.0, 45.0, 39.0, 40.0, 34.0, 21.0, 23.0, 27.0, 14.0, 14.0, 13.0, 11.0, 12.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.17578125, -5.01300048828125, -4.8502197265625, -4.68743896484375, -4.524658203125, -4.36187744140625, -4.1990966796875, -4.03631591796875, -3.87353515625, -3.71075439453125, -3.5479736328125, -3.38519287109375, -3.222412109375, -3.05963134765625, -2.8968505859375, -2.73406982421875, -2.5712890625, -2.40850830078125, -2.2457275390625, -2.08294677734375, -1.920166015625, -1.75738525390625, -1.5946044921875, -1.43182373046875, -1.26904296875, -1.10626220703125, -0.9434814453125, -0.78070068359375, -0.617919921875, -0.45513916015625, -0.2923583984375, -0.12957763671875, 0.033203125, 0.19598388671875, 0.3587646484375, 0.52154541015625, 0.684326171875, 0.84710693359375, 1.0098876953125, 1.17266845703125, 1.33544921875, 1.49822998046875, 1.6610107421875, 1.82379150390625, 1.986572265625, 2.14935302734375, 2.3121337890625, 2.47491455078125, 2.6376953125, 2.80047607421875, 2.9632568359375, 3.12603759765625, 3.288818359375, 3.45159912109375, 3.6143798828125, 3.77716064453125, 3.93994140625, 4.10272216796875, 4.2655029296875, 4.42828369140625, 4.591064453125, 4.75384521484375, 4.9166259765625, 5.07940673828125, 5.2421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 10.0, 15.0, 6.0, 27.0, 15.0, 20.0, 24.0, 34.0, 36.0, 61.0, 100.0, 153.0, 250.0, 481.0, 2124.0, 122692.0, 901574.0, 18994.0, 979.0, 375.0, 186.0, 110.0, 73.0, 45.0, 28.0, 36.0, 18.0, 14.0, 13.0, 7.0, 11.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.625, -11.253662109375, -10.88232421875, -10.510986328125, -10.1396484375, -9.768310546875, -9.39697265625, -9.025634765625, -8.654296875, -8.282958984375, -7.91162109375, -7.540283203125, -7.1689453125, -6.797607421875, -6.42626953125, -6.054931640625, -5.68359375, -5.312255859375, -4.94091796875, -4.569580078125, -4.1982421875, -3.826904296875, -3.45556640625, -3.084228515625, -2.712890625, -2.341552734375, -1.97021484375, -1.598876953125, -1.2275390625, -0.856201171875, -0.48486328125, -0.113525390625, 0.2578125, 0.629150390625, 1.00048828125, 1.371826171875, 1.7431640625, 2.114501953125, 2.48583984375, 2.857177734375, 3.228515625, 3.599853515625, 3.97119140625, 4.342529296875, 4.7138671875, 5.085205078125, 5.45654296875, 5.827880859375, 6.19921875, 6.570556640625, 6.94189453125, 7.313232421875, 7.6845703125, 8.055908203125, 8.42724609375, 8.798583984375, 9.169921875, 9.541259765625, 9.91259765625, 10.283935546875, 10.6552734375, 11.026611328125, 11.39794921875, 11.769287109375, 12.140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 9.0, 16.0, 14.0, 16.0, 11.0, 22.0, 20.0, 21.0, 27.0, 42.0, 33.0, 33.0, 46.0, 34.0, 41.0, 48.0, 49.0, 43.0, 37.0, 36.0, 45.0, 37.0, 42.0, 35.0, 23.0, 34.0, 25.0, 28.0, 32.0, 8.0, 9.0, 13.0, 12.0, 5.0, 9.0, 12.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-6.34765625, -6.1689453125, -5.990234375, -5.8115234375, -5.6328125, -5.4541015625, -5.275390625, -5.0966796875, -4.91796875, -4.7392578125, -4.560546875, -4.3818359375, -4.203125, -4.0244140625, -3.845703125, -3.6669921875, -3.48828125, -3.3095703125, -3.130859375, -2.9521484375, -2.7734375, -2.5947265625, -2.416015625, -2.2373046875, -2.05859375, -1.8798828125, -1.701171875, -1.5224609375, -1.34375, -1.1650390625, -0.986328125, -0.8076171875, -0.62890625, -0.4501953125, -0.271484375, -0.0927734375, 0.0859375, 0.2646484375, 0.443359375, 0.6220703125, 0.80078125, 0.9794921875, 1.158203125, 1.3369140625, 1.515625, 1.6943359375, 1.873046875, 2.0517578125, 2.23046875, 2.4091796875, 2.587890625, 2.7666015625, 2.9453125, 3.1240234375, 3.302734375, 3.4814453125, 3.66015625, 3.8388671875, 4.017578125, 4.1962890625, 4.375, 4.5537109375, 4.732421875, 4.9111328125, 5.08984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 9.0, 15.0, 37.0, 117.0, 603.0, 25177.0, 1019129.0, 3102.0, 244.0, 52.0, 27.0, 20.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.3626708984375, -9.053466796875, -8.7442626953125, -8.43505859375, -8.1258544921875, -7.816650390625, -7.5074462890625, -7.1982421875, -6.8890380859375, -6.579833984375, -6.2706298828125, -5.96142578125, -5.6522216796875, -5.343017578125, -5.0338134765625, -4.724609375, -4.4154052734375, -4.106201171875, -3.7969970703125, -3.48779296875, -3.1785888671875, -2.869384765625, -2.5601806640625, -2.2509765625, -1.9417724609375, -1.632568359375, -1.3233642578125, -1.01416015625, -0.7049560546875, -0.395751953125, -0.0865478515625, 0.22265625, 0.5318603515625, 0.841064453125, 1.1502685546875, 1.45947265625, 1.7686767578125, 2.077880859375, 2.3870849609375, 2.6962890625, 3.0054931640625, 3.314697265625, 3.6239013671875, 3.93310546875, 4.2423095703125, 4.551513671875, 4.8607177734375, 5.169921875, 5.4791259765625, 5.788330078125, 6.0975341796875, 6.40673828125, 6.7159423828125, 7.025146484375, 7.3343505859375, 7.6435546875, 7.9527587890625, 8.261962890625, 8.5711669921875, 8.88037109375, 9.1895751953125, 9.498779296875, 9.8079833984375, 10.1171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 14.0, 30.0, 35.0, 49.0, 72.0, 89.0, 115.0, 97.0, 114.0, 92.0, 69.0, 60.0, 49.0, 29.0, 23.0, 11.0, 12.0, 3.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002415180206298828, -0.0002328045666217804, -0.00022409111261367798, -0.00021537765860557556, -0.00020666420459747314, -0.00019795075058937073, -0.0001892372965812683, -0.0001805238425731659, -0.00017181038856506348, -0.00016309693455696106, -0.00015438348054885864, -0.00014567002654075623, -0.0001369565725326538, -0.0001282431185245514, -0.00011952966451644897, -0.00011081621050834656, -0.00010210275650024414, -9.338930249214172e-05, -8.46758484840393e-05, -7.596239447593689e-05, -6.724894046783447e-05, -5.8535486459732056e-05, -4.982203245162964e-05, -4.110857844352722e-05, -3.2395124435424805e-05, -2.3681670427322388e-05, -1.496821641921997e-05, -6.254762411117554e-06, 2.4586915969848633e-06, 1.117214560508728e-05, 1.9885599613189697e-05, 2.8599053621292114e-05, 3.731250762939453e-05, 4.602596163749695e-05, 5.4739415645599365e-05, 6.345286965370178e-05, 7.21663236618042e-05, 8.087977766990662e-05, 8.959323167800903e-05, 9.830668568611145e-05, 0.00010702013969421387, 0.00011573359370231628, 0.0001244470477104187, 0.00013316050171852112, 0.00014187395572662354, 0.00015058740973472595, 0.00015930086374282837, 0.00016801431775093079, 0.0001767277717590332, 0.00018544122576713562, 0.00019415467977523804, 0.00020286813378334045, 0.00021158158779144287, 0.0002202950417995453, 0.0002290084958076477, 0.00023772194981575012, 0.00024643540382385254, 0.00025514885783195496, 0.0002638623118400574, 0.0002725757658481598, 0.0002812892198562622, 0.0002900026738643646, 0.00029871612787246704, 0.00030742958188056946, 0.0003161430358886719]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 15.0, 31.0, 101.0, 376.0, 4297.0, 1034390.0, 8596.0, 574.0, 113.0, 32.0, 10.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.90625, -17.52191162109375, -17.1375732421875, -16.75323486328125, -16.368896484375, -15.98455810546875, -15.6002197265625, -15.21588134765625, -14.83154296875, -14.44720458984375, -14.0628662109375, -13.67852783203125, -13.294189453125, -12.90985107421875, -12.5255126953125, -12.14117431640625, -11.7568359375, -11.37249755859375, -10.9881591796875, -10.60382080078125, -10.219482421875, -9.83514404296875, -9.4508056640625, -9.06646728515625, -8.68212890625, -8.29779052734375, -7.9134521484375, -7.52911376953125, -7.144775390625, -6.76043701171875, -6.3760986328125, -5.99176025390625, -5.607421875, -5.22308349609375, -4.8387451171875, -4.45440673828125, -4.070068359375, -3.68572998046875, -3.3013916015625, -2.91705322265625, -2.53271484375, -2.14837646484375, -1.7640380859375, -1.37969970703125, -0.995361328125, -0.61102294921875, -0.2266845703125, 0.15765380859375, 0.5419921875, 0.92633056640625, 1.3106689453125, 1.69500732421875, 2.079345703125, 2.46368408203125, 2.8480224609375, 3.23236083984375, 3.61669921875, 4.00103759765625, 4.3853759765625, 4.76971435546875, 5.154052734375, 5.53839111328125, 5.9227294921875, 6.30706787109375, 6.69140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 12.0, 28.0, 87.0, 151.0, 275.0, 224.0, 131.0, 56.0, 23.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.111328125, -1.045257568359375, -0.97918701171875, -0.913116455078125, -0.8470458984375, -0.780975341796875, -0.71490478515625, -0.648834228515625, -0.582763671875, -0.516693115234375, -0.45062255859375, -0.384552001953125, -0.3184814453125, -0.252410888671875, -0.18634033203125, -0.120269775390625, -0.05419921875, 0.011871337890625, 0.07794189453125, 0.144012451171875, 0.2100830078125, 0.276153564453125, 0.34222412109375, 0.408294677734375, 0.474365234375, 0.540435791015625, 0.60650634765625, 0.672576904296875, 0.7386474609375, 0.804718017578125, 0.87078857421875, 0.936859130859375, 1.0029296875, 1.069000244140625, 1.13507080078125, 1.201141357421875, 1.2672119140625, 1.333282470703125, 1.39935302734375, 1.465423583984375, 1.531494140625, 1.597564697265625, 1.66363525390625, 1.729705810546875, 1.7957763671875, 1.861846923828125, 1.92791748046875, 1.993988037109375, 2.06005859375, 2.126129150390625, 2.19219970703125, 2.258270263671875, 2.3243408203125, 2.390411376953125, 2.45648193359375, 2.522552490234375, 2.588623046875, 2.654693603515625, 2.72076416015625, 2.786834716796875, 2.8529052734375, 2.918975830078125, 2.98504638671875, 3.051116943359375, 3.1171875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 13.0, 19.0, 44.0, 74.0, 88.0, 107.0, 104.0, 142.0, 112.0, 82.0, 82.0, 56.0, 26.0, 18.0, 13.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.801612377166748, -5.464967250823975, -5.128322124481201, -4.791677474975586, -4.4550323486328125, -4.118387222290039, -3.7817420959472656, -3.445096969604492, -3.1084518432617188, -2.7718067169189453, -2.435161590576172, -2.0985167026519775, -1.761871576309204, -1.4252264499664307, -1.0885815620422363, -0.7519364356994629, -0.41529130935668945, -0.07864624261856079, 0.25799882411956787, 0.5946438312530518, 0.9312889575958252, 1.2679340839385986, 1.604578971862793, 1.9412240982055664, 2.27786922454834, 2.6145143508911133, 2.9511594772338867, 3.287804365158081, 3.6244494915008545, 3.961094617843628, 4.297739505767822, 4.634384632110596, 4.971029281616211, 5.307674407958984, 5.644319534301758, 5.980964660644531, 6.317609786987305, 6.654254913330078, 6.990899562835693, 7.327544689178467, 7.66418981552124, 8.000834465026855, 8.337479591369629, 8.674124717712402, 9.010769844055176, 9.34741497039795, 9.684060096740723, 10.020705223083496, 10.35735034942627, 10.693995475769043, 11.030640602111816, 11.36728572845459, 11.703930854797363, 12.040575981140137, 12.377220153808594, 12.713865280151367, 13.05051040649414, 13.387155532836914, 13.723800659179688, 14.060445785522461, 14.397090911865234, 14.733736038208008, 15.070381164550781, 15.407026290893555, 15.743671417236328]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 5.0, 4.0, 18.0, 12.0, 16.0, 19.0, 18.0, 20.0, 36.0, 23.0, 38.0, 38.0, 33.0, 36.0, 23.0, 35.0, 38.0, 45.0, 42.0, 41.0, 32.0, 60.0, 31.0, 31.0, 30.0, 31.0, 30.0, 27.0, 24.0, 26.0, 19.0, 20.0, 14.0, 12.0, 8.0, 12.0, 10.0, 11.0, 3.0, 4.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.518416404724121, -7.246252059936523, -6.974087715148926, -6.701923370361328, -6.429759502410889, -6.157595157623291, -5.885430812835693, -5.613266468048096, -5.341102600097656, -5.068938255310059, -4.796773910522461, -4.524609565734863, -4.252445697784424, -3.980281352996826, -3.7081170082092285, -3.435952663421631, -3.163788318634033, -2.8916239738464355, -2.619459867477417, -2.3472955226898193, -2.075131416320801, -1.8029670715332031, -1.5308027267456055, -1.2586385011672974, -0.9864742755889893, -0.7143100500106812, -0.44214576482772827, -0.1699814796447754, 0.10218274593353271, 0.3743469715118408, 0.6465113162994385, 0.9186755418777466, 1.1908397674560547, 1.4630039930343628, 1.735168218612671, 2.0073325634002686, 2.279496669769287, 2.5516610145568848, 2.8238253593444824, 3.09598970413208, 3.3681538105010986, 3.6403181552886963, 3.912482261657715, 4.1846466064453125, 4.45681095123291, 4.728975296020508, 5.0011396408081055, 5.273303508758545, 5.545467853546143, 5.81763219833374, 6.089796543121338, 6.361960411071777, 6.634124755859375, 6.906289100646973, 7.17845344543457, 7.450617790222168, 7.722782135009766, 7.994946479797363, 8.267110824584961, 8.539275169372559, 8.811439514160156, 9.083602905273438, 9.355768203735352, 9.627931594848633, 9.90009593963623]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 5.0, 9.0, 12.0, 13.0, 21.0, 21.0, 24.0, 36.0, 54.0, 63.0, 99.0, 129.0, 278.0, 472.0, 1168.0, 5634.0, 46226.0, 652203.0, 2822598.0, 615032.0, 42513.0, 5167.0, 1194.0, 490.0, 255.0, 167.0, 113.0, 81.0, 51.0, 32.0, 37.0, 19.0, 17.0, 13.0, 8.0, 6.0, 8.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.8079833984375, -6.584716796875, -6.3614501953125, -6.13818359375, -5.9149169921875, -5.691650390625, -5.4683837890625, -5.2451171875, -5.0218505859375, -4.798583984375, -4.5753173828125, -4.35205078125, -4.1287841796875, -3.905517578125, -3.6822509765625, -3.458984375, -3.2357177734375, -3.012451171875, -2.7891845703125, -2.56591796875, -2.3426513671875, -2.119384765625, -1.8961181640625, -1.6728515625, -1.4495849609375, -1.226318359375, -1.0030517578125, -0.77978515625, -0.5565185546875, -0.333251953125, -0.1099853515625, 0.11328125, 0.3365478515625, 0.559814453125, 0.7830810546875, 1.00634765625, 1.2296142578125, 1.452880859375, 1.6761474609375, 1.8994140625, 2.1226806640625, 2.345947265625, 2.5692138671875, 2.79248046875, 3.0157470703125, 3.239013671875, 3.4622802734375, 3.685546875, 3.9088134765625, 4.132080078125, 4.3553466796875, 4.57861328125, 4.8018798828125, 5.025146484375, 5.2484130859375, 5.4716796875, 5.6949462890625, 5.918212890625, 6.1414794921875, 6.36474609375, 6.5880126953125, 6.811279296875, 7.0345458984375, 7.2578125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 10.0, 14.0, 16.0, 17.0, 23.0, 23.0, 30.0, 38.0, 43.0, 38.0, 37.0, 38.0, 35.0, 45.0, 63.0, 41.0, 43.0, 48.0, 42.0, 41.0, 38.0, 41.0, 37.0, 30.0, 29.0, 20.0, 19.0, 27.0, 13.0, 7.0, 11.0, 3.0, 6.0, 9.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.647308349609375, -2.53875732421875, -2.430206298828125, -2.3216552734375, -2.213104248046875, -2.10455322265625, -1.996002197265625, -1.887451171875, -1.778900146484375, -1.67034912109375, -1.561798095703125, -1.4532470703125, -1.344696044921875, -1.23614501953125, -1.127593994140625, -1.01904296875, -0.910491943359375, -0.80194091796875, -0.693389892578125, -0.5848388671875, -0.476287841796875, -0.36773681640625, -0.259185791015625, -0.150634765625, -0.042083740234375, 0.06646728515625, 0.175018310546875, 0.2835693359375, 0.392120361328125, 0.50067138671875, 0.609222412109375, 0.7177734375, 0.826324462890625, 0.93487548828125, 1.043426513671875, 1.1519775390625, 1.260528564453125, 1.36907958984375, 1.477630615234375, 1.586181640625, 1.694732666015625, 1.80328369140625, 1.911834716796875, 2.0203857421875, 2.128936767578125, 2.23748779296875, 2.346038818359375, 2.45458984375, 2.563140869140625, 2.67169189453125, 2.780242919921875, 2.8887939453125, 2.997344970703125, 3.10589599609375, 3.214447021484375, 3.322998046875, 3.431549072265625, 3.54010009765625, 3.648651123046875, 3.7572021484375, 3.865753173828125, 3.97430419921875, 4.082855224609375, 4.19140625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 7.0, 9.0, 14.0, 19.0, 28.0, 62.0, 120.0, 265.0, 582.0, 1476.0, 7744.0, 403594.0, 3730275.0, 44919.0, 3418.0, 951.0, 371.0, 173.0, 92.0, 64.0, 37.0, 20.0, 16.0, 3.0, 7.0, 2.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7265625, -9.341796875, -8.95703125, -8.572265625, -8.1875, -7.802734375, -7.41796875, -7.033203125, -6.6484375, -6.263671875, -5.87890625, -5.494140625, -5.109375, -4.724609375, -4.33984375, -3.955078125, -3.5703125, -3.185546875, -2.80078125, -2.416015625, -2.03125, -1.646484375, -1.26171875, -0.876953125, -0.4921875, -0.107421875, 0.27734375, 0.662109375, 1.046875, 1.431640625, 1.81640625, 2.201171875, 2.5859375, 2.970703125, 3.35546875, 3.740234375, 4.125, 4.509765625, 4.89453125, 5.279296875, 5.6640625, 6.048828125, 6.43359375, 6.818359375, 7.203125, 7.587890625, 7.97265625, 8.357421875, 8.7421875, 9.126953125, 9.51171875, 9.896484375, 10.28125, 10.666015625, 11.05078125, 11.435546875, 11.8203125, 12.205078125, 12.58984375, 12.974609375, 13.359375, 13.744140625, 14.12890625, 14.513671875, 14.8984375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 18.0, 22.0, 37.0, 62.0, 88.0, 166.0, 282.0, 482.0, 610.0, 663.0, 594.0, 414.0, 249.0, 160.0, 75.0, 64.0, 33.0, 18.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.033203125, -2.9599151611328125, -2.886627197265625, -2.8133392333984375, -2.74005126953125, -2.6667633056640625, -2.593475341796875, -2.5201873779296875, -2.4468994140625, -2.3736114501953125, -2.300323486328125, -2.2270355224609375, -2.15374755859375, -2.0804595947265625, -2.007171630859375, -1.9338836669921875, -1.860595703125, -1.7873077392578125, -1.714019775390625, -1.6407318115234375, -1.56744384765625, -1.4941558837890625, -1.420867919921875, -1.3475799560546875, -1.2742919921875, -1.2010040283203125, -1.127716064453125, -1.0544281005859375, -0.98114013671875, -0.9078521728515625, -0.834564208984375, -0.7612762451171875, -0.68798828125, -0.6147003173828125, -0.541412353515625, -0.4681243896484375, -0.39483642578125, -0.3215484619140625, -0.248260498046875, -0.1749725341796875, -0.1016845703125, -0.0283966064453125, 0.044891357421875, 0.1181793212890625, 0.19146728515625, 0.2647552490234375, 0.338043212890625, 0.4113311767578125, 0.484619140625, 0.5579071044921875, 0.631195068359375, 0.7044830322265625, 0.77777099609375, 0.8510589599609375, 0.924346923828125, 0.9976348876953125, 1.0709228515625, 1.1442108154296875, 1.217498779296875, 1.2907867431640625, 1.36407470703125, 1.4373626708984375, 1.510650634765625, 1.5839385986328125, 1.6572265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 13.0, 20.0, 32.0, 56.0, 64.0, 95.0, 88.0, 111.0, 108.0, 98.0, 97.0, 67.0, 52.0, 44.0, 17.0, 12.0, 7.0, 6.0, 4.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.965921878814697, -6.728592395782471, -6.491262912750244, -6.253932952880859, -6.016603469848633, -5.779273986816406, -5.54194450378418, -5.304615020751953, -5.067285537719727, -4.8299560546875, -4.592626571655273, -4.355297088623047, -4.117967128753662, -3.8806376457214355, -3.643308162689209, -3.4059786796569824, -3.1686487197875977, -2.931319236755371, -2.6939895153045654, -2.456660032272339, -2.219330310821533, -1.9820008277893066, -1.74467134475708, -1.507341742515564, -1.2700121402740479, -1.0326825380325317, -0.7953529953956604, -0.5580234527587891, -0.32069385051727295, -0.08336424827575684, 0.15396523475646973, 0.39129483699798584, 0.6286249160766602, 0.8659545183181763, 1.1032841205596924, 1.340613603591919, 1.577943205833435, 1.8152728080749512, 2.0526022911071777, 2.2899317741394043, 2.52726149559021, 2.7645909786224365, 3.001920700073242, 3.2392501831054688, 3.4765796661376953, 3.713909387588501, 3.9512388706207275, 4.188568592071533, 4.42589807510376, 4.663227558135986, 4.900557041168213, 5.137887001037598, 5.375216484069824, 5.612545967102051, 5.849875450134277, 6.087204933166504, 6.3245344161987305, 6.561863899230957, 6.799193382263184, 7.03652286529541, 7.273852825164795, 7.5111823081970215, 7.748511791229248, 7.985841274261475, 8.22317123413086]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 6.0, 4.0, 6.0, 10.0, 14.0, 12.0, 22.0, 21.0, 30.0, 43.0, 28.0, 36.0, 29.0, 40.0, 37.0, 33.0, 41.0, 48.0, 51.0, 57.0, 38.0, 44.0, 38.0, 35.0, 24.0, 33.0, 42.0, 32.0, 20.0, 27.0, 22.0, 16.0, 8.0, 12.0, 12.0, 12.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2223548889160156, -3.102600336074829, -2.9828457832336426, -2.863091230392456, -2.7433366775512695, -2.623582124710083, -2.5038275718688965, -2.38407301902771, -2.2643184661865234, -2.144563913345337, -2.0248093605041504, -1.9050548076629639, -1.7853002548217773, -1.6655457019805908, -1.5457911491394043, -1.4260365962982178, -1.3062820434570312, -1.1865274906158447, -1.0667729377746582, -0.9470183849334717, -0.8272638320922852, -0.7075092792510986, -0.5877547264099121, -0.4680001735687256, -0.34824562072753906, -0.22849106788635254, -0.10873651504516602, 0.011018037796020508, 0.13077259063720703, 0.25052714347839355, 0.3702816963195801, 0.4900362491607666, 0.6097908020019531, 0.7295453548431396, 0.8492999076843262, 0.9690544605255127, 1.0888090133666992, 1.2085635662078857, 1.3283181190490723, 1.4480726718902588, 1.5678272247314453, 1.6875817775726318, 1.8073363304138184, 1.9270908832550049, 2.0468454360961914, 2.166599988937378, 2.2863545417785645, 2.406109094619751, 2.5258636474609375, 2.645618200302124, 2.7653727531433105, 2.885127305984497, 3.0048818588256836, 3.12463641166687, 3.2443909645080566, 3.364145517349243, 3.4839000701904297, 3.603654623031616, 3.7234091758728027, 3.8431637287139893, 3.962918281555176, 4.082673072814941, 4.202427387237549, 4.322181701660156, 4.441936492919922]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 12.0, 8.0, 18.0, 27.0, 35.0, 66.0, 85.0, 120.0, 195.0, 298.0, 604.0, 1482.0, 5029.0, 21605.0, 102386.0, 364286.0, 396420.0, 120688.0, 26024.0, 5888.0, 1723.0, 671.0, 310.0, 198.0, 118.0, 88.0, 62.0, 37.0, 18.0, 23.0, 15.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7470703125, -0.7213592529296875, -0.695648193359375, -0.6699371337890625, -0.64422607421875, -0.6185150146484375, -0.592803955078125, -0.5670928955078125, -0.5413818359375, -0.5156707763671875, -0.489959716796875, -0.4642486572265625, -0.43853759765625, -0.4128265380859375, -0.387115478515625, -0.3614044189453125, -0.335693359375, -0.3099822998046875, -0.284271240234375, -0.2585601806640625, -0.23284912109375, -0.2071380615234375, -0.181427001953125, -0.1557159423828125, -0.1300048828125, -0.1042938232421875, -0.078582763671875, -0.0528717041015625, -0.02716064453125, -0.0014495849609375, 0.024261474609375, 0.0499725341796875, 0.07568359375, 0.1013946533203125, 0.127105712890625, 0.1528167724609375, 0.17852783203125, 0.2042388916015625, 0.229949951171875, 0.2556610107421875, 0.2813720703125, 0.3070831298828125, 0.332794189453125, 0.3585052490234375, 0.38421630859375, 0.4099273681640625, 0.435638427734375, 0.4613494873046875, 0.487060546875, 0.5127716064453125, 0.538482666015625, 0.5641937255859375, 0.58990478515625, 0.6156158447265625, 0.641326904296875, 0.6670379638671875, 0.6927490234375, 0.7184600830078125, 0.744171142578125, 0.7698822021484375, 0.79559326171875, 0.8213043212890625, 0.847015380859375, 0.8727264404296875, 0.8984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 14.0, 22.0, 21.0, 24.0, 31.0, 29.0, 31.0, 49.0, 45.0, 47.0, 51.0, 50.0, 56.0, 43.0, 51.0, 42.0, 55.0, 39.0, 40.0, 33.0, 41.0, 26.0, 24.0, 19.0, 25.0, 27.0, 11.0, 11.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.413360595703125, -2.31500244140625, -2.216644287109375, -2.1182861328125, -2.019927978515625, -1.92156982421875, -1.823211669921875, -1.724853515625, -1.626495361328125, -1.52813720703125, -1.429779052734375, -1.3314208984375, -1.233062744140625, -1.13470458984375, -1.036346435546875, -0.93798828125, -0.839630126953125, -0.74127197265625, -0.642913818359375, -0.5445556640625, -0.446197509765625, -0.34783935546875, -0.249481201171875, -0.151123046875, -0.052764892578125, 0.04559326171875, 0.143951416015625, 0.2423095703125, 0.340667724609375, 0.43902587890625, 0.537384033203125, 0.6357421875, 0.734100341796875, 0.83245849609375, 0.930816650390625, 1.0291748046875, 1.127532958984375, 1.22589111328125, 1.324249267578125, 1.422607421875, 1.520965576171875, 1.61932373046875, 1.717681884765625, 1.8160400390625, 1.914398193359375, 2.01275634765625, 2.111114501953125, 2.20947265625, 2.307830810546875, 2.40618896484375, 2.504547119140625, 2.6029052734375, 2.701263427734375, 2.79962158203125, 2.897979736328125, 2.996337890625, 3.094696044921875, 3.19305419921875, 3.291412353515625, 3.3897705078125, 3.488128662109375, 3.58648681640625, 3.684844970703125, 3.783203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 3.0, 2.0, 3.0, 7.0, 9.0, 8.0, 13.0, 17.0, 33.0, 49.0, 75.0, 118.0, 202.0, 381.0, 679.0, 1243.0, 2234.0, 4116.0, 7302.0, 13050.0, 23364.0, 41017.0, 67781.0, 105310.0, 145979.0, 170716.0, 156315.0, 118778.0, 78559.0, 47858.0, 27999.0, 15777.0, 8755.0, 4797.0, 2572.0, 1518.0, 818.0, 454.0, 255.0, 137.0, 102.0, 34.0, 47.0, 21.0, 13.0, 11.0, 6.0, 4.0, 4.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.255126953125, -0.247314453125, -0.239501953125, -0.231689453125, -0.223876953125, -0.216064453125, -0.208251953125, -0.200439453125, -0.192626953125, -0.184814453125, -0.177001953125, -0.169189453125, -0.161376953125, -0.153564453125, -0.145751953125, -0.137939453125, -0.130126953125, -0.122314453125, -0.114501953125, -0.106689453125, -0.098876953125, -0.091064453125, -0.083251953125, -0.075439453125, -0.067626953125, -0.059814453125, -0.052001953125, -0.044189453125, -0.036376953125, -0.028564453125, -0.020751953125, -0.012939453125, -0.005126953125, 0.002685546875, 0.010498046875, 0.018310546875, 0.026123046875, 0.033935546875, 0.041748046875, 0.049560546875, 0.057373046875, 0.065185546875, 0.072998046875, 0.080810546875, 0.088623046875, 0.096435546875, 0.104248046875, 0.112060546875, 0.119873046875, 0.127685546875, 0.135498046875, 0.143310546875, 0.151123046875, 0.158935546875, 0.166748046875, 0.174560546875, 0.182373046875, 0.190185546875, 0.197998046875, 0.205810546875, 0.213623046875, 0.221435546875, 0.229248046875, 0.237060546875, 0.244873046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 10.0, 4.0, 4.0, 6.0, 4.0, 13.0, 14.0, 18.0, 6.0, 15.0, 13.0, 18.0, 23.0, 26.0, 20.0, 45.0, 27.0, 36.0, 35.0, 22.0, 54.0, 33.0, 42.0, 38.0, 37.0, 36.0, 41.0, 41.0, 29.0, 29.0, 35.0, 34.0, 33.0, 24.0, 18.0, 24.0, 9.0, 13.0, 16.0, 10.0, 9.0, 7.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.94921875, -4.7945556640625, -4.639892578125, -4.4852294921875, -4.33056640625, -4.1759033203125, -4.021240234375, -3.8665771484375, -3.7119140625, -3.5572509765625, -3.402587890625, -3.2479248046875, -3.09326171875, -2.9385986328125, -2.783935546875, -2.6292724609375, -2.474609375, -2.3199462890625, -2.165283203125, -2.0106201171875, -1.85595703125, -1.7012939453125, -1.546630859375, -1.3919677734375, -1.2373046875, -1.0826416015625, -0.927978515625, -0.7733154296875, -0.61865234375, -0.4639892578125, -0.309326171875, -0.1546630859375, 0.0, 0.1546630859375, 0.309326171875, 0.4639892578125, 0.61865234375, 0.7733154296875, 0.927978515625, 1.0826416015625, 1.2373046875, 1.3919677734375, 1.546630859375, 1.7012939453125, 1.85595703125, 2.0106201171875, 2.165283203125, 2.3199462890625, 2.474609375, 2.6292724609375, 2.783935546875, 2.9385986328125, 3.09326171875, 3.2479248046875, 3.402587890625, 3.5572509765625, 3.7119140625, 3.8665771484375, 4.021240234375, 4.1759033203125, 4.33056640625, 4.4852294921875, 4.639892578125, 4.7945556640625, 4.94921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 8.0, 9.0, 20.0, 35.0, 44.0, 54.0, 107.0, 180.0, 265.0, 474.0, 760.0, 1307.0, 2504.0, 5203.0, 12575.0, 36906.0, 122801.0, 362076.0, 337527.0, 110207.0, 33415.0, 11618.0, 4875.0, 2352.0, 1286.0, 738.0, 435.0, 271.0, 154.0, 118.0, 68.0, 54.0, 27.0, 24.0, 9.0, 9.0, 9.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0765380859375, -0.07434844970703125, -0.0721588134765625, -0.06996917724609375, -0.067779541015625, -0.06558990478515625, -0.0634002685546875, -0.06121063232421875, -0.05902099609375, -0.05683135986328125, -0.0546417236328125, -0.05245208740234375, -0.050262451171875, -0.04807281494140625, -0.0458831787109375, -0.04369354248046875, -0.04150390625, -0.03931427001953125, -0.0371246337890625, -0.03493499755859375, -0.032745361328125, -0.03055572509765625, -0.0283660888671875, -0.02617645263671875, -0.02398681640625, -0.02179718017578125, -0.0196075439453125, -0.01741790771484375, -0.015228271484375, -0.01303863525390625, -0.0108489990234375, -0.00865936279296875, -0.0064697265625, -0.00428009033203125, -0.0020904541015625, 9.918212890625e-05, 0.002288818359375, 0.00447845458984375, 0.0066680908203125, 0.00885772705078125, 0.01104736328125, 0.01323699951171875, 0.0154266357421875, 0.01761627197265625, 0.019805908203125, 0.02199554443359375, 0.0241851806640625, 0.02637481689453125, 0.028564453125, 0.03075408935546875, 0.0329437255859375, 0.03513336181640625, 0.037322998046875, 0.03951263427734375, 0.0417022705078125, 0.04389190673828125, 0.04608154296875, 0.04827117919921875, 0.0504608154296875, 0.05265045166015625, 0.054840087890625, 0.05702972412109375, 0.0592193603515625, 0.06140899658203125, 0.0635986328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 5.0, 2.0, 6.0, 7.0, 13.0, 16.0, 20.0, 36.0, 46.0, 59.0, 61.0, 84.0, 100.0, 84.0, 81.0, 118.0, 69.0, 55.0, 42.0, 35.0, 21.0, 10.0, 13.0, 8.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.644559860229492e-05, -5.42299821972847e-05, -5.2014365792274475e-05, -4.979874938726425e-05, -4.758313298225403e-05, -4.5367516577243805e-05, -4.315190017223358e-05, -4.093628376722336e-05, -3.8720667362213135e-05, -3.650505095720291e-05, -3.428943455219269e-05, -3.2073818147182465e-05, -2.985820174217224e-05, -2.7642585337162018e-05, -2.5426968932151794e-05, -2.321135252714157e-05, -2.0995736122131348e-05, -1.8780119717121124e-05, -1.65645033121109e-05, -1.4348886907100677e-05, -1.2133270502090454e-05, -9.91765409708023e-06, -7.702037692070007e-06, -5.486421287059784e-06, -3.2708048820495605e-06, -1.0551884770393372e-06, 1.1604279279708862e-06, 3.3760443329811096e-06, 5.591660737991333e-06, 7.807277143001556e-06, 1.002289354801178e-05, 1.2238509953022003e-05, 1.4454126358032227e-05, 1.666974276304245e-05, 1.8885359168052673e-05, 2.1100975573062897e-05, 2.331659197807312e-05, 2.5532208383083344e-05, 2.7747824788093567e-05, 2.996344119310379e-05, 3.2179057598114014e-05, 3.439467400312424e-05, 3.661029040813446e-05, 3.8825906813144684e-05, 4.104152321815491e-05, 4.325713962316513e-05, 4.5472756028175354e-05, 4.768837243318558e-05, 4.99039888381958e-05, 5.2119605243206024e-05, 5.433522164821625e-05, 5.655083805322647e-05, 5.8766454458236694e-05, 6.098207086324692e-05, 6.319768726825714e-05, 6.541330367326736e-05, 6.762892007827759e-05, 6.984453648328781e-05, 7.206015288829803e-05, 7.427576929330826e-05, 7.649138569831848e-05, 7.87070021033287e-05, 8.092261850833893e-05, 8.313823491334915e-05, 8.535385131835938e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 7.0, 13.0, 9.0, 13.0, 20.0, 21.0, 20.0, 41.0, 61.0, 92.0, 155.0, 222.0, 435.0, 965.0, 1961.0, 4932.0, 14452.0, 56143.0, 297355.0, 514291.0, 117463.0, 26172.0, 7925.0, 2966.0, 1303.0, 596.0, 331.0, 207.0, 105.0, 85.0, 58.0, 40.0, 22.0, 13.0, 15.0, 7.0, 10.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.09033203125, -0.08743953704833984, -0.08454704284667969, -0.08165454864501953, -0.07876205444335938, -0.07586956024169922, -0.07297706604003906, -0.0700845718383789, -0.06719207763671875, -0.0642995834350586, -0.06140708923339844, -0.05851459503173828, -0.055622100830078125, -0.05272960662841797, -0.04983711242675781, -0.046944618225097656, -0.0440521240234375, -0.041159629821777344, -0.03826713562011719, -0.03537464141845703, -0.032482147216796875, -0.02958965301513672, -0.026697158813476562, -0.023804664611816406, -0.02091217041015625, -0.018019676208496094, -0.015127182006835938, -0.012234687805175781, -0.009342193603515625, -0.006449699401855469, -0.0035572052001953125, -0.0006647109985351562, 0.002227783203125, 0.005120277404785156, 0.008012771606445312, 0.010905265808105469, 0.013797760009765625, 0.01669025421142578, 0.019582748413085938, 0.022475242614746094, 0.02536773681640625, 0.028260231018066406, 0.031152725219726562, 0.03404521942138672, 0.036937713623046875, 0.03983020782470703, 0.04272270202636719, 0.045615196228027344, 0.0485076904296875, 0.051400184631347656, 0.05429267883300781, 0.05718517303466797, 0.060077667236328125, 0.06297016143798828, 0.06586265563964844, 0.0687551498413086, 0.07164764404296875, 0.0745401382446289, 0.07743263244628906, 0.08032512664794922, 0.08321762084960938, 0.08611011505126953, 0.08900260925292969, 0.09189510345458984, 0.09478759765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 0.0, 3.0, 4.0, 0.0, 4.0, 9.0, 14.0, 11.0, 16.0, 19.0, 28.0, 31.0, 38.0, 58.0, 44.0, 66.0, 64.0, 85.0, 69.0, 74.0, 66.0, 49.0, 51.0, 43.0, 29.0, 19.0, 25.0, 14.0, 14.0, 7.0, 7.0, 7.0, 4.0, 7.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.024627685546875, -0.023868560791015625, -0.02310943603515625, -0.022350311279296875, -0.0215911865234375, -0.020832061767578125, -0.02007293701171875, -0.019313812255859375, -0.0185546875, -0.017795562744140625, -0.01703643798828125, -0.016277313232421875, -0.0155181884765625, -0.014759063720703125, -0.01399993896484375, -0.013240814208984375, -0.012481689453125, -0.011722564697265625, -0.01096343994140625, -0.010204315185546875, -0.0094451904296875, -0.008686065673828125, -0.00792694091796875, -0.007167816162109375, -0.00640869140625, -0.005649566650390625, -0.00489044189453125, -0.004131317138671875, -0.0033721923828125, -0.002613067626953125, -0.00185394287109375, -0.001094818115234375, -0.000335693359375, 0.000423431396484375, 0.00118255615234375, 0.001941680908203125, 0.0027008056640625, 0.003459930419921875, 0.00421905517578125, 0.004978179931640625, 0.0057373046875, 0.006496429443359375, 0.00725555419921875, 0.008014678955078125, 0.0087738037109375, 0.009532928466796875, 0.01029205322265625, 0.011051177978515625, 0.011810302734375, 0.012569427490234375, 0.01332855224609375, 0.014087677001953125, 0.0148468017578125, 0.015605926513671875, 0.01636505126953125, 0.017124176025390625, 0.01788330078125, 0.018642425537109375, 0.01940155029296875, 0.020160675048828125, 0.0209197998046875, 0.021678924560546875, 0.02243804931640625, 0.023197174072265625, 0.023956298828125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 25.0, 65.0, 154.0, 265.0, 234.0, 165.0, 67.0, 20.0, 10.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.17115592956543, -14.826726913452148, -14.482297897338867, -14.137869834899902, -13.793440818786621, -13.44901180267334, -13.104583740234375, -12.760154724121094, -12.415725708007812, -12.071296691894531, -11.72686767578125, -11.382439613342285, -11.038010597229004, -10.693581581115723, -10.349153518676758, -10.004724502563477, -9.660295486450195, -9.315866470336914, -8.971437454223633, -8.627009391784668, -8.282580375671387, -7.9381513595581055, -7.593722820281982, -7.249294281005859, -6.904865264892578, -6.560436248779297, -6.216007709503174, -5.871579170227051, -5.5271501541137695, -5.182721138000488, -4.838292598724365, -4.493864059448242, -4.149434566497803, -3.8050057888031006, -3.4605770111083984, -3.1161482334136963, -2.771719455718994, -2.427290678024292, -2.08286190032959, -1.7384331226348877, -1.3940043449401855, -1.0495755672454834, -0.7051467895507812, -0.3607180118560791, -0.016289234161376953, 0.3281395435333252, 0.6725683212280273, 1.0169970989227295, 1.3614258766174316, 1.7058546543121338, 2.050283432006836, 2.394712209701538, 2.7391409873962402, 3.0835697650909424, 3.4279985427856445, 3.7724273204803467, 4.116856098175049, 4.461284637451172, 4.805713653564453, 5.150142669677734, 5.494571208953857, 5.8389997482299805, 6.183428764343262, 6.527857780456543, 6.872286319732666]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 7.0, 9.0, 5.0, 14.0, 11.0, 17.0, 23.0, 30.0, 39.0, 40.0, 32.0, 40.0, 37.0, 40.0, 37.0, 49.0, 60.0, 54.0, 47.0, 46.0, 41.0, 34.0, 36.0, 33.0, 41.0, 35.0, 24.0, 19.0, 23.0, 17.0, 12.0, 20.0, 8.0, 7.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.383441686630249, -2.2934117317199707, -2.2033820152282715, -2.113352060317993, -2.023322105407715, -1.9332923889160156, -1.8432624340057373, -1.7532325983047485, -1.6632027626037598, -1.573172926902771, -1.4831430912017822, -1.393113136291504, -1.3030833005905151, -1.2130534648895264, -1.123023509979248, -1.0329936742782593, -0.9429638385772705, -0.8529340028762817, -0.7629041075706482, -0.6728742122650146, -0.5828443765640259, -0.4928145110607147, -0.40278464555740356, -0.31275475025177, -0.22272491455078125, -0.1326950490474701, -0.042665183544158936, 0.04736468195915222, 0.13739454746246338, 0.22742441296577454, 0.3174542784690857, 0.40748417377471924, 0.4975137710571289, 0.5875436067581177, 0.6775735020637512, 0.7676033973693848, 0.8576332330703735, 0.9476630687713623, 1.0376930236816406, 1.1277228593826294, 1.2177526950836182, 1.307782530784607, 1.3978123664855957, 1.487842321395874, 1.5778721570968628, 1.6679019927978516, 1.7579319477081299, 1.8479617834091187, 1.9379916191101074, 2.0280215740203857, 2.118051290512085, 2.2080812454223633, 2.2981109619140625, 2.388140916824341, 2.478170871734619, 2.5682005882263184, 2.6582305431365967, 2.748260498046875, 2.838290214538574, 2.9283201694488525, 3.018350124359131, 3.10837984085083, 3.1984097957611084, 3.2884397506713867, 3.378469467163086]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 15.0, 16.0, 45.0, 57.0, 115.0, 304.0, 653.0, 1746.0, 6120.0, 23515.0, 91917.0, 425766.0, 383943.0, 84410.0, 21451.0, 5602.0, 1632.0, 639.0, 271.0, 145.0, 74.0, 42.0, 20.0, 16.0, 8.0, 4.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.85546875, -2.73114013671875, -2.6068115234375, -2.48248291015625, -2.358154296875, -2.23382568359375, -2.1094970703125, -1.98516845703125, -1.86083984375, -1.73651123046875, -1.6121826171875, -1.48785400390625, -1.363525390625, -1.23919677734375, -1.1148681640625, -0.99053955078125, -0.8662109375, -0.74188232421875, -0.6175537109375, -0.49322509765625, -0.368896484375, -0.24456787109375, -0.1202392578125, 0.00408935546875, 0.12841796875, 0.25274658203125, 0.3770751953125, 0.50140380859375, 0.625732421875, 0.75006103515625, 0.8743896484375, 0.99871826171875, 1.123046875, 1.24737548828125, 1.3717041015625, 1.49603271484375, 1.620361328125, 1.74468994140625, 1.8690185546875, 1.99334716796875, 2.11767578125, 2.24200439453125, 2.3663330078125, 2.49066162109375, 2.614990234375, 2.73931884765625, 2.8636474609375, 2.98797607421875, 3.1123046875, 3.23663330078125, 3.3609619140625, 3.48529052734375, 3.609619140625, 3.73394775390625, 3.8582763671875, 3.98260498046875, 4.10693359375, 4.23126220703125, 4.3555908203125, 4.47991943359375, 4.604248046875, 4.72857666015625, 4.8529052734375, 4.97723388671875, 5.1015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 17.0, 15.0, 13.0, 23.0, 20.0, 33.0, 28.0, 31.0, 39.0, 44.0, 36.0, 35.0, 37.0, 50.0, 35.0, 43.0, 44.0, 41.0, 44.0, 35.0, 33.0, 36.0, 24.0, 42.0, 20.0, 24.0, 18.0, 23.0, 13.0, 21.0, 13.0, 17.0, 2.0, 7.0, 10.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.36138916015625, -4.2149658203125, -4.06854248046875, -3.922119140625, -3.77569580078125, -3.6292724609375, -3.48284912109375, -3.33642578125, -3.19000244140625, -3.0435791015625, -2.89715576171875, -2.750732421875, -2.60430908203125, -2.4578857421875, -2.31146240234375, -2.1650390625, -2.01861572265625, -1.8721923828125, -1.72576904296875, -1.579345703125, -1.43292236328125, -1.2864990234375, -1.14007568359375, -0.99365234375, -0.84722900390625, -0.7008056640625, -0.55438232421875, -0.407958984375, -0.26153564453125, -0.1151123046875, 0.03131103515625, 0.177734375, 0.32415771484375, 0.4705810546875, 0.61700439453125, 0.763427734375, 0.90985107421875, 1.0562744140625, 1.20269775390625, 1.34912109375, 1.49554443359375, 1.6419677734375, 1.78839111328125, 1.934814453125, 2.08123779296875, 2.2276611328125, 2.37408447265625, 2.5205078125, 2.66693115234375, 2.8133544921875, 2.95977783203125, 3.106201171875, 3.25262451171875, 3.3990478515625, 3.54547119140625, 3.69189453125, 3.83831787109375, 3.9847412109375, 4.13116455078125, 4.277587890625, 4.42401123046875, 4.5704345703125, 4.71685791015625, 4.86328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 12.0, 10.0, 5.0, 6.0, 20.0, 20.0, 17.0, 23.0, 34.0, 53.0, 104.0, 141.0, 307.0, 906.0, 17036.0, 941460.0, 85841.0, 1593.0, 447.0, 180.0, 95.0, 65.0, 32.0, 36.0, 16.0, 17.0, 15.0, 13.0, 11.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.734375, -14.33251953125, -13.9306640625, -13.52880859375, -13.126953125, -12.72509765625, -12.3232421875, -11.92138671875, -11.51953125, -11.11767578125, -10.7158203125, -10.31396484375, -9.912109375, -9.51025390625, -9.1083984375, -8.70654296875, -8.3046875, -7.90283203125, -7.5009765625, -7.09912109375, -6.697265625, -6.29541015625, -5.8935546875, -5.49169921875, -5.08984375, -4.68798828125, -4.2861328125, -3.88427734375, -3.482421875, -3.08056640625, -2.6787109375, -2.27685546875, -1.875, -1.47314453125, -1.0712890625, -0.66943359375, -0.267578125, 0.13427734375, 0.5361328125, 0.93798828125, 1.33984375, 1.74169921875, 2.1435546875, 2.54541015625, 2.947265625, 3.34912109375, 3.7509765625, 4.15283203125, 4.5546875, 4.95654296875, 5.3583984375, 5.76025390625, 6.162109375, 6.56396484375, 6.9658203125, 7.36767578125, 7.76953125, 8.17138671875, 8.5732421875, 8.97509765625, 9.376953125, 9.77880859375, 10.1806640625, 10.58251953125, 10.984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 8.0, 7.0, 12.0, 11.0, 11.0, 21.0, 19.0, 19.0, 41.0, 19.0, 23.0, 16.0, 29.0, 41.0, 42.0, 41.0, 51.0, 44.0, 41.0, 51.0, 33.0, 48.0, 47.0, 35.0, 27.0, 47.0, 24.0, 27.0, 22.0, 17.0, 26.0, 17.0, 13.0, 12.0, 9.0, 5.0, 6.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.7421875, -5.56597900390625, -5.3897705078125, -5.21356201171875, -5.037353515625, -4.86114501953125, -4.6849365234375, -4.50872802734375, -4.33251953125, -4.15631103515625, -3.9801025390625, -3.80389404296875, -3.627685546875, -3.45147705078125, -3.2752685546875, -3.09906005859375, -2.9228515625, -2.74664306640625, -2.5704345703125, -2.39422607421875, -2.218017578125, -2.04180908203125, -1.8656005859375, -1.68939208984375, -1.51318359375, -1.33697509765625, -1.1607666015625, -0.98455810546875, -0.808349609375, -0.63214111328125, -0.4559326171875, -0.27972412109375, -0.103515625, 0.07269287109375, 0.2489013671875, 0.42510986328125, 0.601318359375, 0.77752685546875, 0.9537353515625, 1.12994384765625, 1.30615234375, 1.48236083984375, 1.6585693359375, 1.83477783203125, 2.010986328125, 2.18719482421875, 2.3634033203125, 2.53961181640625, 2.7158203125, 2.89202880859375, 3.0682373046875, 3.24444580078125, 3.420654296875, 3.59686279296875, 3.7730712890625, 3.94927978515625, 4.12548828125, 4.30169677734375, 4.4779052734375, 4.65411376953125, 4.830322265625, 5.00653076171875, 5.1827392578125, 5.35894775390625, 5.53515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 4.0, 11.0, 10.0, 17.0, 34.0, 52.0, 104.0, 207.0, 687.0, 3110.0, 52271.0, 965863.0, 22897.0, 2334.0, 539.0, 176.0, 90.0, 51.0, 29.0, 20.0, 12.0, 6.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25390625, -4.11846923828125, -3.9830322265625, -3.84759521484375, -3.712158203125, -3.57672119140625, -3.4412841796875, -3.30584716796875, -3.17041015625, -3.03497314453125, -2.8995361328125, -2.76409912109375, -2.628662109375, -2.49322509765625, -2.3577880859375, -2.22235107421875, -2.0869140625, -1.95147705078125, -1.8160400390625, -1.68060302734375, -1.545166015625, -1.40972900390625, -1.2742919921875, -1.13885498046875, -1.00341796875, -0.86798095703125, -0.7325439453125, -0.59710693359375, -0.461669921875, -0.32623291015625, -0.1907958984375, -0.05535888671875, 0.080078125, 0.21551513671875, 0.3509521484375, 0.48638916015625, 0.621826171875, 0.75726318359375, 0.8927001953125, 1.02813720703125, 1.16357421875, 1.29901123046875, 1.4344482421875, 1.56988525390625, 1.705322265625, 1.84075927734375, 1.9761962890625, 2.11163330078125, 2.2470703125, 2.38250732421875, 2.5179443359375, 2.65338134765625, 2.788818359375, 2.92425537109375, 3.0596923828125, 3.19512939453125, 3.33056640625, 3.46600341796875, 3.6014404296875, 3.73687744140625, 3.872314453125, 4.00775146484375, 4.1431884765625, 4.27862548828125, 4.4140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 22.0, 27.0, 44.0, 48.0, 64.0, 98.0, 172.0, 162.0, 104.0, 64.0, 52.0, 38.0, 30.0, 17.0, 14.0, 12.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0003829002380371094, -0.00037333741784095764, -0.0003637745976448059, -0.0003542117774486542, -0.00034464895725250244, -0.0003350861370563507, -0.000325523316860199, -0.00031596049666404724, -0.0003063976764678955, -0.0002968348562717438, -0.00028727203607559204, -0.0002777092158794403, -0.0002681463956832886, -0.00025858357548713684, -0.0002490207552909851, -0.00023945793509483337, -0.00022989511489868164, -0.0002203322947025299, -0.00021076947450637817, -0.00020120665431022644, -0.0001916438341140747, -0.00018208101391792297, -0.00017251819372177124, -0.0001629553735256195, -0.00015339255332946777, -0.00014382973313331604, -0.0001342669129371643, -0.00012470409274101257, -0.00011514127254486084, -0.0001055784523487091, -9.601563215255737e-05, -8.645281195640564e-05, -7.68899917602539e-05, -6.732717156410217e-05, -5.776435136795044e-05, -4.8201531171798706e-05, -3.863871097564697e-05, -2.907589077949524e-05, -1.9513070583343506e-05, -9.950250387191772e-06, -3.8743019104003906e-07, 9.175390005111694e-06, 1.8738210201263428e-05, 2.830103039741516e-05, 3.7863850593566895e-05, 4.742667078971863e-05, 5.698949098587036e-05, 6.65523111820221e-05, 7.611513137817383e-05, 8.567795157432556e-05, 9.52407717704773e-05, 0.00010480359196662903, 0.00011436641216278076, 0.0001239292323589325, 0.00013349205255508423, 0.00014305487275123596, 0.0001526176929473877, 0.00016218051314353943, 0.00017174333333969116, 0.0001813061535358429, 0.00019086897373199463, 0.00020043179392814636, 0.0002099946141242981, 0.00021955743432044983, 0.00022912025451660156]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 9.0, 9.0, 22.0, 20.0, 23.0, 38.0, 76.0, 135.0, 268.0, 547.0, 1665.0, 7593.0, 445688.0, 581148.0, 8264.0, 1792.0, 592.0, 275.0, 133.0, 100.0, 51.0, 29.0, 14.0, 19.0, 12.0, 6.0, 9.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.890625, -4.7509765625, -4.611328125, -4.4716796875, -4.33203125, -4.1923828125, -4.052734375, -3.9130859375, -3.7734375, -3.6337890625, -3.494140625, -3.3544921875, -3.21484375, -3.0751953125, -2.935546875, -2.7958984375, -2.65625, -2.5166015625, -2.376953125, -2.2373046875, -2.09765625, -1.9580078125, -1.818359375, -1.6787109375, -1.5390625, -1.3994140625, -1.259765625, -1.1201171875, -0.98046875, -0.8408203125, -0.701171875, -0.5615234375, -0.421875, -0.2822265625, -0.142578125, -0.0029296875, 0.13671875, 0.2763671875, 0.416015625, 0.5556640625, 0.6953125, 0.8349609375, 0.974609375, 1.1142578125, 1.25390625, 1.3935546875, 1.533203125, 1.6728515625, 1.8125, 1.9521484375, 2.091796875, 2.2314453125, 2.37109375, 2.5107421875, 2.650390625, 2.7900390625, 2.9296875, 3.0693359375, 3.208984375, 3.3486328125, 3.48828125, 3.6279296875, 3.767578125, 3.9072265625, 4.046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 14.0, 15.0, 14.0, 31.0, 23.0, 39.0, 54.0, 69.0, 82.0, 182.0, 149.0, 74.0, 79.0, 41.0, 34.0, 25.0, 21.0, 20.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.88232421875, -0.8546600341796875, -0.826995849609375, -0.7993316650390625, -0.77166748046875, -0.7440032958984375, -0.716339111328125, -0.6886749267578125, -0.6610107421875, -0.6333465576171875, -0.605682373046875, -0.5780181884765625, -0.55035400390625, -0.5226898193359375, -0.495025634765625, -0.4673614501953125, -0.439697265625, -0.4120330810546875, -0.384368896484375, -0.3567047119140625, -0.32904052734375, -0.3013763427734375, -0.273712158203125, -0.2460479736328125, -0.2183837890625, -0.1907196044921875, -0.163055419921875, -0.1353912353515625, -0.10772705078125, -0.0800628662109375, -0.052398681640625, -0.0247344970703125, 0.0029296875, 0.0305938720703125, 0.058258056640625, 0.0859222412109375, 0.11358642578125, 0.1412506103515625, 0.168914794921875, 0.1965789794921875, 0.2242431640625, 0.2519073486328125, 0.279571533203125, 0.3072357177734375, 0.33489990234375, 0.3625640869140625, 0.390228271484375, 0.4178924560546875, 0.445556640625, 0.4732208251953125, 0.500885009765625, 0.5285491943359375, 0.55621337890625, 0.5838775634765625, 0.611541748046875, 0.6392059326171875, 0.6668701171875, 0.6945343017578125, 0.722198486328125, 0.7498626708984375, 0.77752685546875, 0.8051910400390625, 0.832855224609375, 0.8605194091796875, 0.88818359375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 12.0, 20.0, 27.0, 46.0, 66.0, 66.0, 98.0, 121.0, 121.0, 102.0, 81.0, 80.0, 66.0, 34.0, 23.0, 17.0, 10.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.639266014099121, -8.355813980102539, -8.072362899780273, -7.788910865783691, -7.505458831787109, -7.2220072746276855, -6.938555717468262, -6.65510368347168, -6.371652126312256, -6.088200569152832, -5.80474853515625, -5.521296977996826, -5.237845420837402, -4.95439338684082, -4.6709418296813965, -4.387490272521973, -4.104038238525391, -3.8205864429473877, -3.5371346473693848, -3.253683090209961, -2.970231294631958, -2.686779499053955, -2.4033279418945312, -2.1198761463165283, -1.8364243507385254, -1.5529725551605225, -1.269520878791809, -0.9860691428184509, -0.7026174068450928, -0.41916561126708984, -0.13571393489837646, 0.14773774147033691, 0.43119049072265625, 0.7146422266960144, 0.9980939626693726, 1.281545639038086, 1.5649974346160889, 1.8484492301940918, 2.1319007873535156, 2.4153525829315186, 2.6988043785095215, 2.9822561740875244, 3.2657079696655273, 3.549159526824951, 3.832611322402954, 4.116063117980957, 4.399514675140381, 4.682966232299805, 4.966418266296387, 5.2498698234558105, 5.533321857452393, 5.816773414611816, 6.100225448608398, 6.383677005767822, 6.667128562927246, 6.950580596923828, 7.234032154083252, 7.517483711242676, 7.800935745239258, 8.08438777923584, 8.367838859558105, 8.651290893554688, 8.93474292755127, 9.218194007873535, 9.501646041870117]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 5.0, 4.0, 10.0, 1.0, 8.0, 11.0, 9.0, 5.0, 14.0, 14.0, 19.0, 15.0, 24.0, 26.0, 23.0, 27.0, 22.0, 29.0, 28.0, 37.0, 37.0, 20.0, 23.0, 45.0, 39.0, 27.0, 43.0, 22.0, 38.0, 29.0, 29.0, 25.0, 28.0, 25.0, 27.0, 31.0, 24.0, 20.0, 10.0, 14.0, 16.0, 17.0, 12.0, 10.0, 10.0, 9.0, 7.0, 6.0, 5.0, 1.0, 0.0, 8.0, 3.0, 5.0, 2.0, 1.0], "bins": [-7.011007308959961, -6.798781871795654, -6.586556911468506, -6.374331474304199, -6.162106037139893, -5.949880599975586, -5.7376556396484375, -5.525430202484131, -5.313204765319824, -5.100979328155518, -4.888754367828369, -4.6765289306640625, -4.464303493499756, -4.252078056335449, -4.039853096008301, -3.827627658843994, -3.6154024600982666, -3.403177261352539, -3.1909518241882324, -2.978726625442505, -2.7665011882781982, -2.5542759895324707, -2.342050552368164, -2.1298253536224365, -1.9176000356674194, -1.7053747177124023, -1.4931493997573853, -1.2809240818023682, -1.0686988830566406, -0.8564735651016235, -0.6442482471466064, -0.43202292919158936, -0.21979761123657227, -0.00757230818271637, 0.20465299487113953, 0.41687828302383423, 0.6291036009788513, 0.8413288593292236, 1.0535541772842407, 1.2657794952392578, 1.478004813194275, 1.690230131149292, 1.902455449104309, 2.114680767059326, 2.3269059658050537, 2.5391311645507812, 2.751356601715088, 2.9635820388793945, 3.175807237625122, 3.3880324363708496, 3.6002578735351562, 3.812483072280884, 4.024708271026611, 4.236933708190918, 4.449159145355225, 4.661384582519531, 4.87360954284668, 5.085834980010986, 5.298059940338135, 5.510285377502441, 5.722510814666748, 5.934736251831055, 6.146961212158203, 6.35918664932251, 6.571412086486816]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 8.0, 9.0, 14.0, 17.0, 18.0, 33.0, 42.0, 47.0, 74.0, 125.0, 173.0, 323.0, 629.0, 1636.0, 5951.0, 31966.0, 261035.0, 1890414.0, 1748611.0, 217538.0, 27089.0, 5367.0, 1541.0, 604.0, 344.0, 209.0, 125.0, 101.0, 67.0, 41.0, 31.0, 25.0, 20.0, 16.0, 14.0, 7.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.43841552734375, -4.2674560546875, -4.09649658203125, -3.925537109375, -3.75457763671875, -3.5836181640625, -3.41265869140625, -3.24169921875, -3.07073974609375, -2.8997802734375, -2.72882080078125, -2.557861328125, -2.38690185546875, -2.2159423828125, -2.04498291015625, -1.8740234375, -1.70306396484375, -1.5321044921875, -1.36114501953125, -1.190185546875, -1.01922607421875, -0.8482666015625, -0.67730712890625, -0.50634765625, -0.33538818359375, -0.1644287109375, 0.00653076171875, 0.177490234375, 0.34844970703125, 0.5194091796875, 0.69036865234375, 0.861328125, 1.03228759765625, 1.2032470703125, 1.37420654296875, 1.545166015625, 1.71612548828125, 1.8870849609375, 2.05804443359375, 2.22900390625, 2.39996337890625, 2.5709228515625, 2.74188232421875, 2.912841796875, 3.08380126953125, 3.2547607421875, 3.42572021484375, 3.5966796875, 3.76763916015625, 3.9385986328125, 4.10955810546875, 4.280517578125, 4.45147705078125, 4.6224365234375, 4.79339599609375, 4.96435546875, 5.13531494140625, 5.3062744140625, 5.47723388671875, 5.648193359375, 5.81915283203125, 5.9901123046875, 6.16107177734375, 6.33203125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 9.0, 10.0, 9.0, 15.0, 23.0, 27.0, 20.0, 40.0, 49.0, 41.0, 40.0, 50.0, 43.0, 51.0, 52.0, 51.0, 42.0, 52.0, 47.0, 38.0, 37.0, 52.0, 34.0, 31.0, 28.0, 22.0, 14.0, 16.0, 14.0, 14.0, 7.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.085235595703125, -2.96929931640625, -2.853363037109375, -2.7374267578125, -2.621490478515625, -2.50555419921875, -2.389617919921875, -2.273681640625, -2.157745361328125, -2.04180908203125, -1.925872802734375, -1.8099365234375, -1.694000244140625, -1.57806396484375, -1.462127685546875, -1.34619140625, -1.230255126953125, -1.11431884765625, -0.998382568359375, -0.8824462890625, -0.766510009765625, -0.65057373046875, -0.534637451171875, -0.418701171875, -0.302764892578125, -0.18682861328125, -0.070892333984375, 0.0450439453125, 0.160980224609375, 0.27691650390625, 0.392852783203125, 0.5087890625, 0.624725341796875, 0.74066162109375, 0.856597900390625, 0.9725341796875, 1.088470458984375, 1.20440673828125, 1.320343017578125, 1.436279296875, 1.552215576171875, 1.66815185546875, 1.784088134765625, 1.9000244140625, 2.015960693359375, 2.13189697265625, 2.247833251953125, 2.36376953125, 2.479705810546875, 2.59564208984375, 2.711578369140625, 2.8275146484375, 2.943450927734375, 3.05938720703125, 3.175323486328125, 3.291259765625, 3.407196044921875, 3.52313232421875, 3.639068603515625, 3.7550048828125, 3.870941162109375, 3.98687744140625, 4.102813720703125, 4.21875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 7.0, 3.0, 4.0, 5.0, 8.0, 9.0, 12.0, 37.0, 33.0, 47.0, 71.0, 110.0, 177.0, 359.0, 692.0, 1522.0, 4642.0, 29448.0, 1051741.0, 3022076.0, 71943.0, 7517.0, 1971.0, 824.0, 410.0, 220.0, 133.0, 84.0, 45.0, 35.0, 20.0, 19.0, 14.0, 14.0, 8.0, 5.0, 6.0, 6.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6484375, -6.394287109375, -6.14013671875, -5.885986328125, -5.6318359375, -5.377685546875, -5.12353515625, -4.869384765625, -4.615234375, -4.361083984375, -4.10693359375, -3.852783203125, -3.5986328125, -3.344482421875, -3.09033203125, -2.836181640625, -2.58203125, -2.327880859375, -2.07373046875, -1.819580078125, -1.5654296875, -1.311279296875, -1.05712890625, -0.802978515625, -0.548828125, -0.294677734375, -0.04052734375, 0.213623046875, 0.4677734375, 0.721923828125, 0.97607421875, 1.230224609375, 1.484375, 1.738525390625, 1.99267578125, 2.246826171875, 2.5009765625, 2.755126953125, 3.00927734375, 3.263427734375, 3.517578125, 3.771728515625, 4.02587890625, 4.280029296875, 4.5341796875, 4.788330078125, 5.04248046875, 5.296630859375, 5.55078125, 5.804931640625, 6.05908203125, 6.313232421875, 6.5673828125, 6.821533203125, 7.07568359375, 7.329833984375, 7.583984375, 7.838134765625, 8.09228515625, 8.346435546875, 8.6005859375, 8.854736328125, 9.10888671875, 9.363037109375, 9.6171875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 13.0, 12.0, 22.0, 35.0, 42.0, 67.0, 114.0, 145.0, 210.0, 320.0, 429.0, 496.0, 518.0, 458.0, 357.0, 253.0, 180.0, 103.0, 91.0, 66.0, 33.0, 24.0, 21.0, 10.0, 9.0, 10.0, 9.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.732421875, -1.681854248046875, -1.63128662109375, -1.580718994140625, -1.5301513671875, -1.479583740234375, -1.42901611328125, -1.378448486328125, -1.327880859375, -1.277313232421875, -1.22674560546875, -1.176177978515625, -1.1256103515625, -1.075042724609375, -1.02447509765625, -0.973907470703125, -0.92333984375, -0.872772216796875, -0.82220458984375, -0.771636962890625, -0.7210693359375, -0.670501708984375, -0.61993408203125, -0.569366455078125, -0.518798828125, -0.468231201171875, -0.41766357421875, -0.367095947265625, -0.3165283203125, -0.265960693359375, -0.21539306640625, -0.164825439453125, -0.1142578125, -0.063690185546875, -0.01312255859375, 0.037445068359375, 0.0880126953125, 0.138580322265625, 0.18914794921875, 0.239715576171875, 0.290283203125, 0.340850830078125, 0.39141845703125, 0.441986083984375, 0.4925537109375, 0.543121337890625, 0.59368896484375, 0.644256591796875, 0.69482421875, 0.745391845703125, 0.79595947265625, 0.846527099609375, 0.8970947265625, 0.947662353515625, 0.99822998046875, 1.048797607421875, 1.099365234375, 1.149932861328125, 1.20050048828125, 1.251068115234375, 1.3016357421875, 1.352203369140625, 1.40277099609375, 1.453338623046875, 1.50390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 9.0, 13.0, 19.0, 20.0, 47.0, 48.0, 49.0, 66.0, 81.0, 79.0, 77.0, 68.0, 70.0, 66.0, 64.0, 48.0, 46.0, 30.0, 22.0, 15.0, 27.0, 16.0, 9.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.763986825942993, -3.6003661155700684, -3.4367451667785645, -3.2731244564056396, -3.109503746032715, -2.94588303565979, -2.7822623252868652, -2.6186413764953613, -2.4550206661224365, -2.2913999557495117, -2.127779006958008, -1.964158296585083, -1.8005375862121582, -1.6369168758392334, -1.473296046257019, -1.3096752166748047, -1.1460545063018799, -0.9824337363243103, -0.8188129663467407, -0.6551921963691711, -0.49157142639160156, -0.327950656414032, -0.1643298864364624, -0.0007090568542480469, 0.16291165351867676, 0.32653242349624634, 0.4901531934738159, 0.6537739634513855, 0.8173947334289551, 0.9810155034065247, 1.1446362733840942, 1.3082571029663086, 1.4718775749206543, 1.635498285293579, 1.7991191148757935, 1.9627399444580078, 2.1263606548309326, 2.2899813652038574, 2.4536023139953613, 2.617223024368286, 2.780843734741211, 2.9444644451141357, 3.1080851554870605, 3.2717061042785645, 3.4353268146514893, 3.598947525024414, 3.762568473815918, 3.9261891841888428, 4.089809894561768, 4.2534308433532715, 4.417051315307617, 4.580672264099121, 4.744293212890625, 4.907913684844971, 5.071534633636475, 5.23515510559082, 5.398776054382324, 5.562397003173828, 5.726017475128174, 5.889638423919678, 6.053258895874023, 6.216879844665527, 6.380500793457031, 6.544121742248535, 6.707742214202881]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 7.0, 8.0, 20.0, 13.0, 15.0, 19.0, 16.0, 29.0, 30.0, 38.0, 51.0, 24.0, 30.0, 34.0, 40.0, 54.0, 32.0, 52.0, 45.0, 48.0, 32.0, 38.0, 28.0, 39.0, 43.0, 35.0, 31.0, 23.0, 24.0, 18.0, 14.0, 13.0, 8.0, 8.0, 12.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.936814308166504, -3.8266875743865967, -3.7165610790252686, -3.6064343452453613, -3.496307849884033, -3.386181116104126, -3.2760543823242188, -3.1659278869628906, -3.0558013916015625, -2.9456746578216553, -2.835548162460327, -2.72542142868042, -2.615294933319092, -2.5051681995391846, -2.3950414657592773, -2.284914970397949, -2.174788236618042, -2.0646615028381348, -1.9545350074768066, -1.8444082736968994, -1.7342817783355713, -1.624155044555664, -1.5140284299850464, -1.4039018154144287, -1.293775200843811, -1.1836485862731934, -1.0735219717025757, -0.9633952975273132, -0.8532686829566956, -0.7431420683860779, -0.6330153942108154, -0.5228887796401978, -0.412761926651001, -0.3026353120803833, -0.19250866770744324, -0.08238202333450317, 0.027744591236114502, 0.13787120580673218, 0.24799787998199463, 0.3581244945526123, 0.46825110912323, 0.5783777236938477, 0.6885043382644653, 0.7986310124397278, 0.9087576270103455, 1.0188841819763184, 1.1290109157562256, 1.2391375303268433, 1.349264144897461, 1.4593907594680786, 1.5695173740386963, 1.6796441078186035, 1.7897706031799316, 1.8998973369598389, 2.010024070739746, 2.120150566101074, 2.2302770614624023, 2.3404037952423096, 2.4505302906036377, 2.560657024383545, 2.670783519744873, 2.7809102535247803, 2.8910369873046875, 3.0011634826660156, 3.111290216445923]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 11.0, 8.0, 13.0, 23.0, 17.0, 39.0, 57.0, 80.0, 126.0, 234.0, 373.0, 777.0, 1470.0, 3448.0, 9295.0, 32361.0, 137456.0, 437246.0, 316440.0, 78302.0, 19580.0, 6242.0, 2465.0, 1125.0, 556.0, 318.0, 165.0, 114.0, 71.0, 44.0, 27.0, 26.0, 16.0, 7.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6021575927734375, -0.578826904296875, -0.5554962158203125, -0.53216552734375, -0.5088348388671875, -0.485504150390625, -0.4621734619140625, -0.4388427734375, -0.4155120849609375, -0.392181396484375, -0.3688507080078125, -0.34552001953125, -0.3221893310546875, -0.298858642578125, -0.2755279541015625, -0.252197265625, -0.2288665771484375, -0.205535888671875, -0.1822052001953125, -0.15887451171875, -0.1355438232421875, -0.112213134765625, -0.0888824462890625, -0.0655517578125, -0.0422210693359375, -0.018890380859375, 0.0044403076171875, 0.02777099609375, 0.0511016845703125, 0.074432373046875, 0.0977630615234375, 0.12109375, 0.1444244384765625, 0.167755126953125, 0.1910858154296875, 0.21441650390625, 0.2377471923828125, 0.261077880859375, 0.2844085693359375, 0.3077392578125, 0.3310699462890625, 0.354400634765625, 0.3777313232421875, 0.40106201171875, 0.4243927001953125, 0.447723388671875, 0.4710540771484375, 0.494384765625, 0.5177154541015625, 0.541046142578125, 0.5643768310546875, 0.58770751953125, 0.6110382080078125, 0.634368896484375, 0.6576995849609375, 0.6810302734375, 0.7043609619140625, 0.727691650390625, 0.7510223388671875, 0.77435302734375, 0.7976837158203125, 0.821014404296875, 0.8443450927734375, 0.86767578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 11.0, 15.0, 10.0, 14.0, 17.0, 25.0, 28.0, 33.0, 41.0, 44.0, 42.0, 55.0, 54.0, 50.0, 44.0, 52.0, 50.0, 65.0, 46.0, 30.0, 49.0, 38.0, 38.0, 24.0, 28.0, 17.0, 16.0, 13.0, 10.0, 13.0, 6.0, 3.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.302734375, -2.21453857421875, -2.1263427734375, -2.03814697265625, -1.949951171875, -1.86175537109375, -1.7735595703125, -1.68536376953125, -1.59716796875, -1.50897216796875, -1.4207763671875, -1.33258056640625, -1.244384765625, -1.15618896484375, -1.0679931640625, -0.97979736328125, -0.8916015625, -0.80340576171875, -0.7152099609375, -0.62701416015625, -0.538818359375, -0.45062255859375, -0.3624267578125, -0.27423095703125, -0.18603515625, -0.09783935546875, -0.0096435546875, 0.07855224609375, 0.166748046875, 0.25494384765625, 0.3431396484375, 0.43133544921875, 0.51953125, 0.60772705078125, 0.6959228515625, 0.78411865234375, 0.872314453125, 0.96051025390625, 1.0487060546875, 1.13690185546875, 1.22509765625, 1.31329345703125, 1.4014892578125, 1.48968505859375, 1.577880859375, 1.66607666015625, 1.7542724609375, 1.84246826171875, 1.9306640625, 2.01885986328125, 2.1070556640625, 2.19525146484375, 2.283447265625, 2.37164306640625, 2.4598388671875, 2.54803466796875, 2.63623046875, 2.72442626953125, 2.8126220703125, 2.90081787109375, 2.989013671875, 3.07720947265625, 3.1654052734375, 3.25360107421875, 3.341796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 12.0, 3.0, 16.0, 13.0, 16.0, 25.0, 29.0, 53.0, 121.0, 201.0, 408.0, 728.0, 1489.0, 3173.0, 6943.0, 14758.0, 31627.0, 65225.0, 123957.0, 196043.0, 228848.0, 174068.0, 101847.0, 52067.0, 24860.0, 11717.0, 5352.0, 2506.0, 1194.0, 573.0, 307.0, 130.0, 86.0, 50.0, 34.0, 23.0, 13.0, 9.0, 5.0, 8.0, 8.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.29833984375, -0.2896537780761719, -0.28096771240234375, -0.2722816467285156, -0.2635955810546875, -0.2549095153808594, -0.24622344970703125, -0.23753738403320312, -0.228851318359375, -0.22016525268554688, -0.21147918701171875, -0.20279312133789062, -0.1941070556640625, -0.18542098999023438, -0.17673492431640625, -0.16804885864257812, -0.15936279296875, -0.15067672729492188, -0.14199066162109375, -0.13330459594726562, -0.1246185302734375, -0.11593246459960938, -0.10724639892578125, -0.09856033325195312, -0.089874267578125, -0.08118820190429688, -0.07250213623046875, -0.06381607055664062, -0.0551300048828125, -0.046443939208984375, -0.03775787353515625, -0.029071807861328125, -0.0203857421875, -0.011699676513671875, -0.00301361083984375, 0.005672454833984375, 0.0143585205078125, 0.023044586181640625, 0.03173065185546875, 0.040416717529296875, 0.049102783203125, 0.057788848876953125, 0.06647491455078125, 0.07516098022460938, 0.0838470458984375, 0.09253311157226562, 0.10121917724609375, 0.10990524291992188, 0.11859130859375, 0.12727737426757812, 0.13596343994140625, 0.14464950561523438, 0.1533355712890625, 0.16202163696289062, 0.17070770263671875, 0.17939376831054688, 0.188079833984375, 0.19676589965820312, 0.20545196533203125, 0.21413803100585938, 0.2228240966796875, 0.23151016235351562, 0.24019622802734375, 0.24888229370117188, 0.257568359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 9.0, 6.0, 12.0, 9.0, 12.0, 21.0, 21.0, 23.0, 30.0, 34.0, 30.0, 37.0, 44.0, 52.0, 52.0, 50.0, 51.0, 39.0, 44.0, 59.0, 34.0, 38.0, 45.0, 27.0, 26.0, 34.0, 26.0, 19.0, 19.0, 16.0, 9.0, 13.0, 10.0, 6.0, 9.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.64453125, -5.49005126953125, -5.3355712890625, -5.18109130859375, -5.026611328125, -4.87213134765625, -4.7176513671875, -4.56317138671875, -4.40869140625, -4.25421142578125, -4.0997314453125, -3.94525146484375, -3.790771484375, -3.63629150390625, -3.4818115234375, -3.32733154296875, -3.1728515625, -3.01837158203125, -2.8638916015625, -2.70941162109375, -2.554931640625, -2.40045166015625, -2.2459716796875, -2.09149169921875, -1.93701171875, -1.78253173828125, -1.6280517578125, -1.47357177734375, -1.319091796875, -1.16461181640625, -1.0101318359375, -0.85565185546875, -0.701171875, -0.54669189453125, -0.3922119140625, -0.23773193359375, -0.083251953125, 0.07122802734375, 0.2257080078125, 0.38018798828125, 0.53466796875, 0.68914794921875, 0.8436279296875, 0.99810791015625, 1.152587890625, 1.30706787109375, 1.4615478515625, 1.61602783203125, 1.7705078125, 1.92498779296875, 2.0794677734375, 2.23394775390625, 2.388427734375, 2.54290771484375, 2.6973876953125, 2.85186767578125, 3.00634765625, 3.16082763671875, 3.3153076171875, 3.46978759765625, 3.624267578125, 3.77874755859375, 3.9332275390625, 4.08770751953125, 4.2421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 13.0, 7.0, 23.0, 30.0, 28.0, 41.0, 63.0, 90.0, 115.0, 185.0, 293.0, 520.0, 898.0, 1712.0, 3191.0, 6612.0, 14136.0, 35629.0, 102507.0, 291394.0, 362139.0, 144583.0, 48392.0, 18683.0, 8503.0, 4047.0, 2018.0, 1117.0, 564.0, 359.0, 227.0, 126.0, 95.0, 54.0, 39.0, 27.0, 23.0, 27.0, 13.0, 11.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.051910400390625, -0.050066471099853516, -0.04822254180908203, -0.04637861251831055, -0.04453468322753906, -0.04269075393676758, -0.040846824645996094, -0.03900289535522461, -0.037158966064453125, -0.03531503677368164, -0.033471107482910156, -0.03162717819213867, -0.029783248901367188, -0.027939319610595703, -0.02609539031982422, -0.024251461029052734, -0.02240753173828125, -0.020563602447509766, -0.01871967315673828, -0.016875743865966797, -0.015031814575195312, -0.013187885284423828, -0.011343955993652344, -0.00950002670288086, -0.007656097412109375, -0.005812168121337891, -0.003968238830566406, -0.002124309539794922, -0.0002803802490234375, 0.0015635490417480469, 0.0034074783325195312, 0.005251407623291016, 0.0070953369140625, 0.008939266204833984, 0.010783195495605469, 0.012627124786376953, 0.014471054077148438, 0.016314983367919922, 0.018158912658691406, 0.02000284194946289, 0.021846771240234375, 0.02369070053100586, 0.025534629821777344, 0.027378559112548828, 0.029222488403320312, 0.031066417694091797, 0.03291034698486328, 0.034754276275634766, 0.03659820556640625, 0.038442134857177734, 0.04028606414794922, 0.0421299934387207, 0.04397392272949219, 0.04581785202026367, 0.047661781311035156, 0.04950571060180664, 0.051349639892578125, 0.05319356918334961, 0.055037498474121094, 0.05688142776489258, 0.05872535705566406, 0.06056928634643555, 0.06241321563720703, 0.06425714492797852, 0.06610107421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 6.0, 1.0, 7.0, 6.0, 21.0, 11.0, 18.0, 30.0, 28.0, 36.0, 45.0, 55.0, 42.0, 69.0, 80.0, 80.0, 96.0, 61.0, 57.0, 53.0, 38.0, 37.0, 29.0, 23.0, 12.0, 12.0, 13.0, 10.0, 9.0, 4.0, 3.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-5.7816505432128906e-05, -5.6306831538677216e-05, -5.4797157645225525e-05, -5.3287483751773834e-05, -5.1777809858322144e-05, -5.026813596487045e-05, -4.875846207141876e-05, -4.724878817796707e-05, -4.573911428451538e-05, -4.422944039106369e-05, -4.2719766497612e-05, -4.121009260416031e-05, -3.970041871070862e-05, -3.819074481725693e-05, -3.668107092380524e-05, -3.5171397030353546e-05, -3.3661723136901855e-05, -3.2152049243450165e-05, -3.0642375349998474e-05, -2.9132701456546783e-05, -2.7623027563095093e-05, -2.6113353669643402e-05, -2.460367977619171e-05, -2.309400588274002e-05, -2.158433198928833e-05, -2.007465809583664e-05, -1.856498420238495e-05, -1.7055310308933258e-05, -1.5545636415481567e-05, -1.4035962522029877e-05, -1.2526288628578186e-05, -1.1016614735126495e-05, -9.506940841674805e-06, -7.997266948223114e-06, -6.487593054771423e-06, -4.977919161319733e-06, -3.468245267868042e-06, -1.9585713744163513e-06, -4.4889748096466064e-07, 1.06077641248703e-06, 2.5704503059387207e-06, 4.080124199390411e-06, 5.589798092842102e-06, 7.099471986293793e-06, 8.609145879745483e-06, 1.0118819773197174e-05, 1.1628493666648865e-05, 1.3138167560100555e-05, 1.4647841453552246e-05, 1.6157515347003937e-05, 1.7667189240455627e-05, 1.9176863133907318e-05, 2.068653702735901e-05, 2.21962109208107e-05, 2.370588481426239e-05, 2.521555870771408e-05, 2.672523260116577e-05, 2.8234906494617462e-05, 2.9744580388069153e-05, 3.1254254281520844e-05, 3.2763928174972534e-05, 3.4273602068424225e-05, 3.5783275961875916e-05, 3.7292949855327606e-05, 3.88026237487793e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 6.0, 6.0, 13.0, 19.0, 20.0, 25.0, 42.0, 50.0, 63.0, 116.0, 174.0, 282.0, 418.0, 828.0, 1419.0, 2638.0, 5436.0, 11676.0, 29282.0, 96211.0, 383767.0, 371569.0, 93115.0, 28580.0, 11399.0, 5280.0, 2702.0, 1386.0, 768.0, 457.0, 246.0, 169.0, 122.0, 70.0, 49.0, 41.0, 22.0, 23.0, 18.0, 8.0, 9.0, 1.0, 5.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0716552734375, -0.06941509246826172, -0.06717491149902344, -0.06493473052978516, -0.06269454956054688, -0.060454368591308594, -0.05821418762207031, -0.05597400665283203, -0.05373382568359375, -0.05149364471435547, -0.04925346374511719, -0.047013282775878906, -0.044773101806640625, -0.042532920837402344, -0.04029273986816406, -0.03805255889892578, -0.0358123779296875, -0.03357219696044922, -0.03133201599121094, -0.029091835021972656, -0.026851654052734375, -0.024611473083496094, -0.022371292114257812, -0.02013111114501953, -0.01789093017578125, -0.01565074920654297, -0.013410568237304688, -0.011170387268066406, -0.008930206298828125, -0.006690025329589844, -0.0044498443603515625, -0.0022096633911132812, 3.0517578125e-05, 0.0022706985473632812, 0.0045108795166015625, 0.006751060485839844, 0.008991241455078125, 0.011231422424316406, 0.013471603393554688, 0.01571178436279297, 0.01795196533203125, 0.02019214630126953, 0.022432327270507812, 0.024672508239746094, 0.026912689208984375, 0.029152870178222656, 0.03139305114746094, 0.03363323211669922, 0.0358734130859375, 0.03811359405517578, 0.04035377502441406, 0.042593955993652344, 0.044834136962890625, 0.047074317932128906, 0.04931449890136719, 0.05155467987060547, 0.05379486083984375, 0.05603504180908203, 0.05827522277832031, 0.060515403747558594, 0.06275558471679688, 0.06499576568603516, 0.06723594665527344, 0.06947612762451172, 0.07171630859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 13.0, 9.0, 9.0, 12.0, 22.0, 16.0, 20.0, 21.0, 25.0, 34.0, 54.0, 64.0, 60.0, 83.0, 65.0, 71.0, 74.0, 58.0, 50.0, 50.0, 31.0, 25.0, 21.0, 15.0, 23.0, 8.0, 7.0, 6.0, 6.0, 6.0, 7.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0189208984375, -0.01833939552307129, -0.017757892608642578, -0.017176389694213867, -0.016594886779785156, -0.016013383865356445, -0.015431880950927734, -0.014850378036499023, -0.014268875122070312, -0.013687372207641602, -0.01310586929321289, -0.01252436637878418, -0.011942863464355469, -0.011361360549926758, -0.010779857635498047, -0.010198354721069336, -0.009616851806640625, -0.009035348892211914, -0.008453845977783203, -0.007872343063354492, -0.007290840148925781, -0.00670933723449707, -0.006127834320068359, -0.0055463314056396484, -0.0049648284912109375, -0.0043833255767822266, -0.0038018226623535156, -0.0032203197479248047, -0.0026388168334960938, -0.002057313919067383, -0.0014758110046386719, -0.0008943080902099609, -0.00031280517578125, 0.00026869773864746094, 0.0008502006530761719, 0.0014317035675048828, 0.0020132064819335938, 0.0025947093963623047, 0.0031762123107910156, 0.0037577152252197266, 0.0043392181396484375, 0.0049207210540771484, 0.005502223968505859, 0.00608372688293457, 0.006665229797363281, 0.007246732711791992, 0.007828235626220703, 0.008409738540649414, 0.008991241455078125, 0.009572744369506836, 0.010154247283935547, 0.010735750198364258, 0.011317253112792969, 0.01189875602722168, 0.01248025894165039, 0.013061761856079102, 0.013643264770507812, 0.014224767684936523, 0.014806270599365234, 0.015387773513793945, 0.015969276428222656, 0.016550779342651367, 0.017132282257080078, 0.01771378517150879, 0.0182952880859375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 17.0, 25.0, 39.0, 71.0, 123.0, 135.0, 154.0, 123.0, 117.0, 75.0, 39.0, 37.0, 21.0, 13.0, 7.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.134188652038574, -5.962375640869141, -5.790562629699707, -5.618749618530273, -5.446937084197998, -5.2751240730285645, -5.103311061859131, -4.931498050689697, -4.759685516357422, -4.587872505187988, -4.416059494018555, -4.244246482849121, -4.072433948516846, -3.900620937347412, -3.7288079261779785, -3.556994915008545, -3.3851819038391113, -3.2133688926696777, -3.0415561199188232, -2.8697431087493896, -2.697930335998535, -2.5261173248291016, -2.354304313659668, -2.1824913024902344, -2.01067852973938, -1.8388656377792358, -1.6670527458190918, -1.4952397346496582, -1.3234268426895142, -1.1516139507293701, -0.9798009395599365, -0.8079880475997925, -0.6361756324768066, -0.4643627107143402, -0.2925497889518738, -0.12073683738708496, 0.05107605457305908, 0.22288894653320312, 0.3947019577026367, 0.5665148496627808, 0.7383277416229248, 0.9101406335830688, 1.081953525543213, 1.2537665367126465, 1.4255794286727905, 1.5973923206329346, 1.7692053318023682, 1.9410182237625122, 2.1128311157226562, 2.28464412689209, 2.4564568996429443, 2.628269910812378, 2.8000826835632324, 2.971895694732666, 3.1437087059020996, 3.315521717071533, 3.4873344898223877, 3.6591475009918213, 3.830960273742676, 4.002773284912109, 4.174586296081543, 4.346399307250977, 4.51821231842041, 4.6900248527526855, 4.861837863922119]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 10.0, 4.0, 20.0, 18.0, 16.0, 7.0, 31.0, 24.0, 32.0, 45.0, 39.0, 28.0, 32.0, 40.0, 43.0, 47.0, 38.0, 51.0, 47.0, 40.0, 35.0, 40.0, 27.0, 49.0, 38.0, 31.0, 32.0, 20.0, 20.0, 13.0, 14.0, 14.0, 9.0, 12.0, 9.0, 2.0, 5.0, 2.0, 1.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2405951023101807, -2.1690683364868164, -2.097541570663452, -2.026014804840088, -1.9544881582260132, -1.882961392402649, -1.8114347457885742, -1.73990797996521, -1.6683812141418457, -1.5968544483184814, -1.5253276824951172, -1.4538010358810425, -1.3822742700576782, -1.310747504234314, -1.2392208576202393, -1.167694091796875, -1.0961673259735107, -1.0246405601501465, -0.953113853931427, -0.8815871477127075, -0.8100603818893433, -0.738533616065979, -0.6670069098472595, -0.59548020362854, -0.5239534378051758, -0.4524267017841339, -0.38089996576309204, -0.30937322974205017, -0.2378464937210083, -0.16631975769996643, -0.09479302167892456, -0.023266315460205078, 0.04826021194458008, 0.11978694796562195, 0.19131368398666382, 0.2628404200077057, 0.33436715602874756, 0.40589389204978943, 0.4774206280708313, 0.5489473342895508, 0.620474100112915, 0.6920008659362793, 0.7635275721549988, 0.8350542783737183, 0.9065810441970825, 0.9781078100204468, 1.0496344566345215, 1.1211612224578857, 1.19268798828125, 1.2642147541046143, 1.3357415199279785, 1.4072681665420532, 1.4787949323654175, 1.5503216981887817, 1.6218483448028564, 1.6933751106262207, 1.764901876449585, 1.8364286422729492, 1.9079554080963135, 1.9794820547103882, 2.051008701324463, 2.122535467147827, 2.1940622329711914, 2.2655889987945557, 2.33711576461792]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 9.0, 11.0, 19.0, 30.0, 55.0, 86.0, 142.0, 293.0, 655.0, 1467.0, 4806.0, 15316.0, 52970.0, 261250.0, 589301.0, 86080.0, 24662.0, 7382.0, 2286.0, 893.0, 398.0, 198.0, 79.0, 57.0, 37.0, 22.0, 10.0, 13.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5625, -3.444488525390625, -3.32647705078125, -3.208465576171875, -3.0904541015625, -2.972442626953125, -2.85443115234375, -2.736419677734375, -2.618408203125, -2.500396728515625, -2.38238525390625, -2.264373779296875, -2.1463623046875, -2.028350830078125, -1.91033935546875, -1.792327880859375, -1.67431640625, -1.556304931640625, -1.43829345703125, -1.320281982421875, -1.2022705078125, -1.084259033203125, -0.96624755859375, -0.848236083984375, -0.730224609375, -0.612213134765625, -0.49420166015625, -0.376190185546875, -0.2581787109375, -0.140167236328125, -0.02215576171875, 0.095855712890625, 0.2138671875, 0.331878662109375, 0.44989013671875, 0.567901611328125, 0.6859130859375, 0.803924560546875, 0.92193603515625, 1.039947509765625, 1.157958984375, 1.275970458984375, 1.39398193359375, 1.511993408203125, 1.6300048828125, 1.748016357421875, 1.86602783203125, 1.984039306640625, 2.10205078125, 2.220062255859375, 2.33807373046875, 2.456085205078125, 2.5740966796875, 2.692108154296875, 2.81011962890625, 2.928131103515625, 3.046142578125, 3.164154052734375, 3.28216552734375, 3.400177001953125, 3.5181884765625, 3.636199951171875, 3.75421142578125, 3.872222900390625, 3.990234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 6.0, 4.0, 15.0, 15.0, 12.0, 14.0, 27.0, 29.0, 23.0, 32.0, 36.0, 45.0, 47.0, 44.0, 43.0, 50.0, 38.0, 61.0, 37.0, 46.0, 50.0, 42.0, 45.0, 33.0, 31.0, 26.0, 26.0, 23.0, 23.0, 12.0, 14.0, 8.0, 12.0, 9.0, 7.0, 4.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3359375, -4.18731689453125, -4.0386962890625, -3.89007568359375, -3.741455078125, -3.59283447265625, -3.4442138671875, -3.29559326171875, -3.14697265625, -2.99835205078125, -2.8497314453125, -2.70111083984375, -2.552490234375, -2.40386962890625, -2.2552490234375, -2.10662841796875, -1.9580078125, -1.80938720703125, -1.6607666015625, -1.51214599609375, -1.363525390625, -1.21490478515625, -1.0662841796875, -0.91766357421875, -0.76904296875, -0.62042236328125, -0.4718017578125, -0.32318115234375, -0.174560546875, -0.02593994140625, 0.1226806640625, 0.27130126953125, 0.419921875, 0.56854248046875, 0.7171630859375, 0.86578369140625, 1.014404296875, 1.16302490234375, 1.3116455078125, 1.46026611328125, 1.60888671875, 1.75750732421875, 1.9061279296875, 2.05474853515625, 2.203369140625, 2.35198974609375, 2.5006103515625, 2.64923095703125, 2.7978515625, 2.94647216796875, 3.0950927734375, 3.24371337890625, 3.392333984375, 3.54095458984375, 3.6895751953125, 3.83819580078125, 3.98681640625, 4.13543701171875, 4.2840576171875, 4.43267822265625, 4.581298828125, 4.72991943359375, 4.8785400390625, 5.02716064453125, 5.17578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 8.0, 5.0, 7.0, 9.0, 10.0, 18.0, 17.0, 25.0, 30.0, 43.0, 41.0, 52.0, 104.0, 125.0, 207.0, 422.0, 1022.0, 7765.0, 185998.0, 827118.0, 22251.0, 1854.0, 560.0, 280.0, 151.0, 111.0, 65.0, 58.0, 42.0, 24.0, 16.0, 19.0, 20.0, 9.0, 17.0, 9.0, 8.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.8359375, -8.5614013671875, -8.286865234375, -8.0123291015625, -7.73779296875, -7.4632568359375, -7.188720703125, -6.9141845703125, -6.6396484375, -6.3651123046875, -6.090576171875, -5.8160400390625, -5.54150390625, -5.2669677734375, -4.992431640625, -4.7178955078125, -4.443359375, -4.1688232421875, -3.894287109375, -3.6197509765625, -3.34521484375, -3.0706787109375, -2.796142578125, -2.5216064453125, -2.2470703125, -1.9725341796875, -1.697998046875, -1.4234619140625, -1.14892578125, -0.8743896484375, -0.599853515625, -0.3253173828125, -0.05078125, 0.2237548828125, 0.498291015625, 0.7728271484375, 1.04736328125, 1.3218994140625, 1.596435546875, 1.8709716796875, 2.1455078125, 2.4200439453125, 2.694580078125, 2.9691162109375, 3.24365234375, 3.5181884765625, 3.792724609375, 4.0672607421875, 4.341796875, 4.6163330078125, 4.890869140625, 5.1654052734375, 5.43994140625, 5.7144775390625, 5.989013671875, 6.2635498046875, 6.5380859375, 6.8126220703125, 7.087158203125, 7.3616943359375, 7.63623046875, 7.9107666015625, 8.185302734375, 8.4598388671875, 8.734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 4.0, 6.0, 9.0, 18.0, 10.0, 13.0, 22.0, 20.0, 28.0, 39.0, 36.0, 36.0, 26.0, 47.0, 51.0, 48.0, 54.0, 55.0, 54.0, 52.0, 58.0, 49.0, 39.0, 32.0, 31.0, 20.0, 37.0, 11.0, 15.0, 10.0, 12.0, 20.0, 6.0, 14.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.43597412109375, -5.2508544921875, -5.06573486328125, -4.880615234375, -4.69549560546875, -4.5103759765625, -4.32525634765625, -4.14013671875, -3.95501708984375, -3.7698974609375, -3.58477783203125, -3.399658203125, -3.21453857421875, -3.0294189453125, -2.84429931640625, -2.6591796875, -2.47406005859375, -2.2889404296875, -2.10382080078125, -1.918701171875, -1.73358154296875, -1.5484619140625, -1.36334228515625, -1.17822265625, -0.99310302734375, -0.8079833984375, -0.62286376953125, -0.437744140625, -0.25262451171875, -0.0675048828125, 0.11761474609375, 0.302734375, 0.48785400390625, 0.6729736328125, 0.85809326171875, 1.043212890625, 1.22833251953125, 1.4134521484375, 1.59857177734375, 1.78369140625, 1.96881103515625, 2.1539306640625, 2.33905029296875, 2.524169921875, 2.70928955078125, 2.8944091796875, 3.07952880859375, 3.2646484375, 3.44976806640625, 3.6348876953125, 3.82000732421875, 4.005126953125, 4.19024658203125, 4.3753662109375, 4.56048583984375, 4.74560546875, 4.93072509765625, 5.1158447265625, 5.30096435546875, 5.486083984375, 5.67120361328125, 5.8563232421875, 6.04144287109375, 6.2265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 11.0, 27.0, 57.0, 183.0, 936.0, 10724.0, 1012677.0, 22071.0, 1412.0, 296.0, 75.0, 41.0, 18.0, 4.0, 6.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.74346923828125, -7.5572509765625, -7.37103271484375, -7.184814453125, -6.99859619140625, -6.8123779296875, -6.62615966796875, -6.43994140625, -6.25372314453125, -6.0675048828125, -5.88128662109375, -5.695068359375, -5.50885009765625, -5.3226318359375, -5.13641357421875, -4.9501953125, -4.76397705078125, -4.5777587890625, -4.39154052734375, -4.205322265625, -4.01910400390625, -3.8328857421875, -3.64666748046875, -3.46044921875, -3.27423095703125, -3.0880126953125, -2.90179443359375, -2.715576171875, -2.52935791015625, -2.3431396484375, -2.15692138671875, -1.970703125, -1.78448486328125, -1.5982666015625, -1.41204833984375, -1.225830078125, -1.03961181640625, -0.8533935546875, -0.66717529296875, -0.48095703125, -0.29473876953125, -0.1085205078125, 0.07769775390625, 0.263916015625, 0.45013427734375, 0.6363525390625, 0.82257080078125, 1.0087890625, 1.19500732421875, 1.3812255859375, 1.56744384765625, 1.753662109375, 1.93988037109375, 2.1260986328125, 2.31231689453125, 2.49853515625, 2.68475341796875, 2.8709716796875, 3.05718994140625, 3.243408203125, 3.42962646484375, 3.6158447265625, 3.80206298828125, 3.98828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 7.0, 6.0, 10.0, 12.0, 19.0, 19.0, 22.0, 32.0, 42.0, 46.0, 78.0, 114.0, 183.0, 108.0, 61.0, 47.0, 43.0, 30.0, 20.0, 24.0, 19.0, 9.0, 10.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.00019502639770507812, -0.00018935278058052063, -0.00018367916345596313, -0.00017800554633140564, -0.00017233192920684814, -0.00016665831208229065, -0.00016098469495773315, -0.00015531107783317566, -0.00014963746070861816, -0.00014396384358406067, -0.00013829022645950317, -0.00013261660933494568, -0.00012694299221038818, -0.00012126937508583069, -0.0001155957579612732, -0.0001099221408367157, -0.0001042485237121582, -9.857490658760071e-05, -9.290128946304321e-05, -8.722767233848572e-05, -8.155405521392822e-05, -7.588043808937073e-05, -7.020682096481323e-05, -6.453320384025574e-05, -5.885958671569824e-05, -5.318596959114075e-05, -4.751235246658325e-05, -4.183873534202576e-05, -3.616511821746826e-05, -3.0491501092910767e-05, -2.481788396835327e-05, -1.9144266843795776e-05, -1.3470649719238281e-05, -7.797032594680786e-06, -2.123415470123291e-06, 3.550201654434204e-06, 9.2238187789917e-06, 1.4897435903549194e-05, 2.057105302810669e-05, 2.6244670152664185e-05, 3.191828727722168e-05, 3.7591904401779175e-05, 4.326552152633667e-05, 4.8939138650894165e-05, 5.461275577545166e-05, 6.0286372900009155e-05, 6.595999002456665e-05, 7.163360714912415e-05, 7.730722427368164e-05, 8.298084139823914e-05, 8.865445852279663e-05, 9.432807564735413e-05, 0.00010000169277191162, 0.00010567530989646912, 0.00011134892702102661, 0.0001170225441455841, 0.0001226961612701416, 0.0001283697783946991, 0.0001340433955192566, 0.0001397170126438141, 0.00014539062976837158, 0.00015106424689292908, 0.00015673786401748657, 0.00016241148114204407, 0.00016808509826660156]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 11.0, 19.0, 29.0, 65.0, 122.0, 361.0, 1006.0, 5204.0, 659553.0, 376016.0, 4673.0, 951.0, 306.0, 129.0, 54.0, 27.0, 13.0, 4.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.45831298828125, -4.2642822265625, -4.07025146484375, -3.876220703125, -3.68218994140625, -3.4881591796875, -3.29412841796875, -3.10009765625, -2.90606689453125, -2.7120361328125, -2.51800537109375, -2.323974609375, -2.12994384765625, -1.9359130859375, -1.74188232421875, -1.5478515625, -1.35382080078125, -1.1597900390625, -0.96575927734375, -0.771728515625, -0.57769775390625, -0.3836669921875, -0.18963623046875, 0.00439453125, 0.19842529296875, 0.3924560546875, 0.58648681640625, 0.780517578125, 0.97454833984375, 1.1685791015625, 1.36260986328125, 1.556640625, 1.75067138671875, 1.9447021484375, 2.13873291015625, 2.332763671875, 2.52679443359375, 2.7208251953125, 2.91485595703125, 3.10888671875, 3.30291748046875, 3.4969482421875, 3.69097900390625, 3.885009765625, 4.07904052734375, 4.2730712890625, 4.46710205078125, 4.6611328125, 4.85516357421875, 5.0491943359375, 5.24322509765625, 5.437255859375, 5.63128662109375, 5.8253173828125, 6.01934814453125, 6.21337890625, 6.40740966796875, 6.6014404296875, 6.79547119140625, 6.989501953125, 7.18353271484375, 7.3775634765625, 7.57159423828125, 7.765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 15.0, 17.0, 24.0, 45.0, 85.0, 162.0, 321.0, 147.0, 66.0, 45.0, 22.0, 15.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.9306640625, -1.890777587890625, -1.85089111328125, -1.811004638671875, -1.7711181640625, -1.731231689453125, -1.69134521484375, -1.651458740234375, -1.611572265625, -1.571685791015625, -1.53179931640625, -1.491912841796875, -1.4520263671875, -1.412139892578125, -1.37225341796875, -1.332366943359375, -1.29248046875, -1.252593994140625, -1.21270751953125, -1.172821044921875, -1.1329345703125, -1.093048095703125, -1.05316162109375, -1.013275146484375, -0.973388671875, -0.933502197265625, -0.89361572265625, -0.853729248046875, -0.8138427734375, -0.773956298828125, -0.73406982421875, -0.694183349609375, -0.654296875, -0.614410400390625, -0.57452392578125, -0.534637451171875, -0.4947509765625, -0.454864501953125, -0.41497802734375, -0.375091552734375, -0.335205078125, -0.295318603515625, -0.25543212890625, -0.215545654296875, -0.1756591796875, -0.135772705078125, -0.09588623046875, -0.055999755859375, -0.01611328125, 0.023773193359375, 0.06365966796875, 0.103546142578125, 0.1434326171875, 0.183319091796875, 0.22320556640625, 0.263092041015625, 0.302978515625, 0.342864990234375, 0.38275146484375, 0.422637939453125, 0.4625244140625, 0.502410888671875, 0.54229736328125, 0.582183837890625, 0.6220703125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 7.0, 9.0, 13.0, 24.0, 49.0, 64.0, 102.0, 135.0, 131.0, 135.0, 110.0, 81.0, 57.0, 40.0, 22.0, 20.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.997753381729126, -3.6640477180480957, -3.3303420543670654, -2.996636390686035, -2.662930727005005, -2.3292250633239746, -1.9955193996429443, -1.661813735961914, -1.3281080722808838, -0.9944024085998535, -0.6606967449188232, -0.32699108123779297, 0.006714582443237305, 0.3404202461242676, 0.6741259098052979, 1.0078315734863281, 1.3415372371673584, 1.6752429008483887, 2.008948564529419, 2.342654228210449, 2.6763598918914795, 3.0100655555725098, 3.34377121925354, 3.6774768829345703, 4.01118278503418, 4.344888687133789, 4.67859411239624, 5.012299537658691, 5.346005439758301, 5.67971134185791, 6.013416767120361, 6.3471221923828125, 6.680828094482422, 7.014533996582031, 7.348239421844482, 7.681944847106934, 8.015650749206543, 8.349356651306152, 8.683061599731445, 9.016767501831055, 9.350473403930664, 9.684179306030273, 10.017885208129883, 10.351590156555176, 10.685296058654785, 11.019001960754395, 11.352706909179688, 11.686412811279297, 12.020118713378906, 12.353824615478516, 12.687530517578125, 13.021235466003418, 13.354941368103027, 13.688647270202637, 14.02235221862793, 14.356058120727539, 14.689764022827148, 15.023469924926758, 15.357175827026367, 15.69088077545166, 16.024585723876953, 16.358291625976562, 16.691997528076172, 17.02570343017578, 17.35940933227539]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 2.0, 3.0, 6.0, 11.0, 6.0, 10.0, 10.0, 13.0, 14.0, 21.0, 20.0, 27.0, 33.0, 38.0, 33.0, 25.0, 28.0, 53.0, 43.0, 31.0, 57.0, 37.0, 40.0, 50.0, 35.0, 30.0, 38.0, 44.0, 31.0, 25.0, 27.0, 28.0, 22.0, 23.0, 19.0, 13.0, 11.0, 10.0, 10.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-8.875509262084961, -8.623944282531738, -8.3723783493042, -8.120813369750977, -7.8692474365234375, -7.617681980133057, -7.366116523742676, -7.114551544189453, -6.862985610961914, -6.611420154571533, -6.359854698181152, -6.1082892417907715, -5.856723785400391, -5.60515832901001, -5.353592872619629, -5.102027893066406, -4.850462436676025, -4.5988969802856445, -4.347331523895264, -4.095766067504883, -3.844200611114502, -3.592635154724121, -3.3410699367523193, -3.0895044803619385, -2.8379390239715576, -2.5863735675811768, -2.334808111190796, -2.083242893218994, -1.8316773176193237, -1.5801118612289429, -1.3285465240478516, -1.0769810676574707, -0.8254156112670898, -0.573850154876709, -0.3222847580909729, -0.07071936130523682, 0.18084609508514404, 0.4324115514755249, 0.6839768886566162, 0.9355423450469971, 1.187107801437378, 1.4386732578277588, 1.6902387142181396, 1.941804051399231, 2.1933693885803223, 2.444934844970703, 2.696500301361084, 2.948065757751465, 3.1996312141418457, 3.4511966705322266, 3.7027621269226074, 3.9543275833129883, 4.205893039703369, 4.45745849609375, 4.709023475646973, 4.960589408874512, 5.212154388427734, 5.463719844818115, 5.715285301208496, 5.966850757598877, 6.218416213989258, 6.469981670379639, 6.7215471267700195, 6.973112106323242, 7.224678039550781]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 6.0, 9.0, 6.0, 12.0, 18.0, 16.0, 28.0, 21.0, 30.0, 35.0, 60.0, 67.0, 135.0, 218.0, 467.0, 1319.0, 7177.0, 92384.0, 2412709.0, 1621007.0, 51961.0, 4671.0, 990.0, 345.0, 157.0, 96.0, 67.0, 55.0, 40.0, 29.0, 27.0, 19.0, 21.0, 12.0, 10.0, 7.0, 10.0, 4.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.87109375, -7.60797119140625, -7.3448486328125, -7.08172607421875, -6.818603515625, -6.55548095703125, -6.2923583984375, -6.02923583984375, -5.76611328125, -5.50299072265625, -5.2398681640625, -4.97674560546875, -4.713623046875, -4.45050048828125, -4.1873779296875, -3.92425537109375, -3.6611328125, -3.39801025390625, -3.1348876953125, -2.87176513671875, -2.608642578125, -2.34552001953125, -2.0823974609375, -1.81927490234375, -1.55615234375, -1.29302978515625, -1.0299072265625, -0.76678466796875, -0.503662109375, -0.24053955078125, 0.0225830078125, 0.28570556640625, 0.548828125, 0.81195068359375, 1.0750732421875, 1.33819580078125, 1.601318359375, 1.86444091796875, 2.1275634765625, 2.39068603515625, 2.65380859375, 2.91693115234375, 3.1800537109375, 3.44317626953125, 3.706298828125, 3.96942138671875, 4.2325439453125, 4.49566650390625, 4.7587890625, 5.02191162109375, 5.2850341796875, 5.54815673828125, 5.811279296875, 6.07440185546875, 6.3375244140625, 6.60064697265625, 6.86376953125, 7.12689208984375, 7.3900146484375, 7.65313720703125, 7.916259765625, 8.17938232421875, 8.4425048828125, 8.70562744140625, 8.96875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 8.0, 4.0, 3.0, 4.0, 11.0, 10.0, 5.0, 20.0, 20.0, 16.0, 29.0, 26.0, 21.0, 33.0, 44.0, 42.0, 47.0, 48.0, 51.0, 40.0, 51.0, 48.0, 47.0, 38.0, 45.0, 38.0, 37.0, 31.0, 33.0, 22.0, 22.0, 23.0, 19.0, 21.0, 7.0, 12.0, 4.0, 7.0, 8.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.529296875, -2.434967041015625, -2.34063720703125, -2.246307373046875, -2.1519775390625, -2.057647705078125, -1.96331787109375, -1.868988037109375, -1.774658203125, -1.680328369140625, -1.58599853515625, -1.491668701171875, -1.3973388671875, -1.303009033203125, -1.20867919921875, -1.114349365234375, -1.02001953125, -0.925689697265625, -0.83135986328125, -0.737030029296875, -0.6427001953125, -0.548370361328125, -0.45404052734375, -0.359710693359375, -0.265380859375, -0.171051025390625, -0.07672119140625, 0.017608642578125, 0.1119384765625, 0.206268310546875, 0.30059814453125, 0.394927978515625, 0.4892578125, 0.583587646484375, 0.67791748046875, 0.772247314453125, 0.8665771484375, 0.960906982421875, 1.05523681640625, 1.149566650390625, 1.243896484375, 1.338226318359375, 1.43255615234375, 1.526885986328125, 1.6212158203125, 1.715545654296875, 1.80987548828125, 1.904205322265625, 1.99853515625, 2.092864990234375, 2.18719482421875, 2.281524658203125, 2.3758544921875, 2.470184326171875, 2.56451416015625, 2.658843994140625, 2.753173828125, 2.847503662109375, 2.94183349609375, 3.036163330078125, 3.1304931640625, 3.224822998046875, 3.31915283203125, 3.413482666015625, 3.5078125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 7.0, 6.0, 7.0, 11.0, 12.0, 23.0, 40.0, 58.0, 107.0, 176.0, 257.0, 480.0, 977.0, 2406.0, 11410.0, 190827.0, 3719948.0, 249572.0, 12932.0, 2740.0, 1075.0, 541.0, 237.0, 156.0, 95.0, 51.0, 40.0, 31.0, 18.0, 7.0, 5.0, 6.0, 0.0, 4.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-7.859375, -7.59326171875, -7.3271484375, -7.06103515625, -6.794921875, -6.52880859375, -6.2626953125, -5.99658203125, -5.73046875, -5.46435546875, -5.1982421875, -4.93212890625, -4.666015625, -4.39990234375, -4.1337890625, -3.86767578125, -3.6015625, -3.33544921875, -3.0693359375, -2.80322265625, -2.537109375, -2.27099609375, -2.0048828125, -1.73876953125, -1.47265625, -1.20654296875, -0.9404296875, -0.67431640625, -0.408203125, -0.14208984375, 0.1240234375, 0.39013671875, 0.65625, 0.92236328125, 1.1884765625, 1.45458984375, 1.720703125, 1.98681640625, 2.2529296875, 2.51904296875, 2.78515625, 3.05126953125, 3.3173828125, 3.58349609375, 3.849609375, 4.11572265625, 4.3818359375, 4.64794921875, 4.9140625, 5.18017578125, 5.4462890625, 5.71240234375, 5.978515625, 6.24462890625, 6.5107421875, 6.77685546875, 7.04296875, 7.30908203125, 7.5751953125, 7.84130859375, 8.107421875, 8.37353515625, 8.6396484375, 8.90576171875, 9.171875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 9.0, 8.0, 8.0, 15.0, 20.0, 39.0, 30.0, 53.0, 74.0, 88.0, 128.0, 214.0, 255.0, 330.0, 452.0, 458.0, 461.0, 405.0, 260.0, 188.0, 157.0, 106.0, 53.0, 58.0, 54.0, 43.0, 21.0, 19.0, 13.0, 9.0, 8.0, 6.0, 7.0, 4.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.5458984375, -1.502685546875, -1.45947265625, -1.416259765625, -1.373046875, -1.329833984375, -1.28662109375, -1.243408203125, -1.2001953125, -1.156982421875, -1.11376953125, -1.070556640625, -1.02734375, -0.984130859375, -0.94091796875, -0.897705078125, -0.8544921875, -0.811279296875, -0.76806640625, -0.724853515625, -0.681640625, -0.638427734375, -0.59521484375, -0.552001953125, -0.5087890625, -0.465576171875, -0.42236328125, -0.379150390625, -0.3359375, -0.292724609375, -0.24951171875, -0.206298828125, -0.1630859375, -0.119873046875, -0.07666015625, -0.033447265625, 0.009765625, 0.052978515625, 0.09619140625, 0.139404296875, 0.1826171875, 0.225830078125, 0.26904296875, 0.312255859375, 0.35546875, 0.398681640625, 0.44189453125, 0.485107421875, 0.5283203125, 0.571533203125, 0.61474609375, 0.657958984375, 0.701171875, 0.744384765625, 0.78759765625, 0.830810546875, 0.8740234375, 0.917236328125, 0.96044921875, 1.003662109375, 1.046875, 1.090087890625, 1.13330078125, 1.176513671875, 1.2197265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 15.0, 7.0, 15.0, 26.0, 50.0, 54.0, 55.0, 75.0, 78.0, 94.0, 97.0, 97.0, 66.0, 77.0, 63.0, 42.0, 32.0, 18.0, 11.0, 13.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.7051496505737305, -4.526846885681152, -4.348544597625732, -4.170241832733154, -3.9919395446777344, -3.8136370182037354, -3.6353344917297363, -3.457031726837158, -3.2787294387817383, -3.1004269123077393, -2.9221243858337402, -2.743821859359741, -2.565519332885742, -2.387216806411743, -2.208914279937744, -2.030611515045166, -1.852308988571167, -1.674006462097168, -1.495703935623169, -1.31740140914917, -1.139098882675171, -0.9607962965965271, -0.7824937105178833, -0.6041911840438843, -0.42588865756988525, -0.24758611619472504, -0.06928357481956482, 0.10901898145675659, 0.2873215079307556, 0.46562403440475464, 0.6439266204833984, 0.8222291469573975, 1.0005316734313965, 1.1788341999053955, 1.3571367263793945, 1.5354392528533936, 1.7137417793273926, 1.8920443058013916, 2.0703468322753906, 2.2486495971679688, 2.4269518852233887, 2.6052544116973877, 2.7835569381713867, 2.9618594646453857, 3.1401619911193848, 3.318464517593384, 3.496767044067383, 3.675069808959961, 3.85337233543396, 4.031674861907959, 4.209977626800537, 4.388279914855957, 4.566582679748535, 4.744884967803955, 4.923187732696533, 5.101490020751953, 5.279792785644531, 5.458095550537109, 5.636397838592529, 5.814700603485107, 5.993002891540527, 6.1713056564331055, 6.349607944488525, 6.5279107093811035, 6.706212997436523]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 11.0, 16.0, 9.0, 25.0, 19.0, 26.0, 24.0, 25.0, 26.0, 32.0, 33.0, 27.0, 37.0, 37.0, 40.0, 39.0, 41.0, 40.0, 44.0, 37.0, 34.0, 43.0, 45.0, 36.0, 27.0, 21.0, 30.0, 23.0, 24.0, 12.0, 21.0, 12.0, 12.0, 11.0, 8.0, 2.0, 8.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0967464447021484, -2.997384548187256, -2.8980228900909424, -2.79866099357605, -2.6992990970611572, -2.5999374389648438, -2.500575542449951, -2.4012136459350586, -2.301851749420166, -2.2024898529052734, -2.10312819480896, -2.0037662982940674, -1.9044044017791748, -1.8050426244735718, -1.7056808471679688, -1.6063189506530762, -1.5069572925567627, -1.4075955152511597, -1.308233618736267, -1.208871841430664, -1.1095099449157715, -1.0101481676101685, -0.9107863903045654, -0.8114245533943176, -0.7120627164840698, -0.612700879573822, -0.5133390426635742, -0.4139772653579712, -0.3146154284477234, -0.21525359153747559, -0.11589181423187256, -0.016529977321624756, 0.08283185958862305, 0.18219368159770966, 0.28155550360679626, 0.3809173107147217, 0.4802791476249695, 0.5796409845352173, 0.6790027618408203, 0.7783645987510681, 0.8777264356613159, 0.9770882725715637, 1.0764501094818115, 1.1758118867874146, 1.2751736640930176, 1.3745355606079102, 1.4738973379135132, 1.5732591152191162, 1.6726210117340088, 1.7719827890396118, 1.8713446855545044, 1.9707064628601074, 2.070068359375, 2.1694302558898926, 2.268791913986206, 2.3681538105010986, 2.467515468597412, 2.5668773651123047, 2.666239023208618, 2.7656009197235107, 2.8649628162384033, 2.964324474334717, 3.0636863708496094, 3.163048267364502, 3.2624101638793945]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 4.0, 14.0, 15.0, 35.0, 46.0, 87.0, 158.0, 289.0, 616.0, 1423.0, 4742.0, 36626.0, 618216.0, 361482.0, 19343.0, 3281.0, 1116.0, 499.0, 252.0, 123.0, 77.0, 43.0, 20.0, 25.0, 8.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6953125, -1.6385650634765625, -1.581817626953125, -1.5250701904296875, -1.46832275390625, -1.4115753173828125, -1.354827880859375, -1.2980804443359375, -1.2413330078125, -1.1845855712890625, -1.127838134765625, -1.0710906982421875, -1.01434326171875, -0.9575958251953125, -0.900848388671875, -0.8441009521484375, -0.787353515625, -0.7306060791015625, -0.673858642578125, -0.6171112060546875, -0.56036376953125, -0.5036163330078125, -0.446868896484375, -0.3901214599609375, -0.3333740234375, -0.2766265869140625, -0.219879150390625, -0.1631317138671875, -0.10638427734375, -0.0496368408203125, 0.007110595703125, 0.0638580322265625, 0.12060546875, 0.1773529052734375, 0.234100341796875, 0.2908477783203125, 0.34759521484375, 0.4043426513671875, 0.461090087890625, 0.5178375244140625, 0.5745849609375, 0.6313323974609375, 0.688079833984375, 0.7448272705078125, 0.80157470703125, 0.8583221435546875, 0.915069580078125, 0.9718170166015625, 1.028564453125, 1.0853118896484375, 1.142059326171875, 1.1988067626953125, 1.25555419921875, 1.3123016357421875, 1.369049072265625, 1.4257965087890625, 1.4825439453125, 1.5392913818359375, 1.596038818359375, 1.6527862548828125, 1.70953369140625, 1.7662811279296875, 1.823028564453125, 1.8797760009765625, 1.9365234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 8.0, 15.0, 21.0, 19.0, 41.0, 36.0, 51.0, 63.0, 73.0, 65.0, 78.0, 71.0, 81.0, 63.0, 61.0, 53.0, 50.0, 40.0, 36.0, 20.0, 20.0, 9.0, 8.0, 6.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-5.84765625, -5.71630859375, -5.5849609375, -5.45361328125, -5.322265625, -5.19091796875, -5.0595703125, -4.92822265625, -4.796875, -4.66552734375, -4.5341796875, -4.40283203125, -4.271484375, -4.14013671875, -4.0087890625, -3.87744140625, -3.74609375, -3.61474609375, -3.4833984375, -3.35205078125, -3.220703125, -3.08935546875, -2.9580078125, -2.82666015625, -2.6953125, -2.56396484375, -2.4326171875, -2.30126953125, -2.169921875, -2.03857421875, -1.9072265625, -1.77587890625, -1.64453125, -1.51318359375, -1.3818359375, -1.25048828125, -1.119140625, -0.98779296875, -0.8564453125, -0.72509765625, -0.59375, -0.46240234375, -0.3310546875, -0.19970703125, -0.068359375, 0.06298828125, 0.1943359375, 0.32568359375, 0.45703125, 0.58837890625, 0.7197265625, 0.85107421875, 0.982421875, 1.11376953125, 1.2451171875, 1.37646484375, 1.5078125, 1.63916015625, 1.7705078125, 1.90185546875, 2.033203125, 2.16455078125, 2.2958984375, 2.42724609375, 2.55859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 13.0, 22.0, 39.0, 49.0, 106.0, 200.0, 362.0, 709.0, 1392.0, 2918.0, 5901.0, 12410.0, 26480.0, 55651.0, 112522.0, 197452.0, 244623.0, 186249.0, 103633.0, 51277.0, 24084.0, 11512.0, 5481.0, 2728.0, 1291.0, 680.0, 346.0, 162.0, 98.0, 58.0, 29.0, 15.0, 16.0, 11.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.353759765625, -0.3434867858886719, -0.33321380615234375, -0.3229408264160156, -0.3126678466796875, -0.3023948669433594, -0.29212188720703125, -0.2818489074707031, -0.271575927734375, -0.2613029479980469, -0.25102996826171875, -0.24075698852539062, -0.2304840087890625, -0.22021102905273438, -0.20993804931640625, -0.19966506958007812, -0.18939208984375, -0.17911911010742188, -0.16884613037109375, -0.15857315063476562, -0.1483001708984375, -0.13802719116210938, -0.12775421142578125, -0.11748123168945312, -0.107208251953125, -0.09693527221679688, -0.08666229248046875, -0.07638931274414062, -0.0661163330078125, -0.055843353271484375, -0.04557037353515625, -0.035297393798828125, -0.0250244140625, -0.014751434326171875, -0.00447845458984375, 0.005794525146484375, 0.0160675048828125, 0.026340484619140625, 0.03661346435546875, 0.046886444091796875, 0.057159423828125, 0.06743240356445312, 0.07770538330078125, 0.08797836303710938, 0.0982513427734375, 0.10852432250976562, 0.11879730224609375, 0.12907028198242188, 0.13934326171875, 0.14961624145507812, 0.15988922119140625, 0.17016220092773438, 0.1804351806640625, 0.19070816040039062, 0.20098114013671875, 0.21125411987304688, 0.221527099609375, 0.23180007934570312, 0.24207305908203125, 0.2523460388183594, 0.2626190185546875, 0.2728919982910156, 0.28316497802734375, 0.2934379577636719, 0.3037109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 5.0, 8.0, 14.0, 7.0, 16.0, 9.0, 18.0, 27.0, 29.0, 31.0, 43.0, 55.0, 51.0, 41.0, 57.0, 53.0, 67.0, 64.0, 46.0, 61.0, 45.0, 39.0, 32.0, 27.0, 24.0, 24.0, 26.0, 12.0, 13.0, 16.0, 7.0, 5.0, 6.0, 3.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.48046875, -5.27703857421875, -5.0736083984375, -4.87017822265625, -4.666748046875, -4.46331787109375, -4.2598876953125, -4.05645751953125, -3.85302734375, -3.64959716796875, -3.4461669921875, -3.24273681640625, -3.039306640625, -2.83587646484375, -2.6324462890625, -2.42901611328125, -2.2255859375, -2.02215576171875, -1.8187255859375, -1.61529541015625, -1.411865234375, -1.20843505859375, -1.0050048828125, -0.80157470703125, -0.59814453125, -0.39471435546875, -0.1912841796875, 0.01214599609375, 0.215576171875, 0.41900634765625, 0.6224365234375, 0.82586669921875, 1.029296875, 1.23272705078125, 1.4361572265625, 1.63958740234375, 1.843017578125, 2.04644775390625, 2.2498779296875, 2.45330810546875, 2.65673828125, 2.86016845703125, 3.0635986328125, 3.26702880859375, 3.470458984375, 3.67388916015625, 3.8773193359375, 4.08074951171875, 4.2841796875, 4.48760986328125, 4.6910400390625, 4.89447021484375, 5.097900390625, 5.30133056640625, 5.5047607421875, 5.70819091796875, 5.91162109375, 6.11505126953125, 6.3184814453125, 6.52191162109375, 6.725341796875, 6.92877197265625, 7.1322021484375, 7.33563232421875, 7.5390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 10.0, 9.0, 11.0, 15.0, 24.0, 54.0, 58.0, 80.0, 142.0, 231.0, 408.0, 774.0, 1507.0, 3885.0, 11961.0, 47680.0, 255663.0, 543082.0, 141291.0, 28604.0, 7739.0, 2671.0, 1196.0, 554.0, 316.0, 198.0, 127.0, 74.0, 53.0, 46.0, 20.0, 27.0, 19.0, 15.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.100830078125, -0.09789276123046875, -0.0949554443359375, -0.09201812744140625, -0.089080810546875, -0.08614349365234375, -0.0832061767578125, -0.08026885986328125, -0.07733154296875, -0.07439422607421875, -0.0714569091796875, -0.06851959228515625, -0.065582275390625, -0.06264495849609375, -0.0597076416015625, -0.05677032470703125, -0.0538330078125, -0.05089569091796875, -0.0479583740234375, -0.04502105712890625, -0.042083740234375, -0.03914642333984375, -0.0362091064453125, -0.03327178955078125, -0.03033447265625, -0.02739715576171875, -0.0244598388671875, -0.02152252197265625, -0.018585205078125, -0.01564788818359375, -0.0127105712890625, -0.00977325439453125, -0.0068359375, -0.00389862060546875, -0.0009613037109375, 0.00197601318359375, 0.004913330078125, 0.00785064697265625, 0.0107879638671875, 0.01372528076171875, 0.01666259765625, 0.01959991455078125, 0.0225372314453125, 0.02547454833984375, 0.028411865234375, 0.03134918212890625, 0.0342864990234375, 0.03722381591796875, 0.0401611328125, 0.04309844970703125, 0.0460357666015625, 0.04897308349609375, 0.051910400390625, 0.05484771728515625, 0.0577850341796875, 0.06072235107421875, 0.06365966796875, 0.06659698486328125, 0.0695343017578125, 0.07247161865234375, 0.075408935546875, 0.07834625244140625, 0.0812835693359375, 0.08422088623046875, 0.087158203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 15.0, 25.0, 46.0, 46.0, 68.0, 76.0, 85.0, 101.0, 103.0, 97.0, 66.0, 58.0, 61.0, 35.0, 35.0, 18.0, 13.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.577108383178711e-05, -8.361786603927612e-05, -8.146464824676514e-05, -7.931143045425415e-05, -7.715821266174316e-05, -7.500499486923218e-05, -7.285177707672119e-05, -7.06985592842102e-05, -6.854534149169922e-05, -6.639212369918823e-05, -6.423890590667725e-05, -6.208568811416626e-05, -5.9932470321655273e-05, -5.777925252914429e-05, -5.56260347366333e-05, -5.3472816944122314e-05, -5.131959915161133e-05, -4.916638135910034e-05, -4.7013163566589355e-05, -4.485994577407837e-05, -4.270672798156738e-05, -4.0553510189056396e-05, -3.840029239654541e-05, -3.6247074604034424e-05, -3.409385681152344e-05, -3.194063901901245e-05, -2.9787421226501465e-05, -2.763420343399048e-05, -2.5480985641479492e-05, -2.3327767848968506e-05, -2.117455005645752e-05, -1.9021332263946533e-05, -1.6868114471435547e-05, -1.471489667892456e-05, -1.2561678886413574e-05, -1.0408461093902588e-05, -8.255243301391602e-06, -6.102025508880615e-06, -3.948807716369629e-06, -1.7955899238586426e-06, 3.5762786865234375e-07, 2.51084566116333e-06, 4.664063453674316e-06, 6.817281246185303e-06, 8.970499038696289e-06, 1.1123716831207275e-05, 1.3276934623718262e-05, 1.5430152416229248e-05, 1.7583370208740234e-05, 1.973658800125122e-05, 2.1889805793762207e-05, 2.4043023586273193e-05, 2.619624137878418e-05, 2.8349459171295166e-05, 3.0502676963806152e-05, 3.265589475631714e-05, 3.4809112548828125e-05, 3.696233034133911e-05, 3.91155481338501e-05, 4.1268765926361084e-05, 4.342198371887207e-05, 4.557520151138306e-05, 4.772841930389404e-05, 4.988163709640503e-05, 5.2034854888916016e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 11.0, 6.0, 18.0, 24.0, 29.0, 33.0, 48.0, 63.0, 90.0, 143.0, 205.0, 415.0, 772.0, 1549.0, 3726.0, 10181.0, 35577.0, 193051.0, 619493.0, 139974.0, 28240.0, 8605.0, 3258.0, 1359.0, 681.0, 358.0, 205.0, 127.0, 87.0, 59.0, 45.0, 19.0, 23.0, 6.0, 14.0, 12.0, 15.0, 5.0, 5.0, 5.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1195068359375, -0.1162252426147461, -0.11294364929199219, -0.10966205596923828, -0.10638046264648438, -0.10309886932373047, -0.09981727600097656, -0.09653568267822266, -0.09325408935546875, -0.08997249603271484, -0.08669090270996094, -0.08340930938720703, -0.08012771606445312, -0.07684612274169922, -0.07356452941894531, -0.0702829360961914, -0.0670013427734375, -0.0637197494506836, -0.06043815612792969, -0.05715656280517578, -0.053874969482421875, -0.05059337615966797, -0.04731178283691406, -0.044030189514160156, -0.04074859619140625, -0.037467002868652344, -0.03418540954589844, -0.03090381622314453, -0.027622222900390625, -0.02434062957763672, -0.021059036254882812, -0.017777442932128906, -0.014495849609375, -0.011214256286621094, -0.007932662963867188, -0.004651069641113281, -0.001369476318359375, 0.0019121170043945312, 0.0051937103271484375, 0.008475303649902344, 0.01175689697265625, 0.015038490295410156, 0.018320083618164062, 0.02160167694091797, 0.024883270263671875, 0.02816486358642578, 0.03144645690917969, 0.034728050231933594, 0.0380096435546875, 0.041291236877441406, 0.04457283020019531, 0.04785442352294922, 0.051136016845703125, 0.05441761016845703, 0.05769920349121094, 0.060980796813964844, 0.06426239013671875, 0.06754398345947266, 0.07082557678222656, 0.07410717010498047, 0.07738876342773438, 0.08067035675048828, 0.08395195007324219, 0.0872335433959961, 0.09051513671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 2.0, 6.0, 6.0, 7.0, 7.0, 9.0, 7.0, 15.0, 14.0, 13.0, 26.0, 27.0, 33.0, 56.0, 60.0, 72.0, 85.0, 109.0, 87.0, 72.0, 40.0, 55.0, 33.0, 29.0, 26.0, 16.0, 17.0, 7.0, 8.0, 6.0, 7.0, 6.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.026611328125, -0.025833845138549805, -0.02505636215209961, -0.024278879165649414, -0.02350139617919922, -0.022723913192749023, -0.021946430206298828, -0.021168947219848633, -0.020391464233398438, -0.019613981246948242, -0.018836498260498047, -0.01805901527404785, -0.017281532287597656, -0.01650404930114746, -0.015726566314697266, -0.01494908332824707, -0.014171600341796875, -0.01339411735534668, -0.012616634368896484, -0.011839151382446289, -0.011061668395996094, -0.010284185409545898, -0.009506702423095703, -0.008729219436645508, -0.007951736450195312, -0.007174253463745117, -0.006396770477294922, -0.0056192874908447266, -0.004841804504394531, -0.004064321517944336, -0.0032868385314941406, -0.0025093555450439453, -0.00173187255859375, -0.0009543895721435547, -0.00017690658569335938, 0.0006005764007568359, 0.0013780593872070312, 0.0021555423736572266, 0.002933025360107422, 0.003710508346557617, 0.0044879913330078125, 0.005265474319458008, 0.006042957305908203, 0.0068204402923583984, 0.007597923278808594, 0.008375406265258789, 0.009152889251708984, 0.00993037223815918, 0.010707855224609375, 0.01148533821105957, 0.012262821197509766, 0.013040304183959961, 0.013817787170410156, 0.014595270156860352, 0.015372753143310547, 0.016150236129760742, 0.016927719116210938, 0.017705202102661133, 0.018482685089111328, 0.019260168075561523, 0.02003765106201172, 0.020815134048461914, 0.02159261703491211, 0.022370100021362305, 0.0231475830078125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 8.0, 16.0, 43.0, 82.0, 95.0, 146.0, 147.0, 153.0, 135.0, 80.0, 50.0, 24.0, 13.0, 10.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.818401575088501, -3.6155362129211426, -3.4126710891723633, -3.209805727005005, -3.0069403648376465, -2.804075002670288, -2.6012096405029297, -2.3983445167541504, -2.195479154586792, -1.9926137924194336, -1.7897485494613647, -1.586883306503296, -1.3840179443359375, -1.181152582168579, -0.9782873392105103, -0.7754220962524414, -0.572556734085083, -0.3696914315223694, -0.16682612895965576, 0.03603917360305786, 0.23890447616577148, 0.4417698383331299, 0.6446350812911987, 0.8475003242492676, 1.050365686416626, 1.2532310485839844, 1.4560962915420532, 1.658961534500122, 1.8618268966674805, 2.064692258834839, 2.2675576210021973, 2.4704227447509766, 2.673288345336914, 2.8761537075042725, 3.079019069671631, 3.28188419342041, 3.4847495555877686, 3.687614917755127, 3.8904800415039062, 4.093345642089844, 4.296210765838623, 4.499075889587402, 4.70194149017334, 4.904806613922119, 5.107671737670898, 5.310537338256836, 5.513402462005615, 5.7162675857543945, 5.919133186340332, 6.121998310089111, 6.324863910675049, 6.527729034423828, 6.730594635009766, 6.933459758758545, 7.136324882507324, 7.339190483093262, 7.542055606842041, 7.74492073059082, 7.947786331176758, 8.150651931762695, 8.353516578674316, 8.556382179260254, 8.759247779846191, 8.962112426757812, 9.16497802734375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 5.0, 11.0, 25.0, 30.0, 29.0, 40.0, 44.0, 47.0, 47.0, 53.0, 71.0, 59.0, 66.0, 66.0, 57.0, 67.0, 58.0, 35.0, 44.0, 33.0, 24.0, 20.0, 20.0, 8.0, 12.0, 4.0, 6.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.6918487548828125, -4.581019401550293, -4.470190525054932, -4.359361171722412, -4.248531818389893, -4.137702941894531, -4.026873588562012, -3.9160444736480713, -3.805215358734131, -3.6943862438201904, -3.583556890487671, -3.4727277755737305, -3.36189866065979, -3.2510695457458496, -3.14024019241333, -3.0294110774993896, -2.91858172416687, -2.8077526092529297, -2.69692325592041, -2.5860941410064697, -2.4752650260925293, -2.3644356727600098, -2.2536065578460693, -2.142777442932129, -2.0319480895996094, -1.9211188554763794, -1.810289740562439, -1.699460506439209, -1.5886313915252686, -1.4778021574020386, -1.3669729232788086, -1.2561438083648682, -1.1453146934509277, -1.0344854593276978, -0.9236563444137573, -0.8128271102905273, -0.7019979357719421, -0.5911687612533569, -0.48033952713012695, -0.36951035261154175, -0.25868117809295654, -0.14785198867321014, -0.037022799253463745, 0.07380640506744385, 0.18463557958602905, 0.29546475410461426, 0.40629398822784424, 0.5171231627464294, 0.6279523372650146, 0.7387815117835999, 0.8496106863021851, 0.960439920425415, 1.0712690353393555, 1.1820982694625854, 1.2929275035858154, 1.4037566184997559, 1.5145858526229858, 1.6254150867462158, 1.7362442016601562, 1.8470734357833862, 1.9579026699066162, 2.0687317848205566, 2.179561138153076, 2.2903902530670166, 2.401219367980957]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 0.0, 4.0, 6.0, 6.0, 10.0, 10.0, 15.0, 22.0, 19.0, 57.0, 61.0, 95.0, 139.0, 218.0, 430.0, 811.0, 2073.0, 5814.0, 20848.0, 83657.0, 511142.0, 335240.0, 63293.0, 16319.0, 4849.0, 1750.0, 693.0, 387.0, 182.0, 124.0, 83.0, 51.0, 58.0, 29.0, 18.0, 10.0, 8.0, 13.0, 3.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.921875, -4.78851318359375, -4.6551513671875, -4.52178955078125, -4.388427734375, -4.25506591796875, -4.1217041015625, -3.98834228515625, -3.85498046875, -3.72161865234375, -3.5882568359375, -3.45489501953125, -3.321533203125, -3.18817138671875, -3.0548095703125, -2.92144775390625, -2.7880859375, -2.65472412109375, -2.5213623046875, -2.38800048828125, -2.254638671875, -2.12127685546875, -1.9879150390625, -1.85455322265625, -1.72119140625, -1.58782958984375, -1.4544677734375, -1.32110595703125, -1.187744140625, -1.05438232421875, -0.9210205078125, -0.78765869140625, -0.654296875, -0.52093505859375, -0.3875732421875, -0.25421142578125, -0.120849609375, 0.01251220703125, 0.1458740234375, 0.27923583984375, 0.41259765625, 0.54595947265625, 0.6793212890625, 0.81268310546875, 0.946044921875, 1.07940673828125, 1.2127685546875, 1.34613037109375, 1.4794921875, 1.61285400390625, 1.7462158203125, 1.87957763671875, 2.012939453125, 2.14630126953125, 2.2796630859375, 2.41302490234375, 2.54638671875, 2.67974853515625, 2.8131103515625, 2.94647216796875, 3.079833984375, 3.21319580078125, 3.3465576171875, 3.47991943359375, 3.61328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 11.0, 8.0, 19.0, 17.0, 20.0, 27.0, 23.0, 32.0, 34.0, 50.0, 46.0, 41.0, 56.0, 49.0, 51.0, 50.0, 59.0, 58.0, 50.0, 40.0, 38.0, 37.0, 37.0, 26.0, 27.0, 21.0, 15.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.76171875, -5.60162353515625, -5.4415283203125, -5.28143310546875, -5.121337890625, -4.96124267578125, -4.8011474609375, -4.64105224609375, -4.48095703125, -4.32086181640625, -4.1607666015625, -4.00067138671875, -3.840576171875, -3.68048095703125, -3.5203857421875, -3.36029052734375, -3.2001953125, -3.04010009765625, -2.8800048828125, -2.71990966796875, -2.559814453125, -2.39971923828125, -2.2396240234375, -2.07952880859375, -1.91943359375, -1.75933837890625, -1.5992431640625, -1.43914794921875, -1.279052734375, -1.11895751953125, -0.9588623046875, -0.79876708984375, -0.638671875, -0.47857666015625, -0.3184814453125, -0.15838623046875, 0.001708984375, 0.16180419921875, 0.3218994140625, 0.48199462890625, 0.64208984375, 0.80218505859375, 0.9622802734375, 1.12237548828125, 1.282470703125, 1.44256591796875, 1.6026611328125, 1.76275634765625, 1.9228515625, 2.08294677734375, 2.2430419921875, 2.40313720703125, 2.563232421875, 2.72332763671875, 2.8834228515625, 3.04351806640625, 3.20361328125, 3.36370849609375, 3.5238037109375, 3.68389892578125, 3.843994140625, 4.00408935546875, 4.1641845703125, 4.32427978515625, 4.484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 4.0, 9.0, 10.0, 5.0, 14.0, 12.0, 18.0, 25.0, 27.0, 40.0, 56.0, 72.0, 83.0, 111.0, 207.0, 301.0, 755.0, 3520.0, 37107.0, 783240.0, 208058.0, 12109.0, 1545.0, 430.0, 211.0, 142.0, 102.0, 60.0, 65.0, 45.0, 37.0, 28.0, 22.0, 21.0, 9.0, 15.0, 7.0, 7.0, 6.0, 8.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.890625, -9.62176513671875, -9.3529052734375, -9.08404541015625, -8.815185546875, -8.54632568359375, -8.2774658203125, -8.00860595703125, -7.73974609375, -7.47088623046875, -7.2020263671875, -6.93316650390625, -6.664306640625, -6.39544677734375, -6.1265869140625, -5.85772705078125, -5.5888671875, -5.32000732421875, -5.0511474609375, -4.78228759765625, -4.513427734375, -4.24456787109375, -3.9757080078125, -3.70684814453125, -3.43798828125, -3.16912841796875, -2.9002685546875, -2.63140869140625, -2.362548828125, -2.09368896484375, -1.8248291015625, -1.55596923828125, -1.287109375, -1.01824951171875, -0.7493896484375, -0.48052978515625, -0.211669921875, 0.05718994140625, 0.3260498046875, 0.59490966796875, 0.86376953125, 1.13262939453125, 1.4014892578125, 1.67034912109375, 1.939208984375, 2.20806884765625, 2.4769287109375, 2.74578857421875, 3.0146484375, 3.28350830078125, 3.5523681640625, 3.82122802734375, 4.090087890625, 4.35894775390625, 4.6278076171875, 4.89666748046875, 5.16552734375, 5.43438720703125, 5.7032470703125, 5.97210693359375, 6.240966796875, 6.50982666015625, 6.7786865234375, 7.04754638671875, 7.31640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 1.0, 4.0, 8.0, 6.0, 12.0, 23.0, 22.0, 13.0, 22.0, 36.0, 21.0, 25.0, 31.0, 33.0, 35.0, 43.0, 54.0, 41.0, 52.0, 51.0, 41.0, 48.0, 36.0, 47.0, 42.0, 24.0, 47.0, 33.0, 16.0, 25.0, 19.0, 12.0, 9.0, 12.0, 8.0, 8.0, 3.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0], "bins": [-5.7109375, -5.555908203125, -5.40087890625, -5.245849609375, -5.0908203125, -4.935791015625, -4.78076171875, -4.625732421875, -4.470703125, -4.315673828125, -4.16064453125, -4.005615234375, -3.8505859375, -3.695556640625, -3.54052734375, -3.385498046875, -3.23046875, -3.075439453125, -2.92041015625, -2.765380859375, -2.6103515625, -2.455322265625, -2.30029296875, -2.145263671875, -1.990234375, -1.835205078125, -1.68017578125, -1.525146484375, -1.3701171875, -1.215087890625, -1.06005859375, -0.905029296875, -0.75, -0.594970703125, -0.43994140625, -0.284912109375, -0.1298828125, 0.025146484375, 0.18017578125, 0.335205078125, 0.490234375, 0.645263671875, 0.80029296875, 0.955322265625, 1.1103515625, 1.265380859375, 1.42041015625, 1.575439453125, 1.73046875, 1.885498046875, 2.04052734375, 2.195556640625, 2.3505859375, 2.505615234375, 2.66064453125, 2.815673828125, 2.970703125, 3.125732421875, 3.28076171875, 3.435791015625, 3.5908203125, 3.745849609375, 3.90087890625, 4.055908203125, 4.2109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 12.0, 8.0, 12.0, 20.0, 41.0, 45.0, 78.0, 155.0, 353.0, 1078.0, 6333.0, 119976.0, 862275.0, 53103.0, 3570.0, 816.0, 267.0, 137.0, 91.0, 51.0, 38.0, 22.0, 14.0, 11.0, 6.0, 5.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.248046875, -2.174041748046875, -2.10003662109375, -2.026031494140625, -1.9520263671875, -1.878021240234375, -1.80401611328125, -1.730010986328125, -1.656005859375, -1.582000732421875, -1.50799560546875, -1.433990478515625, -1.3599853515625, -1.285980224609375, -1.21197509765625, -1.137969970703125, -1.06396484375, -0.989959716796875, -0.91595458984375, -0.841949462890625, -0.7679443359375, -0.693939208984375, -0.61993408203125, -0.545928955078125, -0.471923828125, -0.397918701171875, -0.32391357421875, -0.249908447265625, -0.1759033203125, -0.101898193359375, -0.02789306640625, 0.046112060546875, 0.1201171875, 0.194122314453125, 0.26812744140625, 0.342132568359375, 0.4161376953125, 0.490142822265625, 0.56414794921875, 0.638153076171875, 0.712158203125, 0.786163330078125, 0.86016845703125, 0.934173583984375, 1.0081787109375, 1.082183837890625, 1.15618896484375, 1.230194091796875, 1.30419921875, 1.378204345703125, 1.45220947265625, 1.526214599609375, 1.6002197265625, 1.674224853515625, 1.74822998046875, 1.822235107421875, 1.896240234375, 1.970245361328125, 2.04425048828125, 2.118255615234375, 2.1922607421875, 2.266265869140625, 2.34027099609375, 2.414276123046875, 2.48828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 9.0, 7.0, 8.0, 23.0, 24.0, 47.0, 28.0, 57.0, 73.0, 105.0, 118.0, 135.0, 86.0, 66.0, 51.0, 32.0, 28.0, 19.0, 24.0, 16.0, 6.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018906593322753906, -0.0001824982464313507, -0.00017593055963516235, -0.000169362872838974, -0.00016279518604278564, -0.0001562274992465973, -0.00014965981245040894, -0.00014309212565422058, -0.00013652443885803223, -0.00012995675206184387, -0.00012338906526565552, -0.00011682137846946716, -0.00011025369167327881, -0.00010368600487709045, -9.71183180809021e-05, -9.055063128471375e-05, -8.398294448852539e-05, -7.741525769233704e-05, -7.084757089614868e-05, -6.427988409996033e-05, -5.771219730377197e-05, -5.114451050758362e-05, -4.4576823711395264e-05, -3.800913691520691e-05, -3.1441450119018555e-05, -2.48737633228302e-05, -1.8306076526641846e-05, -1.1738389730453491e-05, -5.170702934265137e-06, 1.3969838619232178e-06, 7.964670658111572e-06, 1.4532357454299927e-05, 2.110004425048828e-05, 2.7667731046676636e-05, 3.423541784286499e-05, 4.0803104639053345e-05, 4.73707914352417e-05, 5.3938478231430054e-05, 6.050616502761841e-05, 6.707385182380676e-05, 7.364153861999512e-05, 8.020922541618347e-05, 8.677691221237183e-05, 9.334459900856018e-05, 9.991228580474854e-05, 0.00010647997260093689, 0.00011304765939712524, 0.0001196153461933136, 0.00012618303298950195, 0.0001327507197856903, 0.00013931840658187866, 0.00014588609337806702, 0.00015245378017425537, 0.00015902146697044373, 0.00016558915376663208, 0.00017215684056282043, 0.0001787245273590088, 0.00018529221415519714, 0.0001918599009513855, 0.00019842758774757385, 0.0002049952745437622, 0.00021156296133995056, 0.00021813064813613892, 0.00022469833493232727, 0.00023126602172851562]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 9.0, 19.0, 40.0, 74.0, 185.0, 471.0, 1204.0, 4989.0, 199320.0, 828090.0, 11412.0, 1695.0, 583.0, 237.0, 100.0, 51.0, 25.0, 17.0, 6.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6484375, -3.5313720703125, -3.414306640625, -3.2972412109375, -3.18017578125, -3.0631103515625, -2.946044921875, -2.8289794921875, -2.7119140625, -2.5948486328125, -2.477783203125, -2.3607177734375, -2.24365234375, -2.1265869140625, -2.009521484375, -1.8924560546875, -1.775390625, -1.6583251953125, -1.541259765625, -1.4241943359375, -1.30712890625, -1.1900634765625, -1.072998046875, -0.9559326171875, -0.8388671875, -0.7218017578125, -0.604736328125, -0.4876708984375, -0.37060546875, -0.2535400390625, -0.136474609375, -0.0194091796875, 0.09765625, 0.2147216796875, 0.331787109375, 0.4488525390625, 0.56591796875, 0.6829833984375, 0.800048828125, 0.9171142578125, 1.0341796875, 1.1512451171875, 1.268310546875, 1.3853759765625, 1.50244140625, 1.6195068359375, 1.736572265625, 1.8536376953125, 1.970703125, 2.0877685546875, 2.204833984375, 2.3218994140625, 2.43896484375, 2.5560302734375, 2.673095703125, 2.7901611328125, 2.9072265625, 3.0242919921875, 3.141357421875, 3.2584228515625, 3.37548828125, 3.4925537109375, 3.609619140625, 3.7266845703125, 3.84375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 20.0, 19.0, 48.0, 68.0, 104.0, 199.0, 229.0, 122.0, 71.0, 31.0, 24.0, 22.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2599945068359375, -1.226043701171875, -1.1920928955078125, -1.15814208984375, -1.1241912841796875, -1.090240478515625, -1.0562896728515625, -1.0223388671875, -0.9883880615234375, -0.954437255859375, -0.9204864501953125, -0.88653564453125, -0.8525848388671875, -0.818634033203125, -0.7846832275390625, -0.750732421875, -0.7167816162109375, -0.682830810546875, -0.6488800048828125, -0.61492919921875, -0.5809783935546875, -0.547027587890625, -0.5130767822265625, -0.4791259765625, -0.4451751708984375, -0.411224365234375, -0.3772735595703125, -0.34332275390625, -0.3093719482421875, -0.275421142578125, -0.2414703369140625, -0.20751953125, -0.1735687255859375, -0.139617919921875, -0.1056671142578125, -0.07171630859375, -0.0377655029296875, -0.003814697265625, 0.0301361083984375, 0.0640869140625, 0.0980377197265625, 0.131988525390625, 0.1659393310546875, 0.19989013671875, 0.2338409423828125, 0.267791748046875, 0.3017425537109375, 0.335693359375, 0.3696441650390625, 0.403594970703125, 0.4375457763671875, 0.47149658203125, 0.5054473876953125, 0.539398193359375, 0.5733489990234375, 0.6072998046875, 0.6412506103515625, 0.675201416015625, 0.7091522216796875, 0.74310302734375, 0.7770538330078125, 0.811004638671875, 0.8449554443359375, 0.87890625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 16.0, 10.0, 17.0, 28.0, 38.0, 36.0, 56.0, 68.0, 52.0, 66.0, 73.0, 75.0, 99.0, 68.0, 52.0, 53.0, 46.0, 38.0, 27.0, 16.0, 19.0, 27.0, 4.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3045148849487305, -6.111701011657715, -5.918887138366699, -5.726073265075684, -5.533259391784668, -5.340445518493652, -5.147631645202637, -4.954817771911621, -4.7620038986206055, -4.56919002532959, -4.376376152038574, -4.183562278747559, -3.990748405456543, -3.7979345321655273, -3.605120897293091, -3.412307024002075, -3.2194933891296387, -3.026679515838623, -2.8338656425476074, -2.641051769256592, -2.448237895965576, -2.2554240226745605, -2.062610387802124, -1.8697965145111084, -1.6769826412200928, -1.4841687679290771, -1.2913548946380615, -1.0985411405563354, -0.9057272672653198, -0.7129133939743042, -0.5200996398925781, -0.3272857666015625, -0.13447141647338867, 0.058342427015304565, 0.2511562705039978, 0.44397008419036865, 0.6367839574813843, 0.8295978307723999, 1.022411584854126, 1.2152254581451416, 1.4080393314361572, 1.6008532047271729, 1.7936670780181885, 1.9864808320999146, 2.1792945861816406, 2.3721084594726562, 2.564922332763672, 2.7577362060546875, 2.950550079345703, 3.1433639526367188, 3.3361778259277344, 3.52899169921875, 3.7218055725097656, 3.9146194458007812, 4.107433319091797, 4.3002471923828125, 4.493061065673828, 4.685874938964844, 4.878688812255859, 5.071502685546875, 5.264316558837891, 5.457130432128906, 5.649944305419922, 5.8427581787109375, 6.035571575164795]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 12.0, 13.0, 10.0, 20.0, 18.0, 20.0, 23.0, 36.0, 32.0, 37.0, 47.0, 48.0, 52.0, 50.0, 50.0, 46.0, 49.0, 55.0, 40.0, 54.0, 38.0, 46.0, 42.0, 32.0, 24.0, 18.0, 14.0, 15.0, 11.0, 8.0, 12.0, 3.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.694814682006836, -9.386423110961914, -9.078031539916992, -8.769640922546387, -8.461249351501465, -8.152857780456543, -7.844466209411621, -7.536074638366699, -7.2276835441589355, -6.919291973114014, -6.61090087890625, -6.302509307861328, -5.994117736816406, -5.685726642608643, -5.377335071563721, -5.068943977355957, -4.760552406311035, -4.452160835266113, -4.14376974105835, -3.8353781700134277, -3.526986837387085, -3.218595504760742, -2.9102039337158203, -2.6018126010894775, -2.2934212684631348, -1.985029935836792, -1.6766384840011597, -1.3682470321655273, -1.0598556995391846, -0.7514643669128418, -0.4430729150772095, -0.13468146324157715, 0.17371082305908203, 0.4821022152900696, 0.7904936075210571, 1.0988850593566895, 1.4072763919830322, 1.715667724609375, 2.024059295654297, 2.3324506282806396, 2.6408419609069824, 2.949233293533325, 3.257624626159668, 3.56601619720459, 3.8744075298309326, 4.182798862457275, 4.491190433502197, 4.799581527709961, 5.107973098754883, 5.416364669799805, 5.724755764007568, 6.03314733505249, 6.341538429260254, 6.649930000305176, 6.958321571350098, 7.2667131423950195, 7.575104236602783, 7.883495807647705, 8.191886901855469, 8.50027847290039, 8.808670043945312, 9.117061614990234, 9.42545223236084, 9.733843803405762, 10.042235374450684]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 14.0, 15.0, 40.0, 52.0, 108.0, 158.0, 268.0, 463.0, 920.0, 1935.0, 4949.0, 16966.0, 85556.0, 676130.0, 2440891.0, 832948.0, 104197.0, 19205.0, 5313.0, 2054.0, 983.0, 481.0, 254.0, 142.0, 86.0, 60.0, 34.0, 17.0, 14.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.421875, -5.281219482421875, -5.14056396484375, -4.999908447265625, -4.8592529296875, -4.718597412109375, -4.57794189453125, -4.437286376953125, -4.296630859375, -4.155975341796875, -4.01531982421875, -3.874664306640625, -3.7340087890625, -3.593353271484375, -3.45269775390625, -3.312042236328125, -3.17138671875, -3.030731201171875, -2.89007568359375, -2.749420166015625, -2.6087646484375, -2.468109130859375, -2.32745361328125, -2.186798095703125, -2.046142578125, -1.905487060546875, -1.76483154296875, -1.624176025390625, -1.4835205078125, -1.342864990234375, -1.20220947265625, -1.061553955078125, -0.9208984375, -0.780242919921875, -0.63958740234375, -0.498931884765625, -0.3582763671875, -0.217620849609375, -0.07696533203125, 0.063690185546875, 0.204345703125, 0.345001220703125, 0.48565673828125, 0.626312255859375, 0.7669677734375, 0.907623291015625, 1.04827880859375, 1.188934326171875, 1.32958984375, 1.470245361328125, 1.61090087890625, 1.751556396484375, 1.8922119140625, 2.032867431640625, 2.17352294921875, 2.314178466796875, 2.454833984375, 2.595489501953125, 2.73614501953125, 2.876800537109375, 3.0174560546875, 3.158111572265625, 3.29876708984375, 3.439422607421875, 3.580078125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 3.0, 15.0, 8.0, 11.0, 20.0, 11.0, 20.0, 16.0, 23.0, 23.0, 18.0, 31.0, 29.0, 31.0, 39.0, 37.0, 51.0, 44.0, 31.0, 37.0, 39.0, 37.0, 45.0, 49.0, 41.0, 28.0, 34.0, 31.0, 22.0, 25.0, 21.0, 21.0, 24.0, 14.0, 14.0, 10.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.373046875, -2.2923583984375, -2.211669921875, -2.1309814453125, -2.05029296875, -1.9696044921875, -1.888916015625, -1.8082275390625, -1.7275390625, -1.6468505859375, -1.566162109375, -1.4854736328125, -1.40478515625, -1.3240966796875, -1.243408203125, -1.1627197265625, -1.08203125, -1.0013427734375, -0.920654296875, -0.8399658203125, -0.75927734375, -0.6785888671875, -0.597900390625, -0.5172119140625, -0.4365234375, -0.3558349609375, -0.275146484375, -0.1944580078125, -0.11376953125, -0.0330810546875, 0.047607421875, 0.1282958984375, 0.208984375, 0.2896728515625, 0.370361328125, 0.4510498046875, 0.53173828125, 0.6124267578125, 0.693115234375, 0.7738037109375, 0.8544921875, 0.9351806640625, 1.015869140625, 1.0965576171875, 1.17724609375, 1.2579345703125, 1.338623046875, 1.4193115234375, 1.5, 1.5806884765625, 1.661376953125, 1.7420654296875, 1.82275390625, 1.9034423828125, 1.984130859375, 2.0648193359375, 2.1455078125, 2.2261962890625, 2.306884765625, 2.3875732421875, 2.46826171875, 2.5489501953125, 2.629638671875, 2.7103271484375, 2.791015625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 12.0, 17.0, 19.0, 20.0, 43.0, 80.0, 126.0, 248.0, 642.0, 2142.0, 16448.0, 1078343.0, 3060309.0, 31290.0, 3065.0, 771.0, 302.0, 142.0, 102.0, 47.0, 36.0, 25.0, 12.0, 7.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3828125, -11.0390625, -10.6953125, -10.3515625, -10.0078125, -9.6640625, -9.3203125, -8.9765625, -8.6328125, -8.2890625, -7.9453125, -7.6015625, -7.2578125, -6.9140625, -6.5703125, -6.2265625, -5.8828125, -5.5390625, -5.1953125, -4.8515625, -4.5078125, -4.1640625, -3.8203125, -3.4765625, -3.1328125, -2.7890625, -2.4453125, -2.1015625, -1.7578125, -1.4140625, -1.0703125, -0.7265625, -0.3828125, -0.0390625, 0.3046875, 0.6484375, 0.9921875, 1.3359375, 1.6796875, 2.0234375, 2.3671875, 2.7109375, 3.0546875, 3.3984375, 3.7421875, 4.0859375, 4.4296875, 4.7734375, 5.1171875, 5.4609375, 5.8046875, 6.1484375, 6.4921875, 6.8359375, 7.1796875, 7.5234375, 7.8671875, 8.2109375, 8.5546875, 8.8984375, 9.2421875, 9.5859375, 9.9296875, 10.2734375, 10.6171875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 3.0, 5.0, 8.0, 6.0, 10.0, 10.0, 17.0, 19.0, 31.0, 26.0, 53.0, 73.0, 102.0, 150.0, 221.0, 283.0, 382.0, 474.0, 500.0, 403.0, 353.0, 272.0, 181.0, 127.0, 101.0, 64.0, 57.0, 31.0, 26.0, 19.0, 10.0, 8.0, 13.0, 6.0, 4.0, 3.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.3701171875, -1.3249969482421875, -1.279876708984375, -1.2347564697265625, -1.18963623046875, -1.1445159912109375, -1.099395751953125, -1.0542755126953125, -1.0091552734375, -0.9640350341796875, -0.918914794921875, -0.8737945556640625, -0.82867431640625, -0.7835540771484375, -0.738433837890625, -0.6933135986328125, -0.648193359375, -0.6030731201171875, -0.557952880859375, -0.5128326416015625, -0.46771240234375, -0.4225921630859375, -0.377471923828125, -0.3323516845703125, -0.2872314453125, -0.2421112060546875, -0.196990966796875, -0.1518707275390625, -0.10675048828125, -0.0616302490234375, -0.016510009765625, 0.0286102294921875, 0.07373046875, 0.1188507080078125, 0.163970947265625, 0.2090911865234375, 0.25421142578125, 0.2993316650390625, 0.344451904296875, 0.3895721435546875, 0.4346923828125, 0.4798126220703125, 0.524932861328125, 0.5700531005859375, 0.61517333984375, 0.6602935791015625, 0.705413818359375, 0.7505340576171875, 0.795654296875, 0.8407745361328125, 0.885894775390625, 0.9310150146484375, 0.97613525390625, 1.0212554931640625, 1.066375732421875, 1.1114959716796875, 1.1566162109375, 1.2017364501953125, 1.246856689453125, 1.2919769287109375, 1.33709716796875, 1.3822174072265625, 1.427337646484375, 1.4724578857421875, 1.517578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 8.0, 16.0, 25.0, 23.0, 31.0, 37.0, 46.0, 50.0, 64.0, 71.0, 63.0, 68.0, 76.0, 57.0, 60.0, 58.0, 59.0, 49.0, 26.0, 36.0, 24.0, 8.0, 12.0, 6.0, 6.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.058391571044922, -2.923959732055664, -2.789527654647827, -2.6550958156585693, -2.5206637382507324, -2.3862318992614746, -2.251800060272217, -2.11736798286438, -1.9829360246658325, -1.8485040664672852, -1.7140721082687378, -1.5796401500701904, -1.4452083110809326, -1.3107762336730957, -1.176344394683838, -1.0419124364852905, -0.9074804782867432, -0.7730485200881958, -0.6386165618896484, -0.5041846632957458, -0.3697527050971985, -0.23532074689865112, -0.10088884830474854, 0.03354310989379883, 0.1679750680923462, 0.30240702629089355, 0.43683895468711853, 0.5712708830833435, 0.7057028412818909, 0.8401347994804382, 0.9745666980743408, 1.1089986562728882, 1.2434306144714355, 1.377862572669983, 1.5122945308685303, 1.646726369857788, 1.781158447265625, 1.9155902862548828, 2.0500221252441406, 2.1844542026519775, 2.3188862800598145, 2.4533181190490723, 2.587750196456909, 2.722182035446167, 2.856614112854004, 2.9910459518432617, 3.1254777908325195, 3.2599098682403564, 3.3943417072296143, 3.528773546218872, 3.663205623626709, 3.797637462615967, 3.9320695400238037, 4.066501617431641, 4.200933456420898, 4.335365295410156, 4.469797134399414, 4.604228973388672, 4.73866081237793, 4.873093128204346, 5.0075249671936035, 5.141956806182861, 5.276388645172119, 5.410820960998535, 5.545252799987793]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 9.0, 11.0, 6.0, 10.0, 10.0, 12.0, 20.0, 20.0, 21.0, 19.0, 20.0, 23.0, 26.0, 25.0, 35.0, 40.0, 42.0, 55.0, 39.0, 41.0, 33.0, 45.0, 30.0, 43.0, 38.0, 29.0, 40.0, 31.0, 35.0, 35.0, 24.0, 22.0, 30.0, 18.0, 7.0, 9.0, 8.0, 5.0, 7.0, 10.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.383267879486084, -3.282144069671631, -3.1810200214385986, -3.0798962116241455, -2.9787721633911133, -2.87764835357666, -2.776524543762207, -2.675400733947754, -2.5742766857147217, -2.4731528759002686, -2.3720288276672363, -2.270905017852783, -2.16978120803833, -2.068657159805298, -1.9675333499908447, -1.866409420967102, -1.7652854919433594, -1.6641615629196167, -1.563037633895874, -1.461913824081421, -1.3607898950576782, -1.2596659660339355, -1.1585421562194824, -1.0574182271957397, -0.9562942981719971, -0.8551703691482544, -0.7540464997291565, -0.6529226303100586, -0.5517987012863159, -0.45067477226257324, -0.34955090284347534, -0.24842703342437744, -0.14730310440063477, -0.04617920517921448, 0.05494469404220581, 0.1560685932636261, 0.2571924924850464, 0.35831642150878906, 0.45944029092788696, 0.5605641603469849, 0.6616880893707275, 0.7628120183944702, 0.8639358878135681, 0.965059757232666, 1.0661836862564087, 1.1673076152801514, 1.2684314250946045, 1.3695553541183472, 1.4706792831420898, 1.5718032121658325, 1.6729271411895752, 1.7740509510040283, 1.875174880027771, 1.9762988090515137, 2.077422618865967, 2.17854642868042, 2.279670476913452, 2.3807942867279053, 2.4819183349609375, 2.5830421447753906, 2.6841659545898438, 2.785290002822876, 2.886413812637329, 2.9875378608703613, 3.0886616706848145]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 9.0, 12.0, 9.0, 15.0, 28.0, 36.0, 41.0, 42.0, 78.0, 111.0, 175.0, 288.0, 478.0, 843.0, 1584.0, 3205.0, 8517.0, 31105.0, 151964.0, 504876.0, 268588.0, 54171.0, 13219.0, 4639.0, 1995.0, 998.0, 569.0, 334.0, 186.0, 140.0, 87.0, 64.0, 41.0, 28.0, 13.0, 14.0, 11.0, 11.0, 6.0, 6.0, 7.0, 0.0, 3.0, 6.0, 2.0, 1.0], "bins": [-0.974609375, -0.9487457275390625, -0.922882080078125, -0.8970184326171875, -0.87115478515625, -0.8452911376953125, -0.819427490234375, -0.7935638427734375, -0.7677001953125, -0.7418365478515625, -0.715972900390625, -0.6901092529296875, -0.66424560546875, -0.6383819580078125, -0.612518310546875, -0.5866546630859375, -0.560791015625, -0.5349273681640625, -0.509063720703125, -0.4832000732421875, -0.45733642578125, -0.4314727783203125, -0.405609130859375, -0.3797454833984375, -0.3538818359375, -0.3280181884765625, -0.302154541015625, -0.2762908935546875, -0.25042724609375, -0.2245635986328125, -0.198699951171875, -0.1728363037109375, -0.14697265625, -0.1211090087890625, -0.095245361328125, -0.0693817138671875, -0.04351806640625, -0.0176544189453125, 0.008209228515625, 0.0340728759765625, 0.0599365234375, 0.0858001708984375, 0.111663818359375, 0.1375274658203125, 0.16339111328125, 0.1892547607421875, 0.215118408203125, 0.2409820556640625, 0.266845703125, 0.2927093505859375, 0.318572998046875, 0.3444366455078125, 0.37030029296875, 0.3961639404296875, 0.422027587890625, 0.4478912353515625, 0.4737548828125, 0.4996185302734375, 0.525482177734375, 0.5513458251953125, 0.57720947265625, 0.6030731201171875, 0.628936767578125, 0.6548004150390625, 0.6806640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 9.0, 8.0, 9.0, 11.0, 19.0, 15.0, 13.0, 27.0, 22.0, 20.0, 26.0, 31.0, 34.0, 40.0, 46.0, 41.0, 49.0, 45.0, 27.0, 50.0, 44.0, 49.0, 39.0, 40.0, 42.0, 40.0, 37.0, 22.0, 25.0, 23.0, 20.0, 14.0, 9.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0], "bins": [-2.466796875, -2.3994293212890625, -2.332061767578125, -2.2646942138671875, -2.19732666015625, -2.1299591064453125, -2.062591552734375, -1.9952239990234375, -1.9278564453125, -1.8604888916015625, -1.793121337890625, -1.7257537841796875, -1.65838623046875, -1.5910186767578125, -1.523651123046875, -1.4562835693359375, -1.388916015625, -1.3215484619140625, -1.254180908203125, -1.1868133544921875, -1.11944580078125, -1.0520782470703125, -0.984710693359375, -0.9173431396484375, -0.8499755859375, -0.7826080322265625, -0.715240478515625, -0.6478729248046875, -0.58050537109375, -0.5131378173828125, -0.445770263671875, -0.3784027099609375, -0.31103515625, -0.2436676025390625, -0.176300048828125, -0.1089324951171875, -0.04156494140625, 0.0258026123046875, 0.093170166015625, 0.1605377197265625, 0.2279052734375, 0.2952728271484375, 0.362640380859375, 0.4300079345703125, 0.49737548828125, 0.5647430419921875, 0.632110595703125, 0.6994781494140625, 0.766845703125, 0.8342132568359375, 0.901580810546875, 0.9689483642578125, 1.03631591796875, 1.1036834716796875, 1.171051025390625, 1.2384185791015625, 1.3057861328125, 1.3731536865234375, 1.440521240234375, 1.5078887939453125, 1.57525634765625, 1.6426239013671875, 1.709991455078125, 1.7773590087890625, 1.8447265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 6.0, 12.0, 16.0, 25.0, 24.0, 45.0, 75.0, 122.0, 230.0, 469.0, 857.0, 1901.0, 4089.0, 8908.0, 19797.0, 43697.0, 93367.0, 183521.0, 265505.0, 212482.0, 113807.0, 53824.0, 24718.0, 11420.0, 5036.0, 2298.0, 1095.0, 554.0, 277.0, 146.0, 93.0, 42.0, 31.0, 25.0, 16.0, 10.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2759056091308594, -0.26689910888671875, -0.2578926086425781, -0.2488861083984375, -0.23987960815429688, -0.23087310791015625, -0.22186660766601562, -0.212860107421875, -0.20385360717773438, -0.19484710693359375, -0.18584060668945312, -0.1768341064453125, -0.16782760620117188, -0.15882110595703125, -0.14981460571289062, -0.14080810546875, -0.13180160522460938, -0.12279510498046875, -0.11378860473632812, -0.1047821044921875, -0.09577560424804688, -0.08676910400390625, -0.07776260375976562, -0.068756103515625, -0.059749603271484375, -0.05074310302734375, -0.041736602783203125, -0.0327301025390625, -0.023723602294921875, -0.01471710205078125, -0.005710601806640625, 0.0032958984375, 0.012302398681640625, 0.02130889892578125, 0.030315399169921875, 0.0393218994140625, 0.048328399658203125, 0.05733489990234375, 0.06634140014648438, 0.075347900390625, 0.08435440063476562, 0.09336090087890625, 0.10236740112304688, 0.1113739013671875, 0.12038040161132812, 0.12938690185546875, 0.13839340209960938, 0.14739990234375, 0.15640640258789062, 0.16541290283203125, 0.17441940307617188, 0.1834259033203125, 0.19243240356445312, 0.20143890380859375, 0.21044540405273438, 0.219451904296875, 0.22845840454101562, 0.23746490478515625, 0.24647140502929688, 0.2554779052734375, 0.2644844055175781, 0.27349090576171875, 0.2824974060058594, 0.29150390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 8.0, 2.0, 6.0, 6.0, 6.0, 10.0, 12.0, 12.0, 15.0, 18.0, 31.0, 31.0, 20.0, 35.0, 44.0, 34.0, 42.0, 56.0, 51.0, 44.0, 42.0, 50.0, 44.0, 37.0, 48.0, 38.0, 34.0, 39.0, 33.0, 18.0, 25.0, 18.0, 14.0, 20.0, 8.0, 6.0, 10.0, 15.0, 4.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.16253662109375, -4.0203857421875, -3.87823486328125, -3.736083984375, -3.59393310546875, -3.4517822265625, -3.30963134765625, -3.16748046875, -3.02532958984375, -2.8831787109375, -2.74102783203125, -2.598876953125, -2.45672607421875, -2.3145751953125, -2.17242431640625, -2.0302734375, -1.88812255859375, -1.7459716796875, -1.60382080078125, -1.461669921875, -1.31951904296875, -1.1773681640625, -1.03521728515625, -0.89306640625, -0.75091552734375, -0.6087646484375, -0.46661376953125, -0.324462890625, -0.18231201171875, -0.0401611328125, 0.10198974609375, 0.244140625, 0.38629150390625, 0.5284423828125, 0.67059326171875, 0.812744140625, 0.95489501953125, 1.0970458984375, 1.23919677734375, 1.38134765625, 1.52349853515625, 1.6656494140625, 1.80780029296875, 1.949951171875, 2.09210205078125, 2.2342529296875, 2.37640380859375, 2.5185546875, 2.66070556640625, 2.8028564453125, 2.94500732421875, 3.087158203125, 3.22930908203125, 3.3714599609375, 3.51361083984375, 3.65576171875, 3.79791259765625, 3.9400634765625, 4.08221435546875, 4.224365234375, 4.36651611328125, 4.5086669921875, 4.65081787109375, 4.79296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 7.0, 7.0, 10.0, 22.0, 18.0, 37.0, 52.0, 55.0, 86.0, 107.0, 216.0, 386.0, 737.0, 1708.0, 5715.0, 32590.0, 577613.0, 396397.0, 24968.0, 4822.0, 1501.0, 629.0, 322.0, 173.0, 114.0, 86.0, 47.0, 32.0, 29.0, 23.0, 18.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.171875, -0.1663188934326172, -0.16076278686523438, -0.15520668029785156, -0.14965057373046875, -0.14409446716308594, -0.13853836059570312, -0.1329822540283203, -0.1274261474609375, -0.12187004089355469, -0.11631393432617188, -0.11075782775878906, -0.10520172119140625, -0.09964561462402344, -0.09408950805664062, -0.08853340148925781, -0.082977294921875, -0.07742118835449219, -0.07186508178710938, -0.06630897521972656, -0.06075286865234375, -0.05519676208496094, -0.049640655517578125, -0.04408454895019531, -0.0385284423828125, -0.03297233581542969, -0.027416229248046875, -0.021860122680664062, -0.01630401611328125, -0.010747909545898438, -0.005191802978515625, 0.0003643035888671875, 0.00592041015625, 0.011476516723632812, 0.017032623291015625, 0.022588729858398438, 0.02814483642578125, 0.03370094299316406, 0.039257049560546875, 0.04481315612792969, 0.0503692626953125, 0.05592536926269531, 0.061481475830078125, 0.06703758239746094, 0.07259368896484375, 0.07814979553222656, 0.08370590209960938, 0.08926200866699219, 0.094818115234375, 0.10037422180175781, 0.10593032836914062, 0.11148643493652344, 0.11704254150390625, 0.12259864807128906, 0.12815475463867188, 0.1337108612060547, 0.1392669677734375, 0.1448230743408203, 0.15037918090820312, 0.15593528747558594, 0.16149139404296875, 0.16704750061035156, 0.17260360717773438, 0.1781597137451172, 0.1837158203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 9.0, 8.0, 6.0, 12.0, 8.0, 20.0, 30.0, 45.0, 40.0, 67.0, 80.0, 85.0, 96.0, 107.0, 97.0, 83.0, 45.0, 45.0, 27.0, 27.0, 19.0, 12.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16908073425293e-05, -5.9752725064754486e-05, -5.7814642786979675e-05, -5.5876560509204865e-05, -5.3938478231430054e-05, -5.200039595365524e-05, -5.006231367588043e-05, -4.812423139810562e-05, -4.618614912033081e-05, -4.4248066842556e-05, -4.230998456478119e-05, -4.037190228700638e-05, -3.843382000923157e-05, -3.6495737731456757e-05, -3.4557655453681946e-05, -3.2619573175907135e-05, -3.0681490898132324e-05, -2.8743408620357513e-05, -2.6805326342582703e-05, -2.4867244064807892e-05, -2.292916178703308e-05, -2.099107950925827e-05, -1.905299723148346e-05, -1.711491495370865e-05, -1.5176832675933838e-05, -1.3238750398159027e-05, -1.1300668120384216e-05, -9.362585842609406e-06, -7.424503564834595e-06, -5.486421287059784e-06, -3.548339009284973e-06, -1.6102567315101624e-06, 3.2782554626464844e-07, 2.2659078240394592e-06, 4.20399010181427e-06, 6.142072379589081e-06, 8.080154657363892e-06, 1.0018236935138702e-05, 1.1956319212913513e-05, 1.3894401490688324e-05, 1.5832483768463135e-05, 1.7770566046237946e-05, 1.9708648324012756e-05, 2.1646730601787567e-05, 2.3584812879562378e-05, 2.552289515733719e-05, 2.7460977435112e-05, 2.939905971288681e-05, 3.133714199066162e-05, 3.327522426843643e-05, 3.521330654621124e-05, 3.7151388823986053e-05, 3.9089471101760864e-05, 4.1027553379535675e-05, 4.2965635657310486e-05, 4.49037179350853e-05, 4.684180021286011e-05, 4.877988249063492e-05, 5.071796476840973e-05, 5.265604704618454e-05, 5.459412932395935e-05, 5.653221160173416e-05, 5.847029387950897e-05, 6.040837615728378e-05, 6.23464584350586e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 4.0, 13.0, 21.0, 22.0, 41.0, 65.0, 98.0, 202.0, 507.0, 1679.0, 7380.0, 62628.0, 898244.0, 67112.0, 7785.0, 1721.0, 497.0, 211.0, 101.0, 85.0, 37.0, 24.0, 24.0, 9.0, 5.0, 8.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.24936294555664062, -0.24091339111328125, -0.23246383666992188, -0.2240142822265625, -0.21556472778320312, -0.20711517333984375, -0.19866561889648438, -0.190216064453125, -0.18176651000976562, -0.17331695556640625, -0.16486740112304688, -0.1564178466796875, -0.14796829223632812, -0.13951873779296875, -0.13106918334960938, -0.12261962890625, -0.11417007446289062, -0.10572052001953125, -0.09727096557617188, -0.0888214111328125, -0.08037185668945312, -0.07192230224609375, -0.06347274780273438, -0.055023193359375, -0.046573638916015625, -0.03812408447265625, -0.029674530029296875, -0.0212249755859375, -0.012775421142578125, -0.00432586669921875, 0.004123687744140625, 0.0125732421875, 0.021022796630859375, 0.02947235107421875, 0.037921905517578125, 0.0463714599609375, 0.054821014404296875, 0.06327056884765625, 0.07172012329101562, 0.080169677734375, 0.08861923217773438, 0.09706878662109375, 0.10551834106445312, 0.1139678955078125, 0.12241744995117188, 0.13086700439453125, 0.13931655883789062, 0.14776611328125, 0.15621566772460938, 0.16466522216796875, 0.17311477661132812, 0.1815643310546875, 0.19001388549804688, 0.19846343994140625, 0.20691299438476562, 0.215362548828125, 0.22381210327148438, 0.23226165771484375, 0.24071121215820312, 0.2491607666015625, 0.2576103210449219, 0.26605987548828125, 0.2745094299316406, 0.282958984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 11.0, 14.0, 12.0, 14.0, 29.0, 52.0, 126.0, 298.0, 203.0, 82.0, 34.0, 24.0, 20.0, 18.0, 10.0, 4.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.071533203125, -0.06973075866699219, -0.06792831420898438, -0.06612586975097656, -0.06432342529296875, -0.06252098083496094, -0.060718536376953125, -0.05891609191894531, -0.0571136474609375, -0.05531120300292969, -0.053508758544921875, -0.05170631408691406, -0.04990386962890625, -0.04810142517089844, -0.046298980712890625, -0.04449653625488281, -0.042694091796875, -0.04089164733886719, -0.039089202880859375, -0.03728675842285156, -0.03548431396484375, -0.03368186950683594, -0.031879425048828125, -0.030076980590820312, -0.0282745361328125, -0.026472091674804688, -0.024669647216796875, -0.022867202758789062, -0.02106475830078125, -0.019262313842773438, -0.017459869384765625, -0.015657424926757812, -0.01385498046875, -0.012052536010742188, -0.010250091552734375, -0.008447647094726562, -0.00664520263671875, -0.0048427581787109375, -0.003040313720703125, -0.0012378692626953125, 0.0005645751953125, 0.0023670196533203125, 0.004169464111328125, 0.0059719085693359375, 0.00777435302734375, 0.009576797485351562, 0.011379241943359375, 0.013181686401367188, 0.014984130859375, 0.016786575317382812, 0.018589019775390625, 0.020391464233398438, 0.02219390869140625, 0.023996353149414062, 0.025798797607421875, 0.027601242065429688, 0.0294036865234375, 0.031206130981445312, 0.033008575439453125, 0.03481101989746094, 0.03661346435546875, 0.03841590881347656, 0.040218353271484375, 0.04202079772949219, 0.0438232421875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 4.0, 7.0, 12.0, 22.0, 33.0, 39.0, 57.0, 66.0, 76.0, 97.0, 84.0, 92.0, 76.0, 84.0, 77.0, 53.0, 36.0, 32.0, 18.0, 10.0, 11.0, 6.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4458606243133545, -3.347395658493042, -3.2489306926727295, -3.150465726852417, -3.0520005226135254, -2.953535556793213, -2.8550705909729004, -2.756605625152588, -2.6581406593322754, -2.559675693511963, -2.4612107276916504, -2.362745761871338, -2.2642807960510254, -2.165815591812134, -2.0673506259918213, -1.9688856601715088, -1.8704206943511963, -1.7719557285308838, -1.6734907627105713, -1.5750256776809692, -1.4765607118606567, -1.3780957460403442, -1.2796306610107422, -1.1811656951904297, -1.0827007293701172, -0.9842357635498047, -0.8857707381248474, -0.7873057126998901, -0.6888407468795776, -0.5903757810592651, -0.49191075563430786, -0.3934457302093506, -0.2949807643890381, -0.1965157687664032, -0.09805077314376831, 0.00041422247886657715, 0.09887921810150146, 0.19734421372413635, 0.29580920934677124, 0.3942742347717285, 0.492739200592041, 0.5912041664123535, 0.6896691918373108, 0.7881342172622681, 0.8865991830825806, 0.9850641489028931, 1.0835292339324951, 1.1819941997528076, 1.2804591655731201, 1.3789241313934326, 1.4773890972137451, 1.5758541822433472, 1.6743191480636597, 1.7727841138839722, 1.8712491989135742, 1.9697141647338867, 2.068179130554199, 2.1666440963745117, 2.265109062194824, 2.3635740280151367, 2.462038993835449, 2.560504198074341, 2.6589691638946533, 2.757434129714966, 2.8558990955352783]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 11.0, 4.0, 11.0, 10.0, 11.0, 15.0, 20.0, 25.0, 21.0, 22.0, 15.0, 23.0, 33.0, 36.0, 33.0, 52.0, 52.0, 47.0, 45.0, 40.0, 41.0, 36.0, 41.0, 38.0, 42.0, 37.0, 33.0, 26.0, 42.0, 14.0, 26.0, 27.0, 8.0, 14.0, 6.0, 8.0, 5.0, 8.0, 0.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.075538158416748, -2.012981653213501, -1.950425148010254, -1.8878685235977173, -1.8253120183944702, -1.7627555131912231, -1.7001988887786865, -1.6376423835754395, -1.5750858783721924, -1.5125293731689453, -1.4499728679656982, -1.3874162435531616, -1.3248597383499146, -1.2623032331466675, -1.1997466087341309, -1.1371901035308838, -1.0746335983276367, -1.0120770931243896, -0.9495205283164978, -0.886963963508606, -0.8244074583053589, -0.7618509531021118, -0.69929438829422, -0.6367378234863281, -0.574181318283081, -0.511624813079834, -0.44906824827194214, -0.3865117132663727, -0.3239551782608032, -0.26139864325523376, -0.1988421082496643, -0.13628557324409485, -0.07372915744781494, -0.011172622442245483, 0.051383912563323975, 0.11394044756889343, 0.1764969825744629, 0.23905351758003235, 0.3016100525856018, 0.36416658759117126, 0.4267231225967407, 0.4892796576023102, 0.5518361926078796, 0.6143927574157715, 0.6769492626190186, 0.7395057678222656, 0.8020623326301575, 0.8646188974380493, 0.9271754026412964, 0.9897319078445435, 1.05228853225708, 1.1148450374603271, 1.1774015426635742, 1.2399580478668213, 1.3025145530700684, 1.365071177482605, 1.427627682685852, 1.4901841878890991, 1.5527408123016357, 1.6152973175048828, 1.6778538227081299, 1.740410327911377, 1.802966833114624, 1.8655234575271606, 1.9280799627304077]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 10.0, 14.0, 14.0, 29.0, 35.0, 52.0, 87.0, 172.0, 254.0, 401.0, 835.0, 1591.0, 3217.0, 7048.0, 15984.0, 38859.0, 100265.0, 261850.0, 355543.0, 159474.0, 59233.0, 23927.0, 10249.0, 4706.0, 2214.0, 1120.0, 521.0, 307.0, 205.0, 128.0, 79.0, 46.0, 31.0, 12.0, 18.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.15985107421875, -2.0775146484375, -1.99517822265625, -1.912841796875, -1.83050537109375, -1.7481689453125, -1.66583251953125, -1.58349609375, -1.50115966796875, -1.4188232421875, -1.33648681640625, -1.254150390625, -1.17181396484375, -1.0894775390625, -1.00714111328125, -0.9248046875, -0.84246826171875, -0.7601318359375, -0.67779541015625, -0.595458984375, -0.51312255859375, -0.4307861328125, -0.34844970703125, -0.26611328125, -0.18377685546875, -0.1014404296875, -0.01910400390625, 0.063232421875, 0.14556884765625, 0.2279052734375, 0.31024169921875, 0.392578125, 0.47491455078125, 0.5572509765625, 0.63958740234375, 0.721923828125, 0.80426025390625, 0.8865966796875, 0.96893310546875, 1.05126953125, 1.13360595703125, 1.2159423828125, 1.29827880859375, 1.380615234375, 1.46295166015625, 1.5452880859375, 1.62762451171875, 1.7099609375, 1.79229736328125, 1.8746337890625, 1.95697021484375, 2.039306640625, 2.12164306640625, 2.2039794921875, 2.28631591796875, 2.36865234375, 2.45098876953125, 2.5333251953125, 2.61566162109375, 2.697998046875, 2.78033447265625, 2.8626708984375, 2.94500732421875, 3.02734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 8.0, 10.0, 13.0, 10.0, 15.0, 13.0, 19.0, 20.0, 28.0, 23.0, 33.0, 31.0, 42.0, 48.0, 39.0, 57.0, 44.0, 41.0, 56.0, 44.0, 53.0, 32.0, 45.0, 35.0, 36.0, 30.0, 25.0, 28.0, 31.0, 8.0, 21.0, 7.0, 11.0, 7.0, 7.0, 6.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.359375, -4.2303466796875, -4.101318359375, -3.9722900390625, -3.84326171875, -3.7142333984375, -3.585205078125, -3.4561767578125, -3.3271484375, -3.1981201171875, -3.069091796875, -2.9400634765625, -2.81103515625, -2.6820068359375, -2.552978515625, -2.4239501953125, -2.294921875, -2.1658935546875, -2.036865234375, -1.9078369140625, -1.77880859375, -1.6497802734375, -1.520751953125, -1.3917236328125, -1.2626953125, -1.1336669921875, -1.004638671875, -0.8756103515625, -0.74658203125, -0.6175537109375, -0.488525390625, -0.3594970703125, -0.23046875, -0.1014404296875, 0.027587890625, 0.1566162109375, 0.28564453125, 0.4146728515625, 0.543701171875, 0.6727294921875, 0.8017578125, 0.9307861328125, 1.059814453125, 1.1888427734375, 1.31787109375, 1.4468994140625, 1.575927734375, 1.7049560546875, 1.833984375, 1.9630126953125, 2.092041015625, 2.2210693359375, 2.35009765625, 2.4791259765625, 2.608154296875, 2.7371826171875, 2.8662109375, 2.9952392578125, 3.124267578125, 3.2532958984375, 3.38232421875, 3.5113525390625, 3.640380859375, 3.7694091796875, 3.8984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 0.0, 3.0, 8.0, 4.0, 8.0, 12.0, 6.0, 19.0, 23.0, 28.0, 44.0, 64.0, 95.0, 149.0, 233.0, 451.0, 1028.0, 4194.0, 25928.0, 280746.0, 653690.0, 70054.0, 8559.0, 1747.0, 622.0, 313.0, 159.0, 109.0, 73.0, 63.0, 37.0, 34.0, 10.0, 10.0, 5.0, 4.0, 9.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.9547119140625, -6.745361328125, -6.5360107421875, -6.32666015625, -6.1173095703125, -5.907958984375, -5.6986083984375, -5.4892578125, -5.2799072265625, -5.070556640625, -4.8612060546875, -4.65185546875, -4.4425048828125, -4.233154296875, -4.0238037109375, -3.814453125, -3.6051025390625, -3.395751953125, -3.1864013671875, -2.97705078125, -2.7677001953125, -2.558349609375, -2.3489990234375, -2.1396484375, -1.9302978515625, -1.720947265625, -1.5115966796875, -1.30224609375, -1.0928955078125, -0.883544921875, -0.6741943359375, -0.46484375, -0.2554931640625, -0.046142578125, 0.1632080078125, 0.37255859375, 0.5819091796875, 0.791259765625, 1.0006103515625, 1.2099609375, 1.4193115234375, 1.628662109375, 1.8380126953125, 2.04736328125, 2.2567138671875, 2.466064453125, 2.6754150390625, 2.884765625, 3.0941162109375, 3.303466796875, 3.5128173828125, 3.72216796875, 3.9315185546875, 4.140869140625, 4.3502197265625, 4.5595703125, 4.7689208984375, 4.978271484375, 5.1876220703125, 5.39697265625, 5.6063232421875, 5.815673828125, 6.0250244140625, 6.234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 5.0, 9.0, 14.0, 18.0, 27.0, 14.0, 34.0, 33.0, 32.0, 46.0, 45.0, 47.0, 51.0, 46.0, 46.0, 67.0, 56.0, 39.0, 49.0, 53.0, 37.0, 30.0, 34.0, 23.0, 28.0, 20.0, 18.0, 16.0, 7.0, 4.0, 5.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.73046875, -5.5633544921875, -5.396240234375, -5.2291259765625, -5.06201171875, -4.8948974609375, -4.727783203125, -4.5606689453125, -4.3935546875, -4.2264404296875, -4.059326171875, -3.8922119140625, -3.72509765625, -3.5579833984375, -3.390869140625, -3.2237548828125, -3.056640625, -2.8895263671875, -2.722412109375, -2.5552978515625, -2.38818359375, -2.2210693359375, -2.053955078125, -1.8868408203125, -1.7197265625, -1.5526123046875, -1.385498046875, -1.2183837890625, -1.05126953125, -0.8841552734375, -0.717041015625, -0.5499267578125, -0.3828125, -0.2156982421875, -0.048583984375, 0.1185302734375, 0.28564453125, 0.4527587890625, 0.619873046875, 0.7869873046875, 0.9541015625, 1.1212158203125, 1.288330078125, 1.4554443359375, 1.62255859375, 1.7896728515625, 1.956787109375, 2.1239013671875, 2.291015625, 2.4581298828125, 2.625244140625, 2.7923583984375, 2.95947265625, 3.1265869140625, 3.293701171875, 3.4608154296875, 3.6279296875, 3.7950439453125, 3.962158203125, 4.1292724609375, 4.29638671875, 4.4635009765625, 4.630615234375, 4.7977294921875, 4.96484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 11.0, 13.0, 15.0, 25.0, 41.0, 60.0, 67.0, 121.0, 201.0, 414.0, 865.0, 2432.0, 8762.0, 45218.0, 308825.0, 579359.0, 81922.0, 14249.0, 3576.0, 1196.0, 486.0, 252.0, 146.0, 77.0, 52.0, 50.0, 20.0, 26.0, 8.0, 11.0, 7.0, 8.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4482421875, -1.401763916015625, -1.35528564453125, -1.308807373046875, -1.2623291015625, -1.215850830078125, -1.16937255859375, -1.122894287109375, -1.076416015625, -1.029937744140625, -0.98345947265625, -0.936981201171875, -0.8905029296875, -0.844024658203125, -0.79754638671875, -0.751068115234375, -0.70458984375, -0.658111572265625, -0.61163330078125, -0.565155029296875, -0.5186767578125, -0.472198486328125, -0.42572021484375, -0.379241943359375, -0.332763671875, -0.286285400390625, -0.23980712890625, -0.193328857421875, -0.1468505859375, -0.100372314453125, -0.05389404296875, -0.007415771484375, 0.0390625, 0.085540771484375, 0.13201904296875, 0.178497314453125, 0.2249755859375, 0.271453857421875, 0.31793212890625, 0.364410400390625, 0.410888671875, 0.457366943359375, 0.50384521484375, 0.550323486328125, 0.5968017578125, 0.643280029296875, 0.68975830078125, 0.736236572265625, 0.78271484375, 0.829193115234375, 0.87567138671875, 0.922149658203125, 0.9686279296875, 1.015106201171875, 1.06158447265625, 1.108062744140625, 1.154541015625, 1.201019287109375, 1.24749755859375, 1.293975830078125, 1.3404541015625, 1.386932373046875, 1.43341064453125, 1.479888916015625, 1.5263671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 13.0, 8.0, 12.0, 15.0, 25.0, 22.0, 24.0, 47.0, 38.0, 79.0, 85.0, 145.0, 120.0, 93.0, 62.0, 52.0, 54.0, 22.0, 19.0, 12.0, 14.0, 14.0, 8.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002155303955078125, -0.00020856782793998718, -0.00020160526037216187, -0.00019464269280433655, -0.00018768012523651123, -0.0001807175576686859, -0.0001737549901008606, -0.00016679242253303528, -0.00015982985496520996, -0.00015286728739738464, -0.00014590471982955933, -0.000138942152261734, -0.0001319795846939087, -0.00012501701712608337, -0.00011805444955825806, -0.00011109188199043274, -0.00010412931442260742, -9.71667468547821e-05, -9.020417928695679e-05, -8.324161171913147e-05, -7.627904415130615e-05, -6.931647658348083e-05, -6.235390901565552e-05, -5.53913414478302e-05, -4.842877388000488e-05, -4.1466206312179565e-05, -3.450363874435425e-05, -2.754107117652893e-05, -2.0578503608703613e-05, -1.3615936040878296e-05, -6.6533684730529785e-06, 3.0919909477233887e-07, 7.271766662597656e-06, 1.4234334230422974e-05, 2.119690179824829e-05, 2.815946936607361e-05, 3.5122036933898926e-05, 4.208460450172424e-05, 4.904717206954956e-05, 5.600973963737488e-05, 6.29723072052002e-05, 6.993487477302551e-05, 7.689744234085083e-05, 8.386000990867615e-05, 9.082257747650146e-05, 9.778514504432678e-05, 0.0001047477126121521, 0.00011171028017997742, 0.00011867284774780273, 0.00012563541531562805, 0.00013259798288345337, 0.0001395605504512787, 0.000146523118019104, 0.00015348568558692932, 0.00016044825315475464, 0.00016741082072257996, 0.00017437338829040527, 0.0001813359558582306, 0.0001882985234260559, 0.00019526109099388123, 0.00020222365856170654, 0.00020918622612953186, 0.00021614879369735718, 0.0002231113612651825, 0.0002300739288330078]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 2.0, 5.0, 9.0, 12.0, 18.0, 47.0, 130.0, 334.0, 993.0, 3478.0, 29913.0, 824559.0, 178200.0, 8203.0, 1760.0, 562.0, 177.0, 69.0, 32.0, 18.0, 13.0, 3.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.8690185546875, -2.757568359375, -2.6461181640625, -2.53466796875, -2.4232177734375, -2.311767578125, -2.2003173828125, -2.0888671875, -1.9774169921875, -1.865966796875, -1.7545166015625, -1.64306640625, -1.5316162109375, -1.420166015625, -1.3087158203125, -1.197265625, -1.0858154296875, -0.974365234375, -0.8629150390625, -0.75146484375, -0.6400146484375, -0.528564453125, -0.4171142578125, -0.3056640625, -0.1942138671875, -0.082763671875, 0.0286865234375, 0.14013671875, 0.2515869140625, 0.363037109375, 0.4744873046875, 0.5859375, 0.6973876953125, 0.808837890625, 0.9202880859375, 1.03173828125, 1.1431884765625, 1.254638671875, 1.3660888671875, 1.4775390625, 1.5889892578125, 1.700439453125, 1.8118896484375, 1.92333984375, 2.0347900390625, 2.146240234375, 2.2576904296875, 2.369140625, 2.4805908203125, 2.592041015625, 2.7034912109375, 2.81494140625, 2.9263916015625, 3.037841796875, 3.1492919921875, 3.2607421875, 3.3721923828125, 3.483642578125, 3.5950927734375, 3.70654296875, 3.8179931640625, 3.929443359375, 4.0408935546875, 4.15234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 23.0, 30.0, 54.0, 61.0, 91.0, 153.0, 180.0, 142.0, 82.0, 52.0, 41.0, 31.0, 21.0, 8.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.388671875, -1.3550262451171875, -1.321380615234375, -1.2877349853515625, -1.25408935546875, -1.2204437255859375, -1.186798095703125, -1.1531524658203125, -1.1195068359375, -1.0858612060546875, -1.052215576171875, -1.0185699462890625, -0.98492431640625, -0.9512786865234375, -0.917633056640625, -0.8839874267578125, -0.850341796875, -0.8166961669921875, -0.783050537109375, -0.7494049072265625, -0.71575927734375, -0.6821136474609375, -0.648468017578125, -0.6148223876953125, -0.5811767578125, -0.5475311279296875, -0.513885498046875, -0.4802398681640625, -0.44659423828125, -0.4129486083984375, -0.379302978515625, -0.3456573486328125, -0.31201171875, -0.2783660888671875, -0.244720458984375, -0.2110748291015625, -0.17742919921875, -0.1437835693359375, -0.110137939453125, -0.0764923095703125, -0.0428466796875, -0.0092010498046875, 0.024444580078125, 0.0580902099609375, 0.09173583984375, 0.1253814697265625, 0.159027099609375, 0.1926727294921875, 0.226318359375, 0.2599639892578125, 0.293609619140625, 0.3272552490234375, 0.36090087890625, 0.3945465087890625, 0.428192138671875, 0.4618377685546875, 0.4954833984375, 0.5291290283203125, 0.562774658203125, 0.5964202880859375, 0.63006591796875, 0.6637115478515625, 0.697357177734375, 0.7310028076171875, 0.7646484375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 17.0, 35.0, 72.0, 120.0, 182.0, 193.0, 150.0, 124.0, 60.0, 25.0, 8.0, 14.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.594183921813965, -9.166465759277344, -8.738748550415039, -8.311030387878418, -7.883312225341797, -7.455594062805176, -7.027876377105713, -6.60015869140625, -6.172440528869629, -5.744722366333008, -5.317004680633545, -4.889286994934082, -4.461568832397461, -4.03385066986084, -3.606132984161377, -3.178415060043335, -2.750697135925293, -2.322979211807251, -1.895261287689209, -1.467543363571167, -1.039825439453125, -0.612107515335083, -0.18438959121704102, 0.24332833290100098, 0.671046257019043, 1.098764181137085, 1.526482105255127, 1.954200029373169, 2.381917953491211, 2.809635877609253, 3.237353801727295, 3.665071725845337, 4.0927886962890625, 4.520506858825684, 4.9482245445251465, 5.375942230224609, 5.8036603927612305, 6.231378555297852, 6.6590962409973145, 7.086813926696777, 7.514532089233398, 7.9422502517700195, 8.36996841430664, 8.797685623168945, 9.225403785705566, 9.653121948242188, 10.080839157104492, 10.508557319641113, 10.936275482177734, 11.363993644714355, 11.791711807250977, 12.219429016113281, 12.647147178649902, 13.074865341186523, 13.502582550048828, 13.93030071258545, 14.35801887512207, 14.785737037658691, 15.213455200195312, 15.641172409057617, 16.068889617919922, 16.49660873413086, 16.924325942993164, 17.3520450592041, 17.779762268066406]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 8.0, 7.0, 10.0, 10.0, 16.0, 16.0, 18.0, 27.0, 19.0, 26.0, 20.0, 31.0, 24.0, 34.0, 39.0, 42.0, 45.0, 51.0, 34.0, 57.0, 38.0, 44.0, 44.0, 41.0, 28.0, 34.0, 33.0, 21.0, 32.0, 26.0, 17.0, 21.0, 11.0, 15.0, 7.0, 5.0, 9.0, 5.0, 7.0, 4.0, 1.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.976343631744385, -6.751397609710693, -6.526451587677002, -6.301505088806152, -6.076559066772461, -5.8516130447387695, -5.626667022705078, -5.401721000671387, -5.176774978637695, -4.951828956604004, -4.7268829345703125, -4.501936912536621, -4.2769904136657715, -4.05204439163208, -3.8270983695983887, -3.6021523475646973, -3.3772060871124268, -3.1522600650787354, -2.927313804626465, -2.7023677825927734, -2.477421760559082, -2.2524757385253906, -2.02752947807312, -1.8025834560394287, -1.5776373147964478, -1.3526911735534668, -1.1277451515197754, -0.9027990102767944, -0.6778529286384583, -0.45290684700012207, -0.2279607057571411, -0.003014683723449707, 0.22193145751953125, 0.44687753915786743, 0.6718236207962036, 0.8967697620391846, 1.121715784072876, 1.346661925315857, 1.571608066558838, 1.7965540885925293, 2.0215001106262207, 2.246446132659912, 2.4713923931121826, 2.696338415145874, 2.9212844371795654, 3.146230697631836, 3.3711767196655273, 3.5961227416992188, 3.8210690021514893, 4.04601526260376, 4.270961284637451, 4.495907306671143, 4.720853328704834, 4.945799350738525, 5.170745849609375, 5.395691871643066, 5.620637893676758, 5.845583915710449, 6.070529937744141, 6.295475959777832, 6.520422458648682, 6.745368480682373, 6.9703145027160645, 7.195260524749756, 7.420206546783447]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 13.0, 18.0, 19.0, 18.0, 30.0, 28.0, 61.0, 60.0, 98.0, 105.0, 154.0, 186.0, 284.0, 478.0, 904.0, 2167.0, 7810.0, 62446.0, 1293664.0, 2620416.0, 184603.0, 14551.0, 3201.0, 1157.0, 596.0, 318.0, 211.0, 168.0, 105.0, 96.0, 72.0, 50.0, 39.0, 38.0, 22.0, 19.0, 20.0, 12.0, 10.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.046875, -5.85296630859375, -5.6590576171875, -5.46514892578125, -5.271240234375, -5.07733154296875, -4.8834228515625, -4.68951416015625, -4.49560546875, -4.30169677734375, -4.1077880859375, -3.91387939453125, -3.719970703125, -3.52606201171875, -3.3321533203125, -3.13824462890625, -2.9443359375, -2.75042724609375, -2.5565185546875, -2.36260986328125, -2.168701171875, -1.97479248046875, -1.7808837890625, -1.58697509765625, -1.39306640625, -1.19915771484375, -1.0052490234375, -0.81134033203125, -0.617431640625, -0.42352294921875, -0.2296142578125, -0.03570556640625, 0.158203125, 0.35211181640625, 0.5460205078125, 0.73992919921875, 0.933837890625, 1.12774658203125, 1.3216552734375, 1.51556396484375, 1.70947265625, 1.90338134765625, 2.0972900390625, 2.29119873046875, 2.485107421875, 2.67901611328125, 2.8729248046875, 3.06683349609375, 3.2607421875, 3.45465087890625, 3.6485595703125, 3.84246826171875, 4.036376953125, 4.23028564453125, 4.4241943359375, 4.61810302734375, 4.81201171875, 5.00592041015625, 5.1998291015625, 5.39373779296875, 5.587646484375, 5.78155517578125, 5.9754638671875, 6.16937255859375, 6.36328125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 10.0, 11.0, 14.0, 19.0, 25.0, 21.0, 29.0, 26.0, 28.0, 30.0, 36.0, 27.0, 23.0, 38.0, 39.0, 56.0, 45.0, 48.0, 41.0, 46.0, 38.0, 37.0, 39.0, 33.0, 27.0, 33.0, 26.0, 26.0, 14.0, 15.0, 12.0, 15.0, 10.0, 5.0, 12.0, 8.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.287109375, -2.212738037109375, -2.13836669921875, -2.063995361328125, -1.9896240234375, -1.915252685546875, -1.84088134765625, -1.766510009765625, -1.692138671875, -1.617767333984375, -1.54339599609375, -1.469024658203125, -1.3946533203125, -1.320281982421875, -1.24591064453125, -1.171539306640625, -1.09716796875, -1.022796630859375, -0.94842529296875, -0.874053955078125, -0.7996826171875, -0.725311279296875, -0.65093994140625, -0.576568603515625, -0.502197265625, -0.427825927734375, -0.35345458984375, -0.279083251953125, -0.2047119140625, -0.130340576171875, -0.05596923828125, 0.018402099609375, 0.0927734375, 0.167144775390625, 0.24151611328125, 0.315887451171875, 0.3902587890625, 0.464630126953125, 0.53900146484375, 0.613372802734375, 0.687744140625, 0.762115478515625, 0.83648681640625, 0.910858154296875, 0.9852294921875, 1.059600830078125, 1.13397216796875, 1.208343505859375, 1.28271484375, 1.357086181640625, 1.43145751953125, 1.505828857421875, 1.5802001953125, 1.654571533203125, 1.72894287109375, 1.803314208984375, 1.877685546875, 1.952056884765625, 2.02642822265625, 2.100799560546875, 2.1751708984375, 2.249542236328125, 2.32391357421875, 2.398284912109375, 2.47265625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 6.0, 6.0, 11.0, 18.0, 22.0, 41.0, 68.0, 157.0, 382.0, 1034.0, 4263.0, 64106.0, 3976602.0, 139772.0, 5658.0, 1323.0, 432.0, 196.0, 80.0, 32.0, 27.0, 12.0, 13.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.671875, -12.325439453125, -11.97900390625, -11.632568359375, -11.2861328125, -10.939697265625, -10.59326171875, -10.246826171875, -9.900390625, -9.553955078125, -9.20751953125, -8.861083984375, -8.5146484375, -8.168212890625, -7.82177734375, -7.475341796875, -7.12890625, -6.782470703125, -6.43603515625, -6.089599609375, -5.7431640625, -5.396728515625, -5.05029296875, -4.703857421875, -4.357421875, -4.010986328125, -3.66455078125, -3.318115234375, -2.9716796875, -2.625244140625, -2.27880859375, -1.932373046875, -1.5859375, -1.239501953125, -0.89306640625, -0.546630859375, -0.2001953125, 0.146240234375, 0.49267578125, 0.839111328125, 1.185546875, 1.531982421875, 1.87841796875, 2.224853515625, 2.5712890625, 2.917724609375, 3.26416015625, 3.610595703125, 3.95703125, 4.303466796875, 4.64990234375, 4.996337890625, 5.3427734375, 5.689208984375, 6.03564453125, 6.382080078125, 6.728515625, 7.074951171875, 7.42138671875, 7.767822265625, 8.1142578125, 8.460693359375, 8.80712890625, 9.153564453125, 9.5]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 14.0, 11.0, 17.0, 23.0, 36.0, 74.0, 73.0, 136.0, 215.0, 339.0, 484.0, 562.0, 556.0, 476.0, 374.0, 233.0, 137.0, 96.0, 80.0, 40.0, 31.0, 16.0, 16.0, 8.0, 7.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.91015625, -1.860107421875, -1.81005859375, -1.760009765625, -1.7099609375, -1.659912109375, -1.60986328125, -1.559814453125, -1.509765625, -1.459716796875, -1.40966796875, -1.359619140625, -1.3095703125, -1.259521484375, -1.20947265625, -1.159423828125, -1.109375, -1.059326171875, -1.00927734375, -0.959228515625, -0.9091796875, -0.859130859375, -0.80908203125, -0.759033203125, -0.708984375, -0.658935546875, -0.60888671875, -0.558837890625, -0.5087890625, -0.458740234375, -0.40869140625, -0.358642578125, -0.30859375, -0.258544921875, -0.20849609375, -0.158447265625, -0.1083984375, -0.058349609375, -0.00830078125, 0.041748046875, 0.091796875, 0.141845703125, 0.19189453125, 0.241943359375, 0.2919921875, 0.342041015625, 0.39208984375, 0.442138671875, 0.4921875, 0.542236328125, 0.59228515625, 0.642333984375, 0.6923828125, 0.742431640625, 0.79248046875, 0.842529296875, 0.892578125, 0.942626953125, 0.99267578125, 1.042724609375, 1.0927734375, 1.142822265625, 1.19287109375, 1.242919921875, 1.29296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 2.0, 7.0, 9.0, 5.0, 7.0, 7.0, 11.0, 10.0, 21.0, 18.0, 16.0, 16.0, 28.0, 20.0, 27.0, 37.0, 23.0, 45.0, 35.0, 30.0, 38.0, 34.0, 26.0, 54.0, 35.0, 40.0, 50.0, 31.0, 31.0, 33.0, 30.0, 21.0, 29.0, 22.0, 19.0, 15.0, 23.0, 15.0, 17.0, 7.0, 10.0, 8.0, 9.0, 7.0, 6.0, 1.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.0933501720428467, -2.023475170135498, -1.9536001682281494, -1.8837251663208008, -1.8138502836227417, -1.743975281715393, -1.6741002798080444, -1.6042252779006958, -1.5343503952026367, -1.464475393295288, -1.3946003913879395, -1.3247253894805908, -1.2548505067825317, -1.184975504875183, -1.1151005029678345, -1.0452255010604858, -0.9753504991531372, -0.9054754972457886, -0.8356005549430847, -0.7657255530357361, -0.6958506107330322, -0.6259756088256836, -0.556100606918335, -0.4862256348133087, -0.41635066270828247, -0.3464756906032562, -0.27660071849823, -0.20672571659088135, -0.1368507444858551, -0.06697577238082886, 0.0028992295265197754, 0.07277420163154602, 0.14264917373657227, 0.2125241458415985, 0.28239911794662476, 0.3522741198539734, 0.42214909195899963, 0.4920240640640259, 0.5618990659713745, 0.6317740678787231, 0.701649010181427, 0.7715240120887756, 0.8413989543914795, 0.9112739562988281, 0.9811489582061768, 1.0510239601135254, 1.120898962020874, 1.190773844718933, 1.2606488466262817, 1.3305238485336304, 1.400398850440979, 1.470273733139038, 1.5401487350463867, 1.6100237369537354, 1.679898738861084, 1.7497737407684326, 1.8196487426757812, 1.8895237445831299, 1.9593987464904785, 2.029273748397827, 2.099148750305176, 2.1690235137939453, 2.238898754119873, 2.3087735176086426, 2.378648519515991]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 10.0, 6.0, 8.0, 9.0, 20.0, 9.0, 17.0, 19.0, 19.0, 19.0, 33.0, 25.0, 31.0, 36.0, 31.0, 39.0, 35.0, 41.0, 46.0, 45.0, 39.0, 41.0, 42.0, 29.0, 45.0, 40.0, 28.0, 35.0, 27.0, 26.0, 18.0, 23.0, 25.0, 18.0, 12.0, 16.0, 8.0, 6.0, 4.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9165236949920654, -2.8275294303894043, -2.738535165786743, -2.649540901184082, -2.560546636581421, -2.4715523719787598, -2.3825583457946777, -2.2935640811920166, -2.2045698165893555, -2.1155755519866943, -2.026581287384033, -1.937587022781372, -1.8485928773880005, -1.7595986127853394, -1.6706043481826782, -1.5816102027893066, -1.492615818977356, -1.4036215543746948, -1.3146272897720337, -1.225633144378662, -1.136638879776001, -1.0476446151733398, -0.9586503505706787, -0.8696561455726624, -0.7806618809700012, -0.6916676163673401, -0.6026734113693237, -0.5136791467666626, -0.42468491196632385, -0.3356906771659851, -0.24669641256332397, -0.15770220756530762, -0.06870794296264648, 0.020286299288272858, 0.1092805415391922, 0.19827479124069214, 0.2872690260410309, 0.37626326084136963, 0.46525752544403076, 0.5542517304420471, 0.6432459950447083, 0.7322402596473694, 0.8212344646453857, 0.9102287292480469, 0.999222993850708, 1.0882172584533691, 1.1772115230560303, 1.2662056684494019, 1.355199933052063, 1.4441941976547241, 1.5331884622573853, 1.6221826076507568, 1.711176872253418, 1.800171136856079, 1.8891654014587402, 1.9781596660614014, 2.0671539306640625, 2.1561481952667236, 2.2451424598693848, 2.334136724472046, 2.423130989074707, 2.512125015258789, 2.6011195182800293, 2.6901135444641113, 2.7791078090667725]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 9.0, 10.0, 9.0, 18.0, 20.0, 34.0, 39.0, 51.0, 76.0, 108.0, 113.0, 151.0, 231.0, 332.0, 444.0, 656.0, 1378.0, 4955.0, 45721.0, 433937.0, 493845.0, 56701.0, 5870.0, 1411.0, 743.0, 467.0, 320.0, 221.0, 167.0, 109.0, 96.0, 82.0, 52.0, 40.0, 30.0, 20.0, 19.0, 18.0, 9.0, 12.0, 12.0, 2.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.078643798828125, -1.04498291015625, -1.011322021484375, -0.9776611328125, -0.944000244140625, -0.91033935546875, -0.876678466796875, -0.843017578125, -0.809356689453125, -0.77569580078125, -0.742034912109375, -0.7083740234375, -0.674713134765625, -0.64105224609375, -0.607391357421875, -0.57373046875, -0.540069580078125, -0.50640869140625, -0.472747802734375, -0.4390869140625, -0.405426025390625, -0.37176513671875, -0.338104248046875, -0.304443359375, -0.270782470703125, -0.23712158203125, -0.203460693359375, -0.1697998046875, -0.136138916015625, -0.10247802734375, -0.068817138671875, -0.03515625, -0.001495361328125, 0.03216552734375, 0.065826416015625, 0.0994873046875, 0.133148193359375, 0.16680908203125, 0.200469970703125, 0.234130859375, 0.267791748046875, 0.30145263671875, 0.335113525390625, 0.3687744140625, 0.402435302734375, 0.43609619140625, 0.469757080078125, 0.50341796875, 0.537078857421875, 0.57073974609375, 0.604400634765625, 0.6380615234375, 0.671722412109375, 0.70538330078125, 0.739044189453125, 0.772705078125, 0.806365966796875, 0.84002685546875, 0.873687744140625, 0.9073486328125, 0.941009521484375, 0.97467041015625, 1.008331298828125, 1.0419921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 8.0, 8.0, 11.0, 6.0, 10.0, 15.0, 11.0, 12.0, 9.0, 14.0, 29.0, 27.0, 27.0, 26.0, 31.0, 44.0, 31.0, 34.0, 38.0, 43.0, 44.0, 39.0, 43.0, 43.0, 44.0, 38.0, 26.0, 27.0, 37.0, 24.0, 30.0, 31.0, 30.0, 18.0, 20.0, 18.0, 10.0, 9.0, 12.0, 8.0, 6.0, 4.0, 8.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.798828125, -1.741485595703125, -1.68414306640625, -1.626800537109375, -1.5694580078125, -1.512115478515625, -1.45477294921875, -1.397430419921875, -1.340087890625, -1.282745361328125, -1.22540283203125, -1.168060302734375, -1.1107177734375, -1.053375244140625, -0.99603271484375, -0.938690185546875, -0.88134765625, -0.824005126953125, -0.76666259765625, -0.709320068359375, -0.6519775390625, -0.594635009765625, -0.53729248046875, -0.479949951171875, -0.422607421875, -0.365264892578125, -0.30792236328125, -0.250579833984375, -0.1932373046875, -0.135894775390625, -0.07855224609375, -0.021209716796875, 0.0361328125, 0.093475341796875, 0.15081787109375, 0.208160400390625, 0.2655029296875, 0.322845458984375, 0.38018798828125, 0.437530517578125, 0.494873046875, 0.552215576171875, 0.60955810546875, 0.666900634765625, 0.7242431640625, 0.781585693359375, 0.83892822265625, 0.896270751953125, 0.95361328125, 1.010955810546875, 1.06829833984375, 1.125640869140625, 1.1829833984375, 1.240325927734375, 1.29766845703125, 1.355010986328125, 1.412353515625, 1.469696044921875, 1.52703857421875, 1.584381103515625, 1.6417236328125, 1.699066162109375, 1.75640869140625, 1.813751220703125, 1.87109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 13.0, 11.0, 28.0, 30.0, 38.0, 67.0, 122.0, 217.0, 359.0, 630.0, 1178.0, 2118.0, 3801.0, 7072.0, 12673.0, 22808.0, 40823.0, 70476.0, 113660.0, 161513.0, 184121.0, 158634.0, 110589.0, 68758.0, 39339.0, 22102.0, 12159.0, 6785.0, 3725.0, 2026.0, 1143.0, 633.0, 366.0, 197.0, 121.0, 76.0, 41.0, 36.0, 20.0, 14.0, 9.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.223388671875, -0.2165088653564453, -0.20962905883789062, -0.20274925231933594, -0.19586944580078125, -0.18898963928222656, -0.18210983276367188, -0.1752300262451172, -0.1683502197265625, -0.1614704132080078, -0.15459060668945312, -0.14771080017089844, -0.14083099365234375, -0.13395118713378906, -0.12707138061523438, -0.12019157409667969, -0.113311767578125, -0.10643196105957031, -0.09955215454101562, -0.09267234802246094, -0.08579254150390625, -0.07891273498535156, -0.07203292846679688, -0.06515312194824219, -0.0582733154296875, -0.05139350891113281, -0.044513702392578125, -0.03763389587402344, -0.03075408935546875, -0.023874282836914062, -0.016994476318359375, -0.010114669799804688, -0.00323486328125, 0.0036449432373046875, 0.010524749755859375, 0.017404556274414062, 0.02428436279296875, 0.031164169311523438, 0.038043975830078125, 0.04492378234863281, 0.0518035888671875, 0.05868339538574219, 0.06556320190429688, 0.07244300842285156, 0.07932281494140625, 0.08620262145996094, 0.09308242797851562, 0.09996223449707031, 0.106842041015625, 0.11372184753417969, 0.12060165405273438, 0.12748146057128906, 0.13436126708984375, 0.14124107360839844, 0.14812088012695312, 0.1550006866455078, 0.1618804931640625, 0.1687602996826172, 0.17564010620117188, 0.18251991271972656, 0.18939971923828125, 0.19627952575683594, 0.20315933227539062, 0.2100391387939453, 0.2169189453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 15.0, 13.0, 11.0, 14.0, 15.0, 20.0, 18.0, 37.0, 27.0, 32.0, 36.0, 42.0, 37.0, 40.0, 65.0, 45.0, 39.0, 32.0, 43.0, 42.0, 40.0, 31.0, 41.0, 24.0, 31.0, 27.0, 18.0, 27.0, 21.0, 17.0, 17.0, 9.0, 9.0, 9.0, 4.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.82421875, -4.67926025390625, -4.5343017578125, -4.38934326171875, -4.244384765625, -4.09942626953125, -3.9544677734375, -3.80950927734375, -3.66455078125, -3.51959228515625, -3.3746337890625, -3.22967529296875, -3.084716796875, -2.93975830078125, -2.7947998046875, -2.64984130859375, -2.5048828125, -2.35992431640625, -2.2149658203125, -2.07000732421875, -1.925048828125, -1.78009033203125, -1.6351318359375, -1.49017333984375, -1.34521484375, -1.20025634765625, -1.0552978515625, -0.91033935546875, -0.765380859375, -0.62042236328125, -0.4754638671875, -0.33050537109375, -0.185546875, -0.04058837890625, 0.1043701171875, 0.24932861328125, 0.394287109375, 0.53924560546875, 0.6842041015625, 0.82916259765625, 0.97412109375, 1.11907958984375, 1.2640380859375, 1.40899658203125, 1.553955078125, 1.69891357421875, 1.8438720703125, 1.98883056640625, 2.1337890625, 2.27874755859375, 2.4237060546875, 2.56866455078125, 2.713623046875, 2.85858154296875, 3.0035400390625, 3.14849853515625, 3.29345703125, 3.43841552734375, 3.5833740234375, 3.72833251953125, 3.873291015625, 4.01824951171875, 4.1632080078125, 4.30816650390625, 4.453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 10.0, 13.0, 22.0, 23.0, 48.0, 84.0, 72.0, 187.0, 238.0, 401.0, 746.0, 1557.0, 4255.0, 19083.0, 202596.0, 737334.0, 66700.0, 9524.0, 2923.0, 1186.0, 596.0, 339.0, 214.0, 121.0, 73.0, 58.0, 51.0, 27.0, 15.0, 15.0, 15.0, 11.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.2429656982421875, -0.235443115234375, -0.2279205322265625, -0.22039794921875, -0.2128753662109375, -0.205352783203125, -0.1978302001953125, -0.1903076171875, -0.1827850341796875, -0.175262451171875, -0.1677398681640625, -0.16021728515625, -0.1526947021484375, -0.145172119140625, -0.1376495361328125, -0.130126953125, -0.1226043701171875, -0.115081787109375, -0.1075592041015625, -0.10003662109375, -0.0925140380859375, -0.084991455078125, -0.0774688720703125, -0.0699462890625, -0.0624237060546875, -0.054901123046875, -0.0473785400390625, -0.03985595703125, -0.0323333740234375, -0.024810791015625, -0.0172882080078125, -0.009765625, -0.0022430419921875, 0.005279541015625, 0.0128021240234375, 0.02032470703125, 0.0278472900390625, 0.035369873046875, 0.0428924560546875, 0.0504150390625, 0.0579376220703125, 0.065460205078125, 0.0729827880859375, 0.08050537109375, 0.0880279541015625, 0.095550537109375, 0.1030731201171875, 0.110595703125, 0.1181182861328125, 0.125640869140625, 0.1331634521484375, 0.14068603515625, 0.1482086181640625, 0.155731201171875, 0.1632537841796875, 0.1707763671875, 0.1782989501953125, 0.185821533203125, 0.1933441162109375, 0.20086669921875, 0.2083892822265625, 0.215911865234375, 0.2234344482421875, 0.23095703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 10.0, 17.0, 27.0, 37.0, 56.0, 80.0, 109.0, 142.0, 144.0, 118.0, 88.0, 60.0, 42.0, 25.0, 16.0, 13.0, 8.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265806198120117e-05, -6.923172622919083e-05, -6.580539047718048e-05, -6.237905472517014e-05, -5.895271897315979e-05, -5.5526383221149445e-05, -5.21000474691391e-05, -4.8673711717128754e-05, -4.524737596511841e-05, -4.182104021310806e-05, -3.839470446109772e-05, -3.496836870908737e-05, -3.1542032957077026e-05, -2.811569720506668e-05, -2.4689361453056335e-05, -2.126302570104599e-05, -1.7836689949035645e-05, -1.4410354197025299e-05, -1.0984018445014954e-05, -7.557682693004608e-06, -4.131346940994263e-06, -7.050111889839172e-07, 2.7213245630264282e-06, 6.147660315036774e-06, 9.573996067047119e-06, 1.3000331819057465e-05, 1.642666757106781e-05, 1.9853003323078156e-05, 2.32793390750885e-05, 2.6705674827098846e-05, 3.0132010579109192e-05, 3.355834633111954e-05, 3.698468208312988e-05, 4.041101783514023e-05, 4.3837353587150574e-05, 4.726368933916092e-05, 5.0690025091171265e-05, 5.411636084318161e-05, 5.7542696595191956e-05, 6.09690323472023e-05, 6.439536809921265e-05, 6.782170385122299e-05, 7.124803960323334e-05, 7.467437535524368e-05, 7.810071110725403e-05, 8.152704685926437e-05, 8.495338261127472e-05, 8.837971836328506e-05, 9.180605411529541e-05, 9.523238986730576e-05, 9.86587256193161e-05, 0.00010208506137132645, 0.00010551139712333679, 0.00010893773287534714, 0.00011236406862735748, 0.00011579040437936783, 0.00011921674013137817, 0.00012264307588338852, 0.00012606941163539886, 0.0001294957473874092, 0.00013292208313941956, 0.0001363484188914299, 0.00013977475464344025, 0.0001432010903954506, 0.00014662742614746094]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 9.0, 5.0, 6.0, 7.0, 7.0, 18.0, 21.0, 30.0, 55.0, 57.0, 115.0, 193.0, 242.0, 390.0, 689.0, 1140.0, 1895.0, 3168.0, 5670.0, 10209.0, 19095.0, 39434.0, 95111.0, 361814.0, 337072.0, 90741.0, 38368.0, 19040.0, 10137.0, 5647.0, 3215.0, 1938.0, 1101.0, 697.0, 420.0, 283.0, 165.0, 113.0, 75.0, 52.0, 27.0, 22.0, 15.0, 10.0, 4.0, 7.0, 5.0, 5.0, 6.0, 0.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1290283203125, -0.1248626708984375, -0.120697021484375, -0.1165313720703125, -0.11236572265625, -0.1082000732421875, -0.104034423828125, -0.0998687744140625, -0.095703125, -0.0915374755859375, -0.087371826171875, -0.0832061767578125, -0.07904052734375, -0.0748748779296875, -0.070709228515625, -0.0665435791015625, -0.0623779296875, -0.0582122802734375, -0.054046630859375, -0.0498809814453125, -0.04571533203125, -0.0415496826171875, -0.037384033203125, -0.0332183837890625, -0.029052734375, -0.0248870849609375, -0.020721435546875, -0.0165557861328125, -0.01239013671875, -0.0082244873046875, -0.004058837890625, 0.0001068115234375, 0.0042724609375, 0.0084381103515625, 0.012603759765625, 0.0167694091796875, 0.02093505859375, 0.0251007080078125, 0.029266357421875, 0.0334320068359375, 0.03759765625, 0.0417633056640625, 0.045928955078125, 0.0500946044921875, 0.05426025390625, 0.0584259033203125, 0.062591552734375, 0.0667572021484375, 0.0709228515625, 0.0750885009765625, 0.079254150390625, 0.0834197998046875, 0.08758544921875, 0.0917510986328125, 0.095916748046875, 0.1000823974609375, 0.104248046875, 0.1084136962890625, 0.112579345703125, 0.1167449951171875, 0.12091064453125, 0.1250762939453125, 0.129241943359375, 0.1334075927734375, 0.1375732421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 6.0, 5.0, 6.0, 6.0, 4.0, 13.0, 5.0, 12.0, 18.0, 26.0, 35.0, 41.0, 37.0, 49.0, 67.0, 102.0, 133.0, 94.0, 60.0, 42.0, 39.0, 29.0, 23.0, 23.0, 23.0, 20.0, 14.0, 7.0, 8.0, 13.0, 2.0, 5.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.05609130859375, -0.054302215576171875, -0.05251312255859375, -0.050724029541015625, -0.0489349365234375, -0.047145843505859375, -0.04535675048828125, -0.043567657470703125, -0.041778564453125, -0.039989471435546875, -0.03820037841796875, -0.036411285400390625, -0.0346221923828125, -0.032833099365234375, -0.03104400634765625, -0.029254913330078125, -0.0274658203125, -0.025676727294921875, -0.02388763427734375, -0.022098541259765625, -0.0203094482421875, -0.018520355224609375, -0.01673126220703125, -0.014942169189453125, -0.013153076171875, -0.011363983154296875, -0.00957489013671875, -0.007785797119140625, -0.0059967041015625, -0.004207611083984375, -0.00241851806640625, -0.000629425048828125, 0.00115966796875, 0.002948760986328125, 0.00473785400390625, 0.006526947021484375, 0.0083160400390625, 0.010105133056640625, 0.01189422607421875, 0.013683319091796875, 0.015472412109375, 0.017261505126953125, 0.01905059814453125, 0.020839691162109375, 0.0226287841796875, 0.024417877197265625, 0.02620697021484375, 0.027996063232421875, 0.02978515625, 0.031574249267578125, 0.03336334228515625, 0.035152435302734375, 0.0369415283203125, 0.038730621337890625, 0.04051971435546875, 0.042308807373046875, 0.044097900390625, 0.045886993408203125, 0.04767608642578125, 0.049465179443359375, 0.0512542724609375, 0.053043365478515625, 0.05483245849609375, 0.056621551513671875, 0.05841064453125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 2.0, 10.0, 2.0, 12.0, 16.0, 13.0, 16.0, 28.0, 19.0, 35.0, 27.0, 49.0, 50.0, 33.0, 40.0, 50.0, 57.0, 47.0, 56.0, 48.0, 59.0, 49.0, 35.0, 35.0, 34.0, 26.0, 32.0, 17.0, 25.0, 11.0, 19.0, 8.0, 8.0, 12.0, 6.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3707630634307861, -1.3151752948760986, -1.2595875263214111, -1.2039998769760132, -1.1484121084213257, -1.0928243398666382, -1.0372365713119507, -0.981648862361908, -0.9260611534118652, -0.8704733848571777, -0.814885675907135, -0.7592979073524475, -0.7037101984024048, -0.6481224298477173, -0.5925346612930298, -0.5369469523429871, -0.48135918378829956, -0.42577144503593445, -0.37018370628356934, -0.31459593772888184, -0.2590082287788391, -0.2034204602241516, -0.1478327214717865, -0.09224498271942139, -0.036657243967056274, 0.018930498510599136, 0.07451824098825455, 0.13010598719120026, 0.18569372594356537, 0.24128147959709167, 0.2968692183494568, 0.3524569571018219, 0.408044695854187, 0.4636324346065521, 0.5192201733589172, 0.5748079419136047, 0.6303956508636475, 0.685983419418335, 0.7415711879730225, 0.7971588969230652, 0.8527466058731079, 0.9083343744277954, 0.9639220833778381, 1.0195097923278809, 1.0750975608825684, 1.1306853294372559, 1.1862730979919434, 1.2418608665466309, 1.2974486351013184, 1.3530364036560059, 1.4086241722106934, 1.4642118215560913, 1.5197995901107788, 1.5753873586654663, 1.6309751272201538, 1.6865627765655518, 1.7421505451202393, 1.7977383136749268, 1.8533260822296143, 1.9089137315750122, 1.9645015001296997, 2.0200891494750977, 2.075676918029785, 2.1312646865844727, 2.18685245513916]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 6.0, 9.0, 7.0, 12.0, 16.0, 13.0, 18.0, 12.0, 20.0, 19.0, 22.0, 33.0, 28.0, 29.0, 35.0, 42.0, 37.0, 40.0, 42.0, 45.0, 51.0, 42.0, 36.0, 34.0, 38.0, 36.0, 40.0, 29.0, 31.0, 22.0, 29.0, 23.0, 20.0, 13.0, 18.0, 10.0, 15.0, 8.0, 3.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8072359561920166, -1.7508479356765747, -1.6944599151611328, -1.638071894645691, -1.581683874130249, -1.5252959728240967, -1.4689079523086548, -1.412519931793213, -1.356131911277771, -1.299743890762329, -1.2433558702468872, -1.1869678497314453, -1.130579948425293, -1.0741918087005615, -1.0178039073944092, -0.9614158868789673, -0.9050278663635254, -0.8486398458480835, -0.7922518253326416, -0.7358638644218445, -0.6794758439064026, -0.6230878233909607, -0.5666998624801636, -0.5103118419647217, -0.4539238214492798, -0.3975358009338379, -0.3411478102207184, -0.2847598195075989, -0.22837179899215698, -0.1719837784767151, -0.11559578776359558, -0.059207797050476074, -0.0028198957443237305, 0.05356810986995697, 0.10995611548423767, 0.16634412109851837, 0.22273212671279907, 0.27912014722824097, 0.3355081379413605, 0.39189612865448, 0.4482841491699219, 0.5046721696853638, 0.5610601902008057, 0.6174481511116028, 0.6738361716270447, 0.7302241921424866, 0.7866121530532837, 0.8430001735687256, 0.8993881940841675, 0.9557762145996094, 1.0121642351150513, 1.0685522556304932, 1.1249401569366455, 1.181328296661377, 1.2377161979675293, 1.2941042184829712, 1.350492238998413, 1.406880259513855, 1.4632682800292969, 1.5196563005447388, 1.5760443210601807, 1.632432222366333, 1.688820242881775, 1.7452082633972168, 1.8015962839126587]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 14.0, 16.0, 24.0, 27.0, 35.0, 66.0, 95.0, 166.0, 258.0, 388.0, 612.0, 1220.0, 2263.0, 4710.0, 9956.0, 21149.0, 47453.0, 103005.0, 196687.0, 264482.0, 198857.0, 106182.0, 48852.0, 21976.0, 10016.0, 4685.0, 2356.0, 1181.0, 644.0, 418.0, 254.0, 156.0, 103.0, 60.0, 59.0, 32.0, 25.0, 19.0, 9.0, 7.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.546875, -2.466064453125, -2.38525390625, -2.304443359375, -2.2236328125, -2.142822265625, -2.06201171875, -1.981201171875, -1.900390625, -1.819580078125, -1.73876953125, -1.657958984375, -1.5771484375, -1.496337890625, -1.41552734375, -1.334716796875, -1.25390625, -1.173095703125, -1.09228515625, -1.011474609375, -0.9306640625, -0.849853515625, -0.76904296875, -0.688232421875, -0.607421875, -0.526611328125, -0.44580078125, -0.364990234375, -0.2841796875, -0.203369140625, -0.12255859375, -0.041748046875, 0.0390625, 0.119873046875, 0.20068359375, 0.281494140625, 0.3623046875, 0.443115234375, 0.52392578125, 0.604736328125, 0.685546875, 0.766357421875, 0.84716796875, 0.927978515625, 1.0087890625, 1.089599609375, 1.17041015625, 1.251220703125, 1.33203125, 1.412841796875, 1.49365234375, 1.574462890625, 1.6552734375, 1.736083984375, 1.81689453125, 1.897705078125, 1.978515625, 2.059326171875, 2.14013671875, 2.220947265625, 2.3017578125, 2.382568359375, 2.46337890625, 2.544189453125, 2.625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 10.0, 4.0, 6.0, 8.0, 8.0, 6.0, 12.0, 16.0, 22.0, 16.0, 35.0, 36.0, 32.0, 32.0, 43.0, 38.0, 33.0, 53.0, 47.0, 65.0, 56.0, 46.0, 48.0, 47.0, 50.0, 40.0, 37.0, 29.0, 19.0, 21.0, 25.0, 22.0, 12.0, 6.0, 9.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.68359375, -3.5738525390625, -3.464111328125, -3.3543701171875, -3.24462890625, -3.1348876953125, -3.025146484375, -2.9154052734375, -2.8056640625, -2.6959228515625, -2.586181640625, -2.4764404296875, -2.36669921875, -2.2569580078125, -2.147216796875, -2.0374755859375, -1.927734375, -1.8179931640625, -1.708251953125, -1.5985107421875, -1.48876953125, -1.3790283203125, -1.269287109375, -1.1595458984375, -1.0498046875, -0.9400634765625, -0.830322265625, -0.7205810546875, -0.61083984375, -0.5010986328125, -0.391357421875, -0.2816162109375, -0.171875, -0.0621337890625, 0.047607421875, 0.1573486328125, 0.26708984375, 0.3768310546875, 0.486572265625, 0.5963134765625, 0.7060546875, 0.8157958984375, 0.925537109375, 1.0352783203125, 1.14501953125, 1.2547607421875, 1.364501953125, 1.4742431640625, 1.583984375, 1.6937255859375, 1.803466796875, 1.9132080078125, 2.02294921875, 2.1326904296875, 2.242431640625, 2.3521728515625, 2.4619140625, 2.5716552734375, 2.681396484375, 2.7911376953125, 2.90087890625, 3.0106201171875, 3.120361328125, 3.2301025390625, 3.33984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 11.0, 5.0, 13.0, 12.0, 24.0, 32.0, 43.0, 57.0, 101.0, 159.0, 252.0, 438.0, 943.0, 2587.0, 8961.0, 34049.0, 140279.0, 439860.0, 312711.0, 79956.0, 19348.0, 5328.0, 1768.0, 672.0, 328.0, 217.0, 119.0, 81.0, 61.0, 31.0, 28.0, 12.0, 16.0, 10.0, 9.0, 14.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6953125, -4.53228759765625, -4.3692626953125, -4.20623779296875, -4.043212890625, -3.88018798828125, -3.7171630859375, -3.55413818359375, -3.39111328125, -3.22808837890625, -3.0650634765625, -2.90203857421875, -2.739013671875, -2.57598876953125, -2.4129638671875, -2.24993896484375, -2.0869140625, -1.92388916015625, -1.7608642578125, -1.59783935546875, -1.434814453125, -1.27178955078125, -1.1087646484375, -0.94573974609375, -0.78271484375, -0.61968994140625, -0.4566650390625, -0.29364013671875, -0.130615234375, 0.03240966796875, 0.1954345703125, 0.35845947265625, 0.521484375, 0.68450927734375, 0.8475341796875, 1.01055908203125, 1.173583984375, 1.33660888671875, 1.4996337890625, 1.66265869140625, 1.82568359375, 1.98870849609375, 2.1517333984375, 2.31475830078125, 2.477783203125, 2.64080810546875, 2.8038330078125, 2.96685791015625, 3.1298828125, 3.29290771484375, 3.4559326171875, 3.61895751953125, 3.781982421875, 3.94500732421875, 4.1080322265625, 4.27105712890625, 4.43408203125, 4.59710693359375, 4.7601318359375, 4.92315673828125, 5.086181640625, 5.24920654296875, 5.4122314453125, 5.57525634765625, 5.73828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 4.0, 5.0, 7.0, 5.0, 11.0, 22.0, 15.0, 14.0, 27.0, 34.0, 27.0, 27.0, 33.0, 38.0, 45.0, 53.0, 46.0, 49.0, 76.0, 50.0, 49.0, 49.0, 46.0, 36.0, 30.0, 28.0, 24.0, 20.0, 17.0, 20.0, 9.0, 16.0, 14.0, 7.0, 10.0, 8.0, 6.0, 0.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.396484375, -3.285430908203125, -3.17437744140625, -3.063323974609375, -2.9522705078125, -2.841217041015625, -2.73016357421875, -2.619110107421875, -2.508056640625, -2.397003173828125, -2.28594970703125, -2.174896240234375, -2.0638427734375, -1.952789306640625, -1.84173583984375, -1.730682373046875, -1.61962890625, -1.508575439453125, -1.39752197265625, -1.286468505859375, -1.1754150390625, -1.064361572265625, -0.95330810546875, -0.842254638671875, -0.731201171875, -0.620147705078125, -0.50909423828125, -0.398040771484375, -0.2869873046875, -0.175933837890625, -0.06488037109375, 0.046173095703125, 0.1572265625, 0.268280029296875, 0.37933349609375, 0.490386962890625, 0.6014404296875, 0.712493896484375, 0.82354736328125, 0.934600830078125, 1.045654296875, 1.156707763671875, 1.26776123046875, 1.378814697265625, 1.4898681640625, 1.600921630859375, 1.71197509765625, 1.823028564453125, 1.93408203125, 2.045135498046875, 2.15618896484375, 2.267242431640625, 2.3782958984375, 2.489349365234375, 2.60040283203125, 2.711456298828125, 2.822509765625, 2.933563232421875, 3.04461669921875, 3.155670166015625, 3.2667236328125, 3.377777099609375, 3.48883056640625, 3.599884033203125, 3.7109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 9.0, 20.0, 39.0, 57.0, 105.0, 198.0, 417.0, 770.0, 1915.0, 5031.0, 15154.0, 53578.0, 191026.0, 449573.0, 233293.0, 68266.0, 18931.0, 6065.0, 2278.0, 960.0, 426.0, 195.0, 100.0, 57.0, 29.0, 21.0, 16.0, 7.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.1845703125, -1.1560897827148438, -1.1276092529296875, -1.0991287231445312, -1.070648193359375, -1.0421676635742188, -1.0136871337890625, -0.9852066040039062, -0.95672607421875, -0.9282455444335938, -0.8997650146484375, -0.8712844848632812, -0.842803955078125, -0.8143234252929688, -0.7858428955078125, -0.7573623657226562, -0.7288818359375, -0.7004013061523438, -0.6719207763671875, -0.6434402465820312, -0.614959716796875, -0.5864791870117188, -0.5579986572265625, -0.5295181274414062, -0.50103759765625, -0.47255706787109375, -0.4440765380859375, -0.41559600830078125, -0.387115478515625, -0.35863494873046875, -0.3301544189453125, -0.30167388916015625, -0.273193359375, -0.24471282958984375, -0.2162322998046875, -0.18775177001953125, -0.159271240234375, -0.13079071044921875, -0.1023101806640625, -0.07382965087890625, -0.04534912109375, -0.01686859130859375, 0.0116119384765625, 0.04009246826171875, 0.068572998046875, 0.09705352783203125, 0.1255340576171875, 0.15401458740234375, 0.1824951171875, 0.21097564697265625, 0.2394561767578125, 0.26793670654296875, 0.296417236328125, 0.32489776611328125, 0.3533782958984375, 0.38185882568359375, 0.41033935546875, 0.43881988525390625, 0.4673004150390625, 0.49578094482421875, 0.524261474609375, 0.5527420043945312, 0.5812225341796875, 0.6097030639648438, 0.63818359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 8.0, 9.0, 10.0, 14.0, 13.0, 13.0, 20.0, 31.0, 34.0, 56.0, 60.0, 68.0, 87.0, 157.0, 86.0, 57.0, 48.0, 36.0, 36.0, 39.0, 21.0, 27.0, 12.0, 9.0, 11.0, 11.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.00018262863159179688, -0.00017763115465641022, -0.00017263367772102356, -0.0001676362007856369, -0.00016263872385025024, -0.00015764124691486359, -0.00015264376997947693, -0.00014764629304409027, -0.0001426488161087036, -0.00013765133917331696, -0.0001326538622379303, -0.00012765638530254364, -0.00012265890836715698, -0.00011766143143177032, -0.00011266395449638367, -0.00010766647756099701, -0.00010266900062561035, -9.76715236902237e-05, -9.267404675483704e-05, -8.767656981945038e-05, -8.267909288406372e-05, -7.768161594867706e-05, -7.26841390132904e-05, -6.768666207790375e-05, -6.268918514251709e-05, -5.769170820713043e-05, -5.2694231271743774e-05, -4.769675433635712e-05, -4.269927740097046e-05, -3.77018004655838e-05, -3.2704323530197144e-05, -2.7706846594810486e-05, -2.2709369659423828e-05, -1.771189272403717e-05, -1.2714415788650513e-05, -7.716938853263855e-06, -2.7194619178771973e-06, 2.2780150175094604e-06, 7.275491952896118e-06, 1.2272968888282776e-05, 1.7270445823669434e-05, 2.226792275905609e-05, 2.726539969444275e-05, 3.226287662982941e-05, 3.7260353565216064e-05, 4.225783050060272e-05, 4.725530743598938e-05, 5.225278437137604e-05, 5.7250261306762695e-05, 6.224773824214935e-05, 6.724521517753601e-05, 7.224269211292267e-05, 7.724016904830933e-05, 8.223764598369598e-05, 8.723512291908264e-05, 9.22325998544693e-05, 9.723007678985596e-05, 0.00010222755372524261, 0.00010722503066062927, 0.00011222250759601593, 0.00011721998453140259, 0.00012221746146678925, 0.0001272149384021759, 0.00013221241533756256, 0.00013720989227294922]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 5.0, 11.0, 23.0, 35.0, 44.0, 71.0, 95.0, 145.0, 253.0, 393.0, 635.0, 1129.0, 2044.0, 3851.0, 8575.0, 23549.0, 80378.0, 268507.0, 440783.0, 149781.0, 42478.0, 13715.0, 5664.0, 2728.0, 1443.0, 785.0, 521.0, 316.0, 218.0, 123.0, 84.0, 50.0, 39.0, 30.0, 22.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -1.002105712890625, -0.97003173828125, -0.937957763671875, -0.9058837890625, -0.873809814453125, -0.84173583984375, -0.809661865234375, -0.777587890625, -0.745513916015625, -0.71343994140625, -0.681365966796875, -0.6492919921875, -0.617218017578125, -0.58514404296875, -0.553070068359375, -0.52099609375, -0.488922119140625, -0.45684814453125, -0.424774169921875, -0.3927001953125, -0.360626220703125, -0.32855224609375, -0.296478271484375, -0.264404296875, -0.232330322265625, -0.20025634765625, -0.168182373046875, -0.1361083984375, -0.104034423828125, -0.07196044921875, -0.039886474609375, -0.0078125, 0.024261474609375, 0.05633544921875, 0.088409423828125, 0.1204833984375, 0.152557373046875, 0.18463134765625, 0.216705322265625, 0.248779296875, 0.280853271484375, 0.31292724609375, 0.345001220703125, 0.3770751953125, 0.409149169921875, 0.44122314453125, 0.473297119140625, 0.50537109375, 0.537445068359375, 0.56951904296875, 0.601593017578125, 0.6336669921875, 0.665740966796875, 0.69781494140625, 0.729888916015625, 0.761962890625, 0.794036865234375, 0.82611083984375, 0.858184814453125, 0.8902587890625, 0.922332763671875, 0.95440673828125, 0.986480712890625, 1.0185546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 11.0, 18.0, 28.0, 37.0, 59.0, 98.0, 100.0, 154.0, 135.0, 85.0, 64.0, 62.0, 41.0, 35.0, 14.0, 12.0, 13.0, 6.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53564453125, -0.5100173950195312, -0.4843902587890625, -0.45876312255859375, -0.433135986328125, -0.40750885009765625, -0.3818817138671875, -0.35625457763671875, -0.33062744140625, -0.30500030517578125, -0.2793731689453125, -0.25374603271484375, -0.228118896484375, -0.20249176025390625, -0.1768646240234375, -0.15123748779296875, -0.1256103515625, -0.09998321533203125, -0.0743560791015625, -0.04872894287109375, -0.023101806640625, 0.00252532958984375, 0.0281524658203125, 0.05377960205078125, 0.07940673828125, 0.10503387451171875, 0.1306610107421875, 0.15628814697265625, 0.181915283203125, 0.20754241943359375, 0.2331695556640625, 0.25879669189453125, 0.284423828125, 0.31005096435546875, 0.3356781005859375, 0.36130523681640625, 0.386932373046875, 0.41255950927734375, 0.4381866455078125, 0.46381378173828125, 0.48944091796875, 0.5150680541992188, 0.5406951904296875, 0.5663223266601562, 0.591949462890625, 0.6175765991210938, 0.6432037353515625, 0.6688308715820312, 0.6944580078125, 0.7200851440429688, 0.7457122802734375, 0.7713394165039062, 0.796966552734375, 0.8225936889648438, 0.8482208251953125, 0.8738479614257812, 0.89947509765625, 0.9251022338867188, 0.9507293701171875, 0.9763565063476562, 1.001983642578125, 1.0276107788085938, 1.0532379150390625, 1.0788650512695312, 1.1044921875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 11.0, 20.0, 15.0, 32.0, 56.0, 72.0, 85.0, 84.0, 105.0, 94.0, 109.0, 90.0, 64.0, 52.0, 37.0, 26.0, 17.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-9.922094345092773, -9.714754104614258, -9.507413864135742, -9.300073623657227, -9.092733383178711, -8.885393142700195, -8.67805290222168, -8.470712661743164, -8.263372421264648, -8.056032180786133, -7.848691940307617, -7.641351699829102, -7.434011459350586, -7.22667121887207, -7.019330978393555, -6.811990737915039, -6.604650497436523, -6.397310256958008, -6.189970016479492, -5.982629776000977, -5.775289535522461, -5.567949295043945, -5.36060905456543, -5.153268814086914, -4.945929050445557, -4.738588809967041, -4.531248569488525, -4.32390832901001, -4.116568088531494, -3.9092278480529785, -3.701887607574463, -3.4945473670959473, -3.2872071266174316, -3.079866886138916, -2.8725266456604004, -2.6651864051818848, -2.457846164703369, -2.2505059242248535, -2.043165683746338, -1.8358255624771118, -1.6284853219985962, -1.4211450815200806, -1.213804841041565, -1.0064647197723389, -0.7991244196891785, -0.5917842388153076, -0.384443998336792, -0.17710375785827637, 0.030236482620239258, 0.2375767081975937, 0.4449169337749481, 0.6522571444511414, 0.859597384929657, 1.0669375658035278, 1.2742778062820435, 1.481618046760559, 1.6889582872390747, 1.8962985277175903, 2.1036386489868164, 2.310978889465332, 2.5183191299438477, 2.7256593704223633, 2.932999610900879, 3.1403398513793945, 3.34768009185791]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 12.0, 10.0, 13.0, 7.0, 10.0, 14.0, 30.0, 29.0, 25.0, 27.0, 29.0, 29.0, 42.0, 31.0, 44.0, 42.0, 38.0, 45.0, 51.0, 41.0, 35.0, 33.0, 29.0, 37.0, 35.0, 36.0, 33.0, 25.0, 15.0, 17.0, 16.0, 25.0, 16.0, 14.0, 16.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.669668197631836, -5.494604110717773, -5.319540500640869, -5.144476413726807, -4.969412326812744, -4.79434871673584, -4.619284629821777, -4.444220542907715, -4.269156455993652, -4.09409236907959, -3.9190285205841064, -3.743964672088623, -3.5689005851745605, -3.393836736679077, -3.2187728881835938, -3.0437088012695312, -2.868645191192627, -2.6935813426971436, -2.518517255783081, -2.3434534072875977, -2.168389320373535, -1.9933254718780518, -1.8182616233825684, -1.6431976556777954, -1.4681336879730225, -1.2930697202682495, -1.1180057525634766, -0.9429419040679932, -0.7678779363632202, -0.5928139686584473, -0.41775012016296387, -0.24268615245819092, -0.06762218475341797, 0.10744175314903259, 0.28250569105148315, 0.45756959915161133, 0.6326335668563843, 0.8076975345611572, 0.9827613830566406, 1.1578253507614136, 1.3328893184661865, 1.5079532861709595, 1.6830172538757324, 1.8580811023712158, 2.033144950866699, 2.2082090377807617, 2.383272886276245, 2.5583367347717285, 2.733400821685791, 2.9084646701812744, 3.083528757095337, 3.2585926055908203, 3.433656692504883, 3.608720541000366, 3.7837843894958496, 3.958848476409912, 4.133912086486816, 4.308976173400879, 4.484039783477783, 4.659103870391846, 4.834167957305908, 5.0092315673828125, 5.184295654296875, 5.3593597412109375, 5.534423828125]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 9.0, 8.0, 13.0, 19.0, 23.0, 26.0, 46.0, 67.0, 68.0, 112.0, 162.0, 184.0, 319.0, 450.0, 647.0, 917.0, 1361.0, 2064.0, 3046.0, 4385.0, 6128.0, 1014167.0, 5252.0, 3486.0, 2458.0, 1596.0, 1081.0, 727.0, 543.0, 364.0, 237.0, 168.0, 122.0, 105.0, 68.0, 47.0, 28.0, 22.0, 22.0, 21.0, 12.0, 8.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.356604099273682, -5.200021266937256, -5.04343843460083, -4.8868560791015625, -4.730273246765137, -4.573690414428711, -4.417107582092285, -4.260524749755859, -4.103941917419434, -3.947359085083008, -3.790776491165161, -3.6341936588287354, -3.4776110649108887, -3.321028232574463, -3.164445400238037, -3.0078625679016113, -2.8512802124023438, -2.694697380065918, -2.5381147861480713, -2.3815319538116455, -2.224949359893799, -2.068366527557373, -1.9117836952209473, -1.755200982093811, -1.5986182689666748, -1.4420355558395386, -1.2854528427124023, -1.1288700103759766, -0.9722872972488403, -0.8157045841217041, -0.6591218113899231, -0.5025390386581421, -0.34595584869384766, -0.18937310576438904, -0.03279036283493042, 0.1237923800945282, 0.2803751230239868, 0.43695783615112305, 0.593540608882904, 0.7501233816146851, 0.9067060947418213, 1.0632888078689575, 1.2198715209960938, 1.3764543533325195, 1.5330370664596558, 1.689619779586792, 1.8462026119232178, 2.0027852058410645, 2.1593680381774902, 2.315950870513916, 2.4725334644317627, 2.6291162967681885, 2.785698890686035, 2.942281723022461, 3.0988645553588867, 3.2554473876953125, 3.412029981613159, 3.568612813949585, 3.7251954078674316, 3.8817782402038574, 4.038361072540283, 4.194943428039551, 4.351526260375977, 4.508109092712402, 4.664691925048828]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 12.0, 12.0, 33.0, 62.0, 91.0, 177.0, 402.0, 1098.0, 3886.0, 19816.0, 51054424.0, 360975.0, 23030.0, 4727.0, 1152.0, 400.0, 192.0, 101.0, 54.0, 36.0, 25.0, 18.0, 17.0, 10.0, 9.0, 9.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.578125, -21.893598556518555, -21.209070205688477, -20.52454376220703, -19.840017318725586, -19.15549087524414, -18.470962524414062, -17.786436080932617, -17.101909637451172, -16.417383193969727, -15.732855796813965, -15.048328399658203, -14.363801956176758, -13.679274559020996, -12.994747161865234, -12.310220718383789, -11.625692367553711, -10.94116497039795, -10.256638526916504, -9.572111129760742, -8.887584686279297, -8.203057289123535, -7.518529891967773, -6.83400297164917, -6.149476051330566, -5.464949131011963, -4.780422210693359, -4.095894813537598, -3.411367893218994, -2.7268409729003906, -2.042313575744629, -1.3577866554260254, -0.6732616424560547, 0.011265397071838379, 0.6957924365997314, 1.380319595336914, 2.0648465156555176, 2.749373435974121, 3.433900833129883, 4.118427753448486, 4.80295467376709, 5.487481594085693, 6.172008514404297, 6.856535911560059, 7.541062831878662, 8.225589752197266, 8.910117149353027, 9.594644546508789, 10.279170989990234, 10.963698387145996, 11.648224830627441, 12.332752227783203, 13.017278671264648, 13.70180606842041, 14.386333465576172, 15.070859909057617, 15.755387306213379, 16.43991470336914, 17.124441146850586, 17.80896759033203, 18.49349594116211, 19.178022384643555, 19.862548828125, 20.547077178955078, 21.231603622436523]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 0.0, 3.0, 8.0, 7.0, 14.0, 29.0, 38.0, 58.0, 84.0, 179.0, 240.0, 413.0, 668.0, 992.0, 1668.0, 2665.0, 4456.0, 7385.0, 12070.0, 19861.0, 32954.0, 52972.0, 85209.0, 131278.0, 195884.0, 274241.0, 352376.0, 2214180.0, 1737724.0, 350106.0, 271839.0, 193038.0, 129204.0, 83484.0, 52256.0, 32472.0, 20165.0, 11994.0, 7600.0, 4446.0, 2784.0, 1664.0, 1045.0, 634.0, 394.0, 264.0, 151.0, 85.0, 59.0, 43.0, 20.0, 23.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.0751953125, -1.0415802001953125, -1.007965087890625, -0.9743499755859375, -0.94073486328125, -0.9071197509765625, -0.873504638671875, -0.8398895263671875, -0.8062744140625, -0.7726593017578125, -0.739044189453125, -0.7054290771484375, -0.67181396484375, -0.6381988525390625, -0.604583740234375, -0.5709686279296875, -0.537353515625, -0.5037384033203125, -0.470123291015625, -0.4365081787109375, -0.40289306640625, -0.3692779541015625, -0.335662841796875, -0.3020477294921875, -0.2684326171875, -0.2348175048828125, -0.201202392578125, -0.1675872802734375, -0.13397216796875, -0.1003570556640625, -0.066741943359375, -0.0331268310546875, 0.00048828125, 0.0341033935546875, 0.067718505859375, 0.1013336181640625, 0.13494873046875, 0.1685638427734375, 0.202178955078125, 0.2357940673828125, 0.2694091796875, 0.3030242919921875, 0.336639404296875, 0.3702545166015625, 0.40386962890625, 0.4374847412109375, 0.471099853515625, 0.5047149658203125, 0.538330078125, 0.5719451904296875, 0.605560302734375, 0.6391754150390625, 0.67279052734375, 0.7064056396484375, 0.740020751953125, 0.7736358642578125, 0.8072509765625, 0.8408660888671875, 0.874481201171875, 0.9080963134765625, 0.94171142578125, 0.9753265380859375, 1.008941650390625, 1.0425567626953125, 1.076171875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 3.0, 8.0, 7.0, 16.0, 10.0, 14.0, 13.0, 16.0, 19.0, 22.0, 21.0, 38.0, 32.0, 45.0, 33.0, 35.0, 40.0, 34.0, 45.0, 1069.0, 48.0, 39.0, 35.0, 39.0, 41.0, 48.0, 30.0, 32.0, 28.0, 31.0, 19.0, 18.0, 10.0, 17.0, 11.0, 11.0, 8.0, 10.0, 7.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.171875, -20.501953125, -19.83203125, -19.162109375, -18.4921875, -17.822265625, -17.15234375, -16.482421875, -15.8125, -15.142578125, -14.47265625, -13.802734375, -13.1328125, -12.462890625, -11.79296875, -11.123046875, -10.453125, -9.783203125, -9.11328125, -8.443359375, -7.7734375, -7.103515625, -6.43359375, -5.763671875, -5.09375, -4.423828125, -3.75390625, -3.083984375, -2.4140625, -1.744140625, -1.07421875, -0.404296875, 0.265625, 0.935546875, 1.60546875, 2.275390625, 2.9453125, 3.615234375, 4.28515625, 4.955078125, 5.625, 6.294921875, 6.96484375, 7.634765625, 8.3046875, 8.974609375, 9.64453125, 10.314453125, 10.984375, 11.654296875, 12.32421875, 12.994140625, 13.6640625, 14.333984375, 15.00390625, 15.673828125, 16.34375, 17.013671875, 17.68359375, 18.353515625, 19.0234375, 19.693359375, 20.36328125, 21.033203125, 21.703125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 9.0, 14.0, 28.0, 41.0, 68.0, 122.0, 191.0, 290.0, 533.0, 910.0, 1530.0, 2441.0, 4301.0, 7139.0, 12065.0, 19858.0, 31770.0, 50113.0, 77739.0, 117357.0, 169262.0, 231628.0, 295689.0, 364862.0, 3445359.0, 395785.0, 301765.0, 238808.0, 176560.0, 123434.0, 82247.0, 53530.0, 33673.0, 20562.0, 12654.0, 7668.0, 4664.0, 2670.0, 1625.0, 997.0, 558.0, 366.0, 223.0, 121.0, 93.0, 45.0, 26.0, 18.0, 12.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.994842529296875, -0.96429443359375, -0.933746337890625, -0.9031982421875, -0.872650146484375, -0.84210205078125, -0.811553955078125, -0.781005859375, -0.750457763671875, -0.71990966796875, -0.689361572265625, -0.6588134765625, -0.628265380859375, -0.59771728515625, -0.567169189453125, -0.53662109375, -0.506072998046875, -0.47552490234375, -0.444976806640625, -0.4144287109375, -0.383880615234375, -0.35333251953125, -0.322784423828125, -0.292236328125, -0.261688232421875, -0.23114013671875, -0.200592041015625, -0.1700439453125, -0.139495849609375, -0.10894775390625, -0.078399658203125, -0.0478515625, -0.017303466796875, 0.01324462890625, 0.043792724609375, 0.0743408203125, 0.104888916015625, 0.13543701171875, 0.165985107421875, 0.196533203125, 0.227081298828125, 0.25762939453125, 0.288177490234375, 0.3187255859375, 0.349273681640625, 0.37982177734375, 0.410369873046875, 0.44091796875, 0.471466064453125, 0.50201416015625, 0.532562255859375, 0.5631103515625, 0.593658447265625, 0.62420654296875, 0.654754638671875, 0.685302734375, 0.715850830078125, 0.74639892578125, 0.776947021484375, 0.8074951171875, 0.838043212890625, 0.86859130859375, 0.899139404296875, 0.9296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 4.0, 13.0, 9.0, 10.0, 16.0, 10.0, 19.0, 20.0, 19.0, 19.0, 30.0, 32.0, 33.0, 47.0, 42.0, 39.0, 36.0, 43.0, 928.0, 169.0, 32.0, 51.0, 27.0, 37.0, 30.0, 31.0, 26.0, 25.0, 26.0, 28.0, 31.0, 22.0, 21.0, 17.0, 10.0, 7.0, 10.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.5390625, -13.099365234375, -12.65966796875, -12.219970703125, -11.7802734375, -11.340576171875, -10.90087890625, -10.461181640625, -10.021484375, -9.581787109375, -9.14208984375, -8.702392578125, -8.2626953125, -7.822998046875, -7.38330078125, -6.943603515625, -6.50390625, -6.064208984375, -5.62451171875, -5.184814453125, -4.7451171875, -4.305419921875, -3.86572265625, -3.426025390625, -2.986328125, -2.546630859375, -2.10693359375, -1.667236328125, -1.2275390625, -0.787841796875, -0.34814453125, 0.091552734375, 0.53125, 0.970947265625, 1.41064453125, 1.850341796875, 2.2900390625, 2.729736328125, 3.16943359375, 3.609130859375, 4.048828125, 4.488525390625, 4.92822265625, 5.367919921875, 5.8076171875, 6.247314453125, 6.68701171875, 7.126708984375, 7.56640625, 8.006103515625, 8.44580078125, 8.885498046875, 9.3251953125, 9.764892578125, 10.20458984375, 10.644287109375, 11.083984375, 11.523681640625, 11.96337890625, 12.403076171875, 12.8427734375, 13.282470703125, 13.72216796875, 14.161865234375, 14.6015625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 5.0, 8.0, 11.0, 13.0, 24.0, 36.0, 52.0, 81.0, 90.0, 145.0, 231.0, 356.0, 504.0, 741.0, 1198.0, 1716.0, 2798.0, 4442.0, 7057.0, 11145.0, 17601.0, 27596.0, 43571.0, 67225.0, 106965.0, 5425731.0, 308621.0, 94843.0, 60954.0, 39549.0, 24829.0, 15668.0, 9888.0, 6194.0, 3943.0, 2589.0, 1659.0, 1122.0, 758.0, 478.0, 352.0, 191.0, 128.0, 99.0, 68.0, 51.0, 41.0, 19.0, 20.0, 13.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1015625, -2.02880859375, -1.9560546875, -1.88330078125, -1.810546875, -1.73779296875, -1.6650390625, -1.59228515625, -1.51953125, -1.44677734375, -1.3740234375, -1.30126953125, -1.228515625, -1.15576171875, -1.0830078125, -1.01025390625, -0.9375, -0.86474609375, -0.7919921875, -0.71923828125, -0.646484375, -0.57373046875, -0.5009765625, -0.42822265625, -0.35546875, -0.28271484375, -0.2099609375, -0.13720703125, -0.064453125, 0.00830078125, 0.0810546875, 0.15380859375, 0.2265625, 0.29931640625, 0.3720703125, 0.44482421875, 0.517578125, 0.59033203125, 0.6630859375, 0.73583984375, 0.80859375, 0.88134765625, 0.9541015625, 1.02685546875, 1.099609375, 1.17236328125, 1.2451171875, 1.31787109375, 1.390625, 1.46337890625, 1.5361328125, 1.60888671875, 1.681640625, 1.75439453125, 1.8271484375, 1.89990234375, 1.97265625, 2.04541015625, 2.1181640625, 2.19091796875, 2.263671875, 2.33642578125, 2.4091796875, 2.48193359375, 2.5546875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 9.0, 3.0, 11.0, 13.0, 16.0, 18.0, 22.0, 25.0, 21.0, 29.0, 23.0, 18.0, 20.0, 35.0, 30.0, 49.0, 35.0, 36.0, 135.0, 953.0, 42.0, 48.0, 37.0, 42.0, 41.0, 31.0, 31.0, 28.0, 26.0, 28.0, 20.0, 29.0, 18.0, 21.0, 10.0, 11.0, 11.0, 9.0, 7.0, 5.0, 6.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.25, -10.9312744140625, -10.612548828125, -10.2938232421875, -9.97509765625, -9.6563720703125, -9.337646484375, -9.0189208984375, -8.7001953125, -8.3814697265625, -8.062744140625, -7.7440185546875, -7.42529296875, -7.1065673828125, -6.787841796875, -6.4691162109375, -6.150390625, -5.8316650390625, -5.512939453125, -5.1942138671875, -4.87548828125, -4.5567626953125, -4.238037109375, -3.9193115234375, -3.6005859375, -3.2818603515625, -2.963134765625, -2.6444091796875, -2.32568359375, -2.0069580078125, -1.688232421875, -1.3695068359375, -1.05078125, -0.7320556640625, -0.413330078125, -0.0946044921875, 0.22412109375, 0.5428466796875, 0.861572265625, 1.1802978515625, 1.4990234375, 1.8177490234375, 2.136474609375, 2.4552001953125, 2.77392578125, 3.0926513671875, 3.411376953125, 3.7301025390625, 4.048828125, 4.3675537109375, 4.686279296875, 5.0050048828125, 5.32373046875, 5.6424560546875, 5.961181640625, 6.2799072265625, 6.5986328125, 6.9173583984375, 7.236083984375, 7.5548095703125, 7.87353515625, 8.1922607421875, 8.510986328125, 8.8297119140625, 9.1484375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 14.0, 7.0, 22.0, 58.0, 157.0, 288.0, 236.0, 104.0, 53.0, 31.0, 13.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.218788146972656, -23.16107177734375, -22.103357315063477, -21.04564094543457, -19.987924575805664, -18.93021011352539, -17.872493743896484, -16.814777374267578, -15.757061958312988, -14.699346542358398, -13.641630172729492, -12.583914756774902, -11.526199340820312, -10.468482971191406, -9.410767555236816, -8.353052139282227, -7.29533576965332, -6.237619876861572, -5.179903984069824, -4.122188568115234, -3.0644726753234863, -2.0067567825317383, -0.9490413665771484, 0.10867452621459961, 1.1663904190063477, 2.2241063117980957, 3.2818219661712646, 4.339537620544434, 5.397253513336182, 6.45496940612793, 7.5126848220825195, 8.57040023803711, 9.628116607666016, 10.685832023620605, 11.743548393249512, 12.801263809204102, 13.858980178833008, 14.916695594787598, 15.974411010742188, 17.032127380371094, 18.08984375, 19.147560119628906, 20.20527458190918, 21.262990951538086, 22.320707321166992, 23.378421783447266, 24.436138153076172, 25.493854522705078, 26.55156898498535, 27.609285354614258, 28.66699981689453, 29.724716186523438, 30.782432556152344, 31.84014892578125, 32.897865295410156, 33.9555778503418, 35.0132942199707, 36.07101058959961, 37.128726959228516, 38.186439514160156, 39.24415588378906, 40.30187225341797, 41.359588623046875, 42.41730499267578, 43.47502136230469]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 12.0, 4.0, 10.0, 11.0, 8.0, 12.0, 8.0, 16.0, 18.0, 20.0, 22.0, 21.0, 20.0, 39.0, 32.0, 29.0, 37.0, 40.0, 27.0, 39.0, 42.0, 50.0, 45.0, 30.0, 42.0, 40.0, 41.0, 40.0, 28.0, 31.0, 25.0, 19.0, 13.0, 16.0, 14.0, 19.0, 16.0, 6.0, 10.0, 14.0, 8.0, 1.0, 5.0, 1.0, 6.0, 2.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.749069213867188, -13.299906730651855, -12.85074520111084, -12.401582717895508, -11.952421188354492, -11.50325870513916, -11.054097175598145, -10.604934692382812, -10.155773162841797, -9.706610679626465, -9.25744915008545, -8.808286666870117, -8.359125137329102, -7.9099626541137695, -7.460801124572754, -7.011638641357422, -6.562476634979248, -6.113314628601074, -5.6641526222229, -5.214990615844727, -4.765828609466553, -4.316666603088379, -3.867504358291626, -3.418342351913452, -2.9691803455352783, -2.5200183391571045, -2.0708563327789307, -1.6216942071914673, -1.1725322008132935, -0.7233700752258301, -0.27420806884765625, 0.17495393753051758, 0.6241159439086914, 1.0732779502868652, 1.522439956665039, 1.9716020822525024, 2.4207639694213867, 2.8699262142181396, 3.3190882205963135, 3.7682502269744873, 4.217411994934082, 4.666574001312256, 5.11573600769043, 5.5648980140686035, 6.014060020446777, 6.463222503662109, 6.912384033203125, 7.361546516418457, 7.810708522796631, 8.259870529174805, 8.709033012390137, 9.158194541931152, 9.607357025146484, 10.0565185546875, 10.505681037902832, 10.954842567443848, 11.40400505065918, 11.853167533874512, 12.302329063415527, 12.75149154663086, 13.200653076171875, 13.649815559387207, 14.098977088928223, 14.548139572143555, 14.99730110168457]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 11.0, 6.0, 15.0, 26.0, 29.0, 45.0, 62.0, 112.0, 140.0, 181.0, 324.0, 518.0, 805.0, 1334.0, 2338.0, 3854.0, 7087.0, 14015.0, 31299.0, 98012.0, 3839985.0, 120875.0, 35881.0, 15868.0, 8348.0, 4653.0, 2918.0, 1792.0, 1196.0, 772.0, 550.0, 357.0, 269.0, 179.0, 122.0, 84.0, 59.0, 50.0, 32.0, 21.0, 14.0, 11.0, 17.0, 9.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.348388671875, -0.3366050720214844, -0.32482147216796875, -0.3130378723144531, -0.3012542724609375, -0.2894706726074219, -0.27768707275390625, -0.2659034729003906, -0.254119873046875, -0.24233627319335938, -0.23055267333984375, -0.21876907348632812, -0.2069854736328125, -0.19520187377929688, -0.18341827392578125, -0.17163467407226562, -0.15985107421875, -0.14806747436523438, -0.13628387451171875, -0.12450027465820312, -0.1127166748046875, -0.10093307495117188, -0.08914947509765625, -0.07736587524414062, -0.065582275390625, -0.053798675537109375, -0.04201507568359375, -0.030231475830078125, -0.0184478759765625, -0.006664276123046875, 0.00511932373046875, 0.016902923583984375, 0.0286865234375, 0.040470123291015625, 0.05225372314453125, 0.06403732299804688, 0.0758209228515625, 0.08760452270507812, 0.09938812255859375, 0.11117172241210938, 0.122955322265625, 0.13473892211914062, 0.14652252197265625, 0.15830612182617188, 0.1700897216796875, 0.18187332153320312, 0.19365692138671875, 0.20544052124023438, 0.21722412109375, 0.22900772094726562, 0.24079132080078125, 0.2525749206542969, 0.2643585205078125, 0.2761421203613281, 0.28792572021484375, 0.2997093200683594, 0.311492919921875, 0.3232765197753906, 0.33506011962890625, 0.3468437194824219, 0.3586273193359375, 0.3704109191894531, 0.38219451904296875, 0.3939781188964844, 0.40576171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 4.0, 8.0, 5.0, 8.0, 10.0, 11.0, 12.0, 12.0, 22.0, 778.0, 18.0, 15.0, 8.0, 11.0, 12.0, 8.0, 6.0, 9.0, 4.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.106689453125, -0.10329532623291016, -0.09990119934082031, -0.09650707244873047, -0.09311294555664062, -0.08971881866455078, -0.08632469177246094, -0.0829305648803711, -0.07953643798828125, -0.0761423110961914, -0.07274818420410156, -0.06935405731201172, -0.06595993041992188, -0.06256580352783203, -0.05917167663574219, -0.055777549743652344, -0.0523834228515625, -0.048989295959472656, -0.04559516906738281, -0.04220104217529297, -0.038806915283203125, -0.03541278839111328, -0.03201866149902344, -0.028624534606933594, -0.02523040771484375, -0.021836280822753906, -0.018442153930664062, -0.015048027038574219, -0.011653900146484375, -0.008259773254394531, -0.0048656463623046875, -0.0014715194702148438, 0.001922607421875, 0.005316734313964844, 0.008710861206054688, 0.012104988098144531, 0.015499114990234375, 0.01889324188232422, 0.022287368774414062, 0.025681495666503906, 0.02907562255859375, 0.032469749450683594, 0.03586387634277344, 0.03925800323486328, 0.042652130126953125, 0.04604625701904297, 0.04944038391113281, 0.052834510803222656, 0.0562286376953125, 0.059622764587402344, 0.06301689147949219, 0.06641101837158203, 0.06980514526367188, 0.07319927215576172, 0.07659339904785156, 0.0799875259399414, 0.08338165283203125, 0.0867757797241211, 0.09016990661621094, 0.09356403350830078, 0.09695816040039062, 0.10035228729248047, 0.10374641418457031, 0.10714054107666016, 0.11053466796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 6.0, 10.0, 8.0, 22.0, 34.0, 45.0, 61.0, 106.0, 182.0, 302.0, 505.0, 977.0, 1877.0, 3996.0, 8621.0, 21329.0, 59016.0, 199417.0, 1109286.0, 2362597.0, 296018.0, 81470.0, 27941.0, 10739.0, 4910.0, 2247.0, 1086.0, 601.0, 344.0, 181.0, 117.0, 70.0, 51.0, 39.0, 18.0, 16.0, 10.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300048828125, -0.29009246826171875, -0.2801361083984375, -0.27017974853515625, -0.260223388671875, -0.25026702880859375, -0.2403106689453125, -0.23035430908203125, -0.22039794921875, -0.21044158935546875, -0.2004852294921875, -0.19052886962890625, -0.180572509765625, -0.17061614990234375, -0.1606597900390625, -0.15070343017578125, -0.1407470703125, -0.13079071044921875, -0.1208343505859375, -0.11087799072265625, -0.100921630859375, -0.09096527099609375, -0.0810089111328125, -0.07105255126953125, -0.06109619140625, -0.05113983154296875, -0.0411834716796875, -0.03122711181640625, -0.021270751953125, -0.01131439208984375, -0.0013580322265625, 0.00859832763671875, 0.0185546875, 0.02851104736328125, 0.0384674072265625, 0.04842376708984375, 0.058380126953125, 0.06833648681640625, 0.0782928466796875, 0.08824920654296875, 0.09820556640625, 0.10816192626953125, 0.1181182861328125, 0.12807464599609375, 0.138031005859375, 0.14798736572265625, 0.1579437255859375, 0.16790008544921875, 0.1778564453125, 0.18781280517578125, 0.1977691650390625, 0.20772552490234375, 0.217681884765625, 0.22763824462890625, 0.2375946044921875, 0.24755096435546875, 0.25750732421875, 0.26746368408203125, 0.2774200439453125, 0.28737640380859375, 0.297332763671875, 0.30728912353515625, 0.3172454833984375, 0.32720184326171875, 0.337158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 7.0, 12.0, 14.0, 20.0, 27.0, 26.0, 35.0, 47.0, 46.0, 72.0, 91.0, 114.0, 162.0, 218.0, 313.0, 722.0, 852.0, 344.0, 213.0, 149.0, 119.0, 94.0, 87.0, 72.0, 33.0, 45.0, 32.0, 18.0, 22.0, 19.0, 10.0, 3.0, 4.0, 8.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1485595703125, -0.14377593994140625, -0.1389923095703125, -0.13420867919921875, -0.129425048828125, -0.12464141845703125, -0.1198577880859375, -0.11507415771484375, -0.11029052734375, -0.10550689697265625, -0.1007232666015625, -0.09593963623046875, -0.091156005859375, -0.08637237548828125, -0.0815887451171875, -0.07680511474609375, -0.072021484375, -0.06723785400390625, -0.0624542236328125, -0.05767059326171875, -0.052886962890625, -0.04810333251953125, -0.0433197021484375, -0.03853607177734375, -0.03375244140625, -0.02896881103515625, -0.0241851806640625, -0.01940155029296875, -0.014617919921875, -0.00983428955078125, -0.0050506591796875, -0.00026702880859375, 0.0045166015625, 0.00930023193359375, 0.0140838623046875, 0.01886749267578125, 0.023651123046875, 0.02843475341796875, 0.0332183837890625, 0.03800201416015625, 0.04278564453125, 0.04756927490234375, 0.0523529052734375, 0.05713653564453125, 0.061920166015625, 0.06670379638671875, 0.0714874267578125, 0.07627105712890625, 0.0810546875, 0.08583831787109375, 0.0906219482421875, 0.09540557861328125, 0.100189208984375, 0.10497283935546875, 0.1097564697265625, 0.11454010009765625, 0.11932373046875, 0.12410736083984375, 0.1288909912109375, 0.13367462158203125, 0.138458251953125, 0.14324188232421875, 0.1480255126953125, 0.15280914306640625, 0.1575927734375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 11.0, 11.0, 26.0, 70.0, 134.0, 214.0, 208.0, 166.0, 80.0, 38.0, 22.0, 9.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0877388715744019, -1.0405055284500122, -0.9932721853256226, -0.9460387825965881, -0.8988054394721985, -0.8515720963478088, -0.8043386936187744, -0.7571053504943848, -0.7098720073699951, -0.6626386642456055, -0.6154053211212158, -0.5681719183921814, -0.5209385752677917, -0.4737052321434021, -0.42647185921669006, -0.379238486289978, -0.3320051431655884, -0.28477180004119873, -0.2375384271144867, -0.19030506908893585, -0.143071711063385, -0.09583835303783417, -0.048604995012283325, -0.001371622085571289, 0.04586172103881836, 0.0930950790643692, 0.14032843708992004, 0.1875617951154709, 0.23479515314102173, 0.2820284962654114, 0.3292618691921234, 0.37649524211883545, 0.42372870445251465, 0.4709620475769043, 0.518195390701294, 0.5654287934303284, 0.612662136554718, 0.6598954796791077, 0.7071288824081421, 0.7543622255325317, 0.8015955686569214, 0.848828911781311, 0.8960622549057007, 0.9432956576347351, 0.9905290007591248, 1.0377624034881592, 1.0849957466125488, 1.1322290897369385, 1.1794624328613281, 1.2266957759857178, 1.2739291191101074, 1.321162462234497, 1.3683958053588867, 1.415629267692566, 1.4628626108169556, 1.5100959539413452, 1.5573292970657349, 1.6045626401901245, 1.6517959833145142, 1.6990293264389038, 1.746262788772583, 1.7934961318969727, 1.8407294750213623, 1.887962818145752, 1.9351961612701416]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 5.0, 5.0, 7.0, 7.0, 14.0, 15.0, 12.0, 24.0, 33.0, 36.0, 27.0, 40.0, 38.0, 43.0, 54.0, 45.0, 45.0, 59.0, 47.0, 63.0, 47.0, 42.0, 54.0, 42.0, 22.0, 26.0, 21.0, 20.0, 20.0, 19.0, 10.0, 17.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.9560815691947937, -0.9309221506118774, -0.9057627320289612, -0.8806033134460449, -0.8554439544677734, -0.8302845358848572, -0.8051251173019409, -0.7799656987190247, -0.7548062801361084, -0.7296468615531921, -0.7044874429702759, -0.6793280839920044, -0.6541686654090881, -0.6290092468261719, -0.6038498282432556, -0.5786904096603394, -0.5535310506820679, -0.5283716320991516, -0.5032122135162354, -0.4780528247356415, -0.4528934359550476, -0.42773401737213135, -0.4025745987892151, -0.37741518020629883, -0.35225579142570496, -0.3270963728427887, -0.3019369840621948, -0.27677756547927856, -0.2516181468963623, -0.22645875811576843, -0.20129933953285217, -0.1761399358510971, -0.15098059177398682, -0.12582118809223175, -0.10066177695989609, -0.07550236582756042, -0.05034296214580536, -0.025183558464050293, -2.4139881134033203e-05, 0.025135263800621033, 0.0502946674823761, 0.07545407116413116, 0.10061348229646683, 0.1257728934288025, 0.15093229711055756, 0.17609170079231262, 0.20125111937522888, 0.22641052305698395, 0.251569926738739, 0.2767293453216553, 0.30188873410224915, 0.3270481526851654, 0.3522075414657593, 0.37736696004867554, 0.4025263786315918, 0.42768579721450806, 0.45284518599510193, 0.4780046045780182, 0.5031639933586121, 0.5283234119415283, 0.5534828305244446, 0.5786422491073608, 0.6038016080856323, 0.6289610266685486, 0.6541204452514648]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 15.0, 15.0, 26.0, 31.0, 39.0, 67.0, 85.0, 133.0, 157.0, 276.0, 371.0, 527.0, 843.0, 1283.0, 2107.0, 3382.0, 5410.0, 9503.0, 17799.0, 42850.0, 617070.0, 277746.0, 32062.0, 15278.0, 8187.0, 4832.0, 2980.0, 1856.0, 1145.0, 780.0, 526.0, 342.0, 254.0, 167.0, 117.0, 79.0, 53.0, 52.0, 35.0, 27.0, 15.0, 9.0, 15.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.253662109375, -0.24570465087890625, -0.2377471923828125, -0.22978973388671875, -0.221832275390625, -0.21387481689453125, -0.2059173583984375, -0.19795989990234375, -0.19000244140625, -0.18204498291015625, -0.1740875244140625, -0.16613006591796875, -0.158172607421875, -0.15021514892578125, -0.1422576904296875, -0.13430023193359375, -0.1263427734375, -0.11838531494140625, -0.1104278564453125, -0.10247039794921875, -0.094512939453125, -0.08655548095703125, -0.0785980224609375, -0.07064056396484375, -0.06268310546875, -0.05472564697265625, -0.0467681884765625, -0.03881072998046875, -0.030853271484375, -0.02289581298828125, -0.0149383544921875, -0.00698089599609375, 0.0009765625, 0.00893402099609375, 0.0168914794921875, 0.02484893798828125, 0.032806396484375, 0.04076385498046875, 0.0487213134765625, 0.05667877197265625, 0.06463623046875, 0.07259368896484375, 0.0805511474609375, 0.08850860595703125, 0.096466064453125, 0.10442352294921875, 0.1123809814453125, 0.12033843994140625, 0.1282958984375, 0.13625335693359375, 0.1442108154296875, 0.15216827392578125, 0.160125732421875, 0.16808319091796875, 0.1760406494140625, 0.18399810791015625, 0.19195556640625, 0.19991302490234375, 0.2078704833984375, 0.21582794189453125, 0.223785400390625, 0.23174285888671875, 0.2397003173828125, 0.24765777587890625, 0.255615234375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 1.0, 9.0, 3.0, 8.0, 6.0, 10.0, 15.0, 15.0, 37.0, 151.0, 308.0, 243.0, 79.0, 22.0, 17.0, 13.0, 9.0, 11.0, 5.0, 4.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1058349609375, -0.10239887237548828, -0.09896278381347656, -0.09552669525146484, -0.09209060668945312, -0.0886545181274414, -0.08521842956542969, -0.08178234100341797, -0.07834625244140625, -0.07491016387939453, -0.07147407531738281, -0.0680379867553711, -0.06460189819335938, -0.061165809631347656, -0.05772972106933594, -0.05429363250732422, -0.0508575439453125, -0.04742145538330078, -0.04398536682128906, -0.040549278259277344, -0.037113189697265625, -0.033677101135253906, -0.030241012573242188, -0.02680492401123047, -0.02336883544921875, -0.01993274688720703, -0.016496658325195312, -0.013060569763183594, -0.009624481201171875, -0.006188392639160156, -0.0027523040771484375, 0.0006837844848632812, 0.004119873046875, 0.007555961608886719, 0.010992050170898438, 0.014428138732910156, 0.017864227294921875, 0.021300315856933594, 0.024736404418945312, 0.02817249298095703, 0.03160858154296875, 0.03504467010498047, 0.03848075866699219, 0.041916847229003906, 0.045352935791015625, 0.048789024353027344, 0.05222511291503906, 0.05566120147705078, 0.0590972900390625, 0.06253337860107422, 0.06596946716308594, 0.06940555572509766, 0.07284164428710938, 0.0762777328491211, 0.07971382141113281, 0.08314990997314453, 0.08658599853515625, 0.09002208709716797, 0.09345817565917969, 0.0968942642211914, 0.10033035278320312, 0.10376644134521484, 0.10720252990722656, 0.11063861846923828, 0.11407470703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 5.0, 16.0, 21.0, 36.0, 83.0, 143.0, 330.0, 733.0, 1942.0, 5998.0, 20283.0, 79778.0, 318449.0, 448735.0, 126972.0, 31241.0, 8992.0, 2877.0, 1029.0, 458.0, 190.0, 115.0, 47.0, 16.0, 20.0, 15.0, 8.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4912109375, -0.4754486083984375, -0.459686279296875, -0.4439239501953125, -0.42816162109375, -0.4123992919921875, -0.396636962890625, -0.3808746337890625, -0.3651123046875, -0.3493499755859375, -0.333587646484375, -0.3178253173828125, -0.30206298828125, -0.2863006591796875, -0.270538330078125, -0.2547760009765625, -0.239013671875, -0.2232513427734375, -0.207489013671875, -0.1917266845703125, -0.17596435546875, -0.1602020263671875, -0.144439697265625, -0.1286773681640625, -0.1129150390625, -0.0971527099609375, -0.081390380859375, -0.0656280517578125, -0.04986572265625, -0.0341033935546875, -0.018341064453125, -0.0025787353515625, 0.01318359375, 0.0289459228515625, 0.044708251953125, 0.0604705810546875, 0.07623291015625, 0.0919952392578125, 0.107757568359375, 0.1235198974609375, 0.1392822265625, 0.1550445556640625, 0.170806884765625, 0.1865692138671875, 0.20233154296875, 0.2180938720703125, 0.233856201171875, 0.2496185302734375, 0.265380859375, 0.2811431884765625, 0.296905517578125, 0.3126678466796875, 0.32843017578125, 0.3441925048828125, 0.359954833984375, 0.3757171630859375, 0.3914794921875, 0.4072418212890625, 0.423004150390625, 0.4387664794921875, 0.45452880859375, 0.4702911376953125, 0.486053466796875, 0.5018157958984375, 0.517578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 5.0, 6.0, 12.0, 9.0, 6.0, 11.0, 27.0, 27.0, 31.0, 24.0, 39.0, 39.0, 36.0, 39.0, 47.0, 35.0, 34.0, 38.0, 41.0, 44.0, 32.0, 38.0, 34.0, 29.0, 28.0, 35.0, 30.0, 35.0, 28.0, 28.0, 21.0, 13.0, 11.0, 14.0, 18.0, 6.0, 7.0, 6.0, 10.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.373046875, -0.3599891662597656, -0.34693145751953125, -0.3338737487792969, -0.3208160400390625, -0.3077583312988281, -0.29470062255859375, -0.2816429138183594, -0.268585205078125, -0.2555274963378906, -0.24246978759765625, -0.22941207885742188, -0.2163543701171875, -0.20329666137695312, -0.19023895263671875, -0.17718124389648438, -0.16412353515625, -0.15106582641601562, -0.13800811767578125, -0.12495040893554688, -0.1118927001953125, -0.09883499145507812, -0.08577728271484375, -0.07271957397460938, -0.059661865234375, -0.046604156494140625, -0.03354644775390625, -0.020488739013671875, -0.0074310302734375, 0.005626678466796875, 0.01868438720703125, 0.031742095947265625, 0.0447998046875, 0.057857513427734375, 0.07091522216796875, 0.08397293090820312, 0.0970306396484375, 0.11008834838867188, 0.12314605712890625, 0.13620376586914062, 0.149261474609375, 0.16231918334960938, 0.17537689208984375, 0.18843460083007812, 0.2014923095703125, 0.21455001831054688, 0.22760772705078125, 0.24066543579101562, 0.25372314453125, 0.2667808532714844, 0.27983856201171875, 0.2928962707519531, 0.3059539794921875, 0.3190116882324219, 0.33206939697265625, 0.3451271057128906, 0.358184814453125, 0.3712425231933594, 0.38430023193359375, 0.3973579406738281, 0.4104156494140625, 0.4234733581542969, 0.43653106689453125, 0.4495887756347656, 0.462646484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 6.0, 19.0, 20.0, 47.0, 115.0, 349.0, 1490.0, 20258.0, 1018514.0, 6420.0, 869.0, 242.0, 98.0, 53.0, 20.0, 9.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.06597900390625, -1.0255126953125, -0.98504638671875, -0.944580078125, -0.90411376953125, -0.8636474609375, -0.82318115234375, -0.78271484375, -0.74224853515625, -0.7017822265625, -0.66131591796875, -0.620849609375, -0.58038330078125, -0.5399169921875, -0.49945068359375, -0.458984375, -0.41851806640625, -0.3780517578125, -0.33758544921875, -0.297119140625, -0.25665283203125, -0.2161865234375, -0.17572021484375, -0.13525390625, -0.09478759765625, -0.0543212890625, -0.01385498046875, 0.026611328125, 0.06707763671875, 0.1075439453125, 0.14801025390625, 0.1884765625, 0.22894287109375, 0.2694091796875, 0.30987548828125, 0.350341796875, 0.39080810546875, 0.4312744140625, 0.47174072265625, 0.51220703125, 0.55267333984375, 0.5931396484375, 0.63360595703125, 0.674072265625, 0.71453857421875, 0.7550048828125, 0.79547119140625, 0.8359375, 0.87640380859375, 0.9168701171875, 0.95733642578125, 0.997802734375, 1.03826904296875, 1.0787353515625, 1.11920166015625, 1.15966796875, 1.20013427734375, 1.2406005859375, 1.28106689453125, 1.321533203125, 1.36199951171875, 1.4024658203125, 1.44293212890625, 1.4833984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 4.0, 5.0, 14.0, 15.0, 18.0, 19.0, 15.0, 41.0, 53.0, 59.0, 57.0, 63.0, 73.0, 84.0, 65.0, 66.0, 75.0, 50.0, 48.0, 34.0, 34.0, 19.0, 14.0, 12.0, 11.0, 7.0, 5.0, 4.0, 2.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.574920654296875e-05, -2.4784356355667114e-05, -2.381950616836548e-05, -2.2854655981063843e-05, -2.1889805793762207e-05, -2.092495560646057e-05, -1.9960105419158936e-05, -1.89952552318573e-05, -1.8030405044555664e-05, -1.706555485725403e-05, -1.6100704669952393e-05, -1.5135854482650757e-05, -1.4171004295349121e-05, -1.3206154108047485e-05, -1.224130392074585e-05, -1.1276453733444214e-05, -1.0311603546142578e-05, -9.346753358840942e-06, -8.381903171539307e-06, -7.417052984237671e-06, -6.452202796936035e-06, -5.487352609634399e-06, -4.522502422332764e-06, -3.557652235031128e-06, -2.592802047729492e-06, -1.6279518604278564e-06, -6.631016731262207e-07, 3.0174851417541504e-07, 1.2665987014770508e-06, 2.2314488887786865e-06, 3.1962990760803223e-06, 4.161149263381958e-06, 5.125999450683594e-06, 6.0908496379852295e-06, 7.055699825286865e-06, 8.020550012588501e-06, 8.985400199890137e-06, 9.950250387191772e-06, 1.0915100574493408e-05, 1.1879950761795044e-05, 1.284480094909668e-05, 1.3809651136398315e-05, 1.4774501323699951e-05, 1.5739351511001587e-05, 1.6704201698303223e-05, 1.766905188560486e-05, 1.8633902072906494e-05, 1.959875226020813e-05, 2.0563602447509766e-05, 2.15284526348114e-05, 2.2493302822113037e-05, 2.3458153009414673e-05, 2.442300319671631e-05, 2.5387853384017944e-05, 2.635270357131958e-05, 2.7317553758621216e-05, 2.828240394592285e-05, 2.9247254133224487e-05, 3.0212104320526123e-05, 3.117695450782776e-05, 3.2141804695129395e-05, 3.310665488243103e-05, 3.4071505069732666e-05, 3.50363552570343e-05, 3.600120544433594e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 7.0, 17.0, 12.0, 23.0, 34.0, 54.0, 87.0, 115.0, 159.0, 244.0, 313.0, 581.0, 936.0, 1543.0, 2870.0, 5570.0, 12027.0, 31639.0, 113897.0, 572434.0, 223442.0, 49213.0, 17006.0, 7470.0, 3652.0, 2009.0, 1155.0, 672.0, 441.0, 290.0, 198.0, 127.0, 89.0, 70.0, 44.0, 25.0, 25.0, 16.0, 13.0, 11.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.1934814453125, -0.18806076049804688, -0.18264007568359375, -0.17721939086914062, -0.1717987060546875, -0.16637802124023438, -0.16095733642578125, -0.15553665161132812, -0.150115966796875, -0.14469528198242188, -0.13927459716796875, -0.13385391235351562, -0.1284332275390625, -0.12301254272460938, -0.11759185791015625, -0.11217117309570312, -0.10675048828125, -0.10132980346679688, -0.09590911865234375, -0.09048843383789062, -0.0850677490234375, -0.07964706420898438, -0.07422637939453125, -0.06880569458007812, -0.063385009765625, -0.057964324951171875, -0.05254364013671875, -0.047122955322265625, -0.0417022705078125, -0.036281585693359375, -0.03086090087890625, -0.025440216064453125, -0.02001953125, -0.014598846435546875, -0.00917816162109375, -0.003757476806640625, 0.0016632080078125, 0.007083892822265625, 0.01250457763671875, 0.017925262451171875, 0.023345947265625, 0.028766632080078125, 0.03418731689453125, 0.039608001708984375, 0.0450286865234375, 0.050449371337890625, 0.05587005615234375, 0.061290740966796875, 0.06671142578125, 0.07213211059570312, 0.07755279541015625, 0.08297348022460938, 0.0883941650390625, 0.09381484985351562, 0.09923553466796875, 0.10465621948242188, 0.110076904296875, 0.11549758911132812, 0.12091827392578125, 0.12633895874023438, 0.1317596435546875, 0.13718032836914062, 0.14260101318359375, 0.14802169799804688, 0.1534423828125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 11.0, 18.0, 22.0, 39.0, 32.0, 56.0, 69.0, 104.0, 128.0, 109.0, 102.0, 65.0, 55.0, 41.0, 33.0, 33.0, 13.0, 9.0, 11.0, 5.0, 8.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2693595886230469, -0.26064300537109375, -0.2519264221191406, -0.2432098388671875, -0.23449325561523438, -0.22577667236328125, -0.21706008911132812, -0.208343505859375, -0.19962692260742188, -0.19091033935546875, -0.18219375610351562, -0.1734771728515625, -0.16476058959960938, -0.15604400634765625, -0.14732742309570312, -0.13861083984375, -0.12989425659179688, -0.12117767333984375, -0.11246109008789062, -0.1037445068359375, -0.09502792358398438, -0.08631134033203125, -0.07759475708007812, -0.068878173828125, -0.060161590576171875, -0.05144500732421875, -0.042728424072265625, -0.0340118408203125, -0.025295257568359375, -0.01657867431640625, -0.007862091064453125, 0.0008544921875, 0.009571075439453125, 0.01828765869140625, 0.027004241943359375, 0.0357208251953125, 0.044437408447265625, 0.05315399169921875, 0.061870574951171875, 0.070587158203125, 0.07930374145507812, 0.08802032470703125, 0.09673690795898438, 0.1054534912109375, 0.11417007446289062, 0.12288665771484375, 0.13160324096679688, 0.14031982421875, 0.14903640747070312, 0.15775299072265625, 0.16646957397460938, 0.1751861572265625, 0.18390274047851562, 0.19261932373046875, 0.20133590698242188, 0.210052490234375, 0.21876907348632812, 0.22748565673828125, 0.23620223999023438, 0.2449188232421875, 0.2536354064941406, 0.26235198974609375, 0.2710685729980469, 0.27978515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 13.0, 24.0, 42.0, 96.0, 196.0, 255.0, 164.0, 86.0, 46.0, 29.0, 14.0, 12.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.376052379608154, -5.219544410705566, -5.0630364418029785, -4.906528472900391, -4.750020980834961, -4.593513011932373, -4.437005043029785, -4.280497074127197, -4.123989105224609, -3.9674811363220215, -3.8109731674194336, -3.654465436935425, -3.497957468032837, -3.341449499130249, -3.1849417686462402, -3.0284337997436523, -2.8719258308410645, -2.7154178619384766, -2.5589098930358887, -2.40240216255188, -2.245894193649292, -2.089386224746704, -1.9328783750534058, -1.7763705253601074, -1.6198625564575195, -1.4633545875549316, -1.3068467378616333, -1.150338888168335, -0.9938309192657471, -0.837323009967804, -0.6808151006698608, -0.5243072509765625, -0.3677988052368164, -0.2112908959388733, -0.054782986640930176, 0.10172492265701294, 0.25823283195495605, 0.41474074125289917, 0.5712486505508423, 0.7277565002441406, 0.8842644691467285, 1.0407724380493164, 1.1972802877426147, 1.353788137435913, 1.510296106338501, 1.6668040752410889, 1.8233119249343872, 1.9798197746276855, 2.1363277435302734, 2.2928357124328613, 2.449343681335449, 2.605851411819458, 2.762359380722046, 2.918867349624634, 3.0753750801086426, 3.2318830490112305, 3.3883910179138184, 3.5448989868164062, 3.701406955718994, 3.857914686203003, 4.014422416687012, 4.1709303855896, 4.3274383544921875, 4.483946323394775, 4.640454292297363]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 1.0, 6.0, 5.0, 7.0, 11.0, 17.0, 36.0, 63.0, 111.0, 122.0, 171.0, 130.0, 115.0, 70.0, 35.0, 23.0, 14.0, 11.0, 8.0, 4.0, 2.0, 1.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.360021591186523, -9.090184211730957, -8.820345878601074, -8.550508499145508, -8.280671119689941, -8.010833740234375, -7.740995407104492, -7.471158027648926, -7.201320171356201, -6.931482315063477, -6.66164493560791, -6.3918070793151855, -6.121969223022461, -5.8521318435668945, -5.58229398727417, -5.312456130981445, -5.042618751525879, -4.772780895233154, -4.502943515777588, -4.233105659484863, -3.9632680416107178, -3.6934304237365723, -3.4235925674438477, -3.153754949569702, -2.8839173316955566, -2.614079713821411, -2.3442420959472656, -2.074404239654541, -1.8045666217803955, -1.53472900390625, -1.264891266822815, -0.9950535297393799, -0.7252163887023926, -0.4553787112236023, -0.185541033744812, 0.08429664373397827, 0.35413432121276855, 0.6239719390869141, 0.8938096761703491, 1.1636474132537842, 1.4334850311279297, 1.7033226490020752, 1.9731603860855103, 2.2429981231689453, 2.512835741043091, 2.7826733589172363, 3.052511215209961, 3.3223488330841064, 3.592186450958252, 3.8620240688323975, 4.131861686706543, 4.401699542999268, 4.671537399291992, 4.941374778747559, 5.211212635040283, 5.481050491333008, 5.750887870788574, 6.020725727081299, 6.290563106536865, 6.56040096282959, 6.830238342285156, 7.100076198577881, 7.3699140548706055, 7.639751434326172, 7.9095892906188965]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 5.0, 9.0, 8.0, 5.0, 7.0, 20.0, 25.0, 34.0, 41.0, 73.0, 86.0, 116.0, 183.0, 230.0, 428.0, 630.0, 972.0, 1651.0, 2943.0, 6031.0, 15129.0, 73639.0, 3932661.0, 125063.0, 19464.0, 6863.0, 3339.0, 1810.0, 964.0, 649.0, 365.0, 267.0, 167.0, 136.0, 95.0, 59.0, 28.0, 18.0, 26.0, 15.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9873046875, -0.9587631225585938, -0.9302215576171875, -0.9016799926757812, -0.873138427734375, -0.8445968627929688, -0.8160552978515625, -0.7875137329101562, -0.75897216796875, -0.7304306030273438, -0.7018890380859375, -0.6733474731445312, -0.644805908203125, -0.6162643432617188, -0.5877227783203125, -0.5591812133789062, -0.5306396484375, -0.5020980834960938, -0.4735565185546875, -0.44501495361328125, -0.416473388671875, -0.38793182373046875, -0.3593902587890625, -0.33084869384765625, -0.30230712890625, -0.27376556396484375, -0.2452239990234375, -0.21668243408203125, -0.188140869140625, -0.15959930419921875, -0.1310577392578125, -0.10251617431640625, -0.073974609375, -0.04543304443359375, -0.0168914794921875, 0.01165008544921875, 0.040191650390625, 0.06873321533203125, 0.0972747802734375, 0.12581634521484375, 0.15435791015625, 0.18289947509765625, 0.2114410400390625, 0.23998260498046875, 0.268524169921875, 0.29706573486328125, 0.3256072998046875, 0.35414886474609375, 0.3826904296875, 0.41123199462890625, 0.4397735595703125, 0.46831512451171875, 0.496856689453125, 0.5253982543945312, 0.5539398193359375, 0.5824813842773438, 0.61102294921875, 0.6395645141601562, 0.6681060791015625, 0.6966476440429688, 0.725189208984375, 0.7537307739257812, 0.7822723388671875, 0.8108139038085938, 0.83935546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 5.0, 4.0, 6.0, 5.0, 5.0, 6.0, 11.0, 7.0, 21.0, 14.0, 37.0, 74.0, 114.0, 182.0, 162.0, 124.0, 70.0, 47.0, 24.0, 15.0, 11.0, 9.0, 3.0, 7.0, 5.0, 6.0, 4.0, 2.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.11114501953125, -0.10814285278320312, -0.10514068603515625, -0.10213851928710938, -0.0991363525390625, -0.09613418579101562, -0.09313201904296875, -0.09012985229492188, -0.087127685546875, -0.08412551879882812, -0.08112335205078125, -0.07812118530273438, -0.0751190185546875, -0.07211685180664062, -0.06911468505859375, -0.06611251831054688, -0.0631103515625, -0.060108184814453125, -0.05710601806640625, -0.054103851318359375, -0.0511016845703125, -0.048099517822265625, -0.04509735107421875, -0.042095184326171875, -0.039093017578125, -0.036090850830078125, -0.03308868408203125, -0.030086517333984375, -0.0270843505859375, -0.024082183837890625, -0.02108001708984375, -0.018077850341796875, -0.01507568359375, -0.012073516845703125, -0.00907135009765625, -0.006069183349609375, -0.0030670166015625, -6.4849853515625e-05, 0.00293731689453125, 0.005939483642578125, 0.008941650390625, 0.011943817138671875, 0.01494598388671875, 0.017948150634765625, 0.0209503173828125, 0.023952484130859375, 0.02695465087890625, 0.029956817626953125, 0.032958984375, 0.035961151123046875, 0.03896331787109375, 0.041965484619140625, 0.0449676513671875, 0.047969818115234375, 0.05097198486328125, 0.053974151611328125, 0.056976318359375, 0.059978485107421875, 0.06298065185546875, 0.06598281860351562, 0.0689849853515625, 0.07198715209960938, 0.07498931884765625, 0.07799148559570312, 0.08099365234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 13.0, 14.0, 6.0, 21.0, 17.0, 31.0, 45.0, 64.0, 109.0, 174.0, 238.0, 403.0, 693.0, 1222.0, 1987.0, 3693.0, 7436.0, 16587.0, 52951.0, 439660.0, 3497630.0, 120282.0, 28559.0, 10835.0, 5037.0, 2703.0, 1564.0, 830.0, 532.0, 333.0, 208.0, 133.0, 85.0, 59.0, 36.0, 24.0, 19.0, 15.0, 11.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.68212890625, -0.6616134643554688, -0.6410980224609375, -0.6205825805664062, -0.600067138671875, -0.5795516967773438, -0.5590362548828125, -0.5385208129882812, -0.51800537109375, -0.49748992919921875, -0.4769744873046875, -0.45645904541015625, -0.435943603515625, -0.41542816162109375, -0.3949127197265625, -0.37439727783203125, -0.3538818359375, -0.33336639404296875, -0.3128509521484375, -0.29233551025390625, -0.271820068359375, -0.25130462646484375, -0.2307891845703125, -0.21027374267578125, -0.18975830078125, -0.16924285888671875, -0.1487274169921875, -0.12821197509765625, -0.107696533203125, -0.08718109130859375, -0.0666656494140625, -0.04615020751953125, -0.025634765625, -0.00511932373046875, 0.0153961181640625, 0.03591156005859375, 0.056427001953125, 0.07694244384765625, 0.0974578857421875, 0.11797332763671875, 0.13848876953125, 0.15900421142578125, 0.1795196533203125, 0.20003509521484375, 0.220550537109375, 0.24106597900390625, 0.2615814208984375, 0.28209686279296875, 0.3026123046875, 0.32312774658203125, 0.3436431884765625, 0.36415863037109375, 0.384674072265625, 0.40518951416015625, 0.4257049560546875, 0.44622039794921875, 0.46673583984375, 0.48725128173828125, 0.5077667236328125, 0.5282821655273438, 0.548797607421875, 0.5693130493164062, 0.5898284912109375, 0.6103439331054688, 0.630859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 5.0, 4.0, 7.0, 11.0, 14.0, 14.0, 41.0, 51.0, 86.0, 166.0, 404.0, 2112.0, 618.0, 206.0, 99.0, 61.0, 33.0, 33.0, 14.0, 14.0, 13.0, 10.0, 5.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1583251953125, -0.15346908569335938, -0.14861297607421875, -0.14375686645507812, -0.1389007568359375, -0.13404464721679688, -0.12918853759765625, -0.12433242797851562, -0.119476318359375, -0.11462020874023438, -0.10976409912109375, -0.10490798950195312, -0.1000518798828125, -0.09519577026367188, -0.09033966064453125, -0.08548355102539062, -0.08062744140625, -0.07577133178710938, -0.07091522216796875, -0.06605911254882812, -0.0612030029296875, -0.056346893310546875, -0.05149078369140625, -0.046634674072265625, -0.041778564453125, -0.036922454833984375, -0.03206634521484375, -0.027210235595703125, -0.0223541259765625, -0.017498016357421875, -0.01264190673828125, -0.007785797119140625, -0.0029296875, 0.001926422119140625, 0.00678253173828125, 0.011638641357421875, 0.0164947509765625, 0.021350860595703125, 0.02620697021484375, 0.031063079833984375, 0.035919189453125, 0.040775299072265625, 0.04563140869140625, 0.050487518310546875, 0.0553436279296875, 0.060199737548828125, 0.06505584716796875, 0.06991195678710938, 0.07476806640625, 0.07962417602539062, 0.08448028564453125, 0.08933639526367188, 0.0941925048828125, 0.09904861450195312, 0.10390472412109375, 0.10876083374023438, 0.113616943359375, 0.11847305297851562, 0.12332916259765625, 0.12818527221679688, 0.1330413818359375, 0.13789749145507812, 0.14275360107421875, 0.14760971069335938, 0.1524658203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 9.0, 23.0, 43.0, 96.0, 260.0, 253.0, 149.0, 68.0, 42.0, 22.0, 16.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4395490288734436, -0.41229909658432007, -0.38504916429519653, -0.357799232006073, -0.33054929971694946, -0.3032993674278259, -0.27604940533638, -0.24879947304725647, -0.22154954075813293, -0.1942996084690094, -0.16704967617988586, -0.13979972898960114, -0.1125497967004776, -0.08529986441135406, -0.058049917221069336, -0.0307999849319458, -0.0035500526428222656, 0.023699883371591568, 0.0509498193860054, 0.07819975912570953, 0.10544969141483307, 0.1326996237039566, 0.15994957089424133, 0.18719950318336487, 0.2144494354724884, 0.24169936776161194, 0.2689493000507355, 0.2961992621421814, 0.32344919443130493, 0.35069912672042847, 0.377949059009552, 0.40519899129867554, 0.4324488639831543, 0.45969879627227783, 0.48694872856140137, 0.5141986608505249, 0.5414485931396484, 0.568698525428772, 0.5959484577178955, 0.623198390007019, 0.6504483222961426, 0.6776982545852661, 0.7049481868743896, 0.7321981191635132, 0.7594480514526367, 0.7866979837417603, 0.8139479160308838, 0.8411978483200073, 0.8684478402137756, 0.8956977725028992, 0.9229477047920227, 0.9501976370811462, 0.9774475693702698, 1.004697561264038, 1.0319474935531616, 1.0591974258422852, 1.0864473581314087, 1.1136972904205322, 1.1409472227096558, 1.1681971549987793, 1.1954470872879028, 1.2226970195770264, 1.24994695186615, 1.2771968841552734, 1.304446816444397]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 11.0, 8.0, 23.0, 19.0, 35.0, 49.0, 75.0, 86.0, 126.0, 107.0, 112.0, 92.0, 63.0, 58.0, 42.0, 24.0, 17.0, 9.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.908355712890625, -0.8805968165397644, -0.852837860584259, -0.8250789642333984, -0.7973200678825378, -0.7695611715316772, -0.7418022155761719, -0.7140433192253113, -0.6862844228744507, -0.6585255265235901, -0.6307665705680847, -0.6030076742172241, -0.5752487778663635, -0.5474898815155029, -0.5197309255599976, -0.49197202920913696, -0.4642130732536316, -0.4364541471004486, -0.408695250749588, -0.38093632459640503, -0.35317742824554443, -0.32541850209236145, -0.29765957593917847, -0.26990067958831787, -0.2421417534351349, -0.2143828421831131, -0.1866239309310913, -0.15886500477790833, -0.13110609352588654, -0.10334718227386475, -0.07558825612068176, -0.04782934486865997, -0.020070433616638184, 0.007688481360673904, 0.03544739633798599, 0.06320631504058838, 0.09096522629261017, 0.11872413754463196, 0.14648306369781494, 0.17424197494983673, 0.20200088620185852, 0.2297597974538803, 0.2575187087059021, 0.2852776348590851, 0.31303656101226807, 0.34079545736312866, 0.36855438351631165, 0.39631330966949463, 0.4240722060203552, 0.4518311321735382, 0.4795900285243988, 0.5073489546775818, 0.5351078510284424, 0.5628668069839478, 0.5906257033348083, 0.618384599685669, 0.6461435556411743, 0.6739024519920349, 0.7016614079475403, 0.7294203042984009, 0.7571792006492615, 0.7849380970001221, 0.8126970529556274, 0.840455949306488, 0.8682148456573486]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 5.0, 8.0, 11.0, 11.0, 21.0, 19.0, 34.0, 44.0, 78.0, 119.0, 152.0, 306.0, 472.0, 770.0, 1399.0, 2538.0, 4939.0, 10475.0, 27300.0, 108675.0, 639848.0, 188055.0, 36651.0, 13491.0, 6099.0, 3012.0, 1662.0, 894.0, 548.0, 302.0, 223.0, 131.0, 77.0, 46.0, 40.0, 22.0, 14.0, 19.0, 13.0, 8.0, 4.0, 5.0, 7.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.476318359375, -0.46172332763671875, -0.4471282958984375, -0.43253326416015625, -0.417938232421875, -0.40334320068359375, -0.3887481689453125, -0.37415313720703125, -0.35955810546875, -0.34496307373046875, -0.3303680419921875, -0.31577301025390625, -0.301177978515625, -0.28658294677734375, -0.2719879150390625, -0.25739288330078125, -0.2427978515625, -0.22820281982421875, -0.2136077880859375, -0.19901275634765625, -0.184417724609375, -0.16982269287109375, -0.1552276611328125, -0.14063262939453125, -0.12603759765625, -0.11144256591796875, -0.0968475341796875, -0.08225250244140625, -0.067657470703125, -0.05306243896484375, -0.0384674072265625, -0.02387237548828125, -0.00927734375, 0.00531768798828125, 0.0199127197265625, 0.03450775146484375, 0.049102783203125, 0.06369781494140625, 0.0782928466796875, 0.09288787841796875, 0.10748291015625, 0.12207794189453125, 0.1366729736328125, 0.15126800537109375, 0.165863037109375, 0.18045806884765625, 0.1950531005859375, 0.20964813232421875, 0.2242431640625, 0.23883819580078125, 0.2534332275390625, 0.26802825927734375, 0.282623291015625, 0.29721832275390625, 0.3118133544921875, 0.32640838623046875, 0.34100341796875, 0.35559844970703125, 0.3701934814453125, 0.38478851318359375, 0.399383544921875, 0.41397857666015625, 0.4285736083984375, 0.44316864013671875, 0.457763671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 1.0, 3.0, 8.0, 4.0, 1.0, 4.0, 13.0, 10.0, 10.0, 13.0, 9.0, 30.0, 41.0, 69.0, 77.0, 111.0, 124.0, 117.0, 88.0, 79.0, 43.0, 39.0, 21.0, 22.0, 12.0, 9.0, 7.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058349609375, -0.05644989013671875, -0.0545501708984375, -0.05265045166015625, -0.050750732421875, -0.04885101318359375, -0.0469512939453125, -0.04505157470703125, -0.04315185546875, -0.04125213623046875, -0.0393524169921875, -0.03745269775390625, -0.035552978515625, -0.03365325927734375, -0.0317535400390625, -0.02985382080078125, -0.0279541015625, -0.02605438232421875, -0.0241546630859375, -0.02225494384765625, -0.020355224609375, -0.01845550537109375, -0.0165557861328125, -0.01465606689453125, -0.01275634765625, -0.01085662841796875, -0.0089569091796875, -0.00705718994140625, -0.005157470703125, -0.00325775146484375, -0.0013580322265625, 0.00054168701171875, 0.00244140625, 0.00434112548828125, 0.0062408447265625, 0.00814056396484375, 0.010040283203125, 0.01194000244140625, 0.0138397216796875, 0.01573944091796875, 0.01763916015625, 0.01953887939453125, 0.0214385986328125, 0.02333831787109375, 0.025238037109375, 0.02713775634765625, 0.0290374755859375, 0.03093719482421875, 0.0328369140625, 0.03473663330078125, 0.0366363525390625, 0.03853607177734375, 0.040435791015625, 0.04233551025390625, 0.0442352294921875, 0.04613494873046875, 0.04803466796875, 0.04993438720703125, 0.0518341064453125, 0.05373382568359375, 0.055633544921875, 0.05753326416015625, 0.0594329833984375, 0.06133270263671875, 0.063232421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 21.0, 30.0, 60.0, 102.0, 178.0, 339.0, 635.0, 1328.0, 2688.0, 5640.0, 11692.0, 25889.0, 59455.0, 143310.0, 293367.0, 275523.0, 129492.0, 53638.0, 23942.0, 11004.0, 5000.0, 2526.0, 1254.0, 618.0, 353.0, 179.0, 124.0, 58.0, 36.0, 15.0, 20.0, 6.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.225830078125, -0.21802520751953125, -0.2102203369140625, -0.20241546630859375, -0.194610595703125, -0.18680572509765625, -0.1790008544921875, -0.17119598388671875, -0.16339111328125, -0.15558624267578125, -0.1477813720703125, -0.13997650146484375, -0.132171630859375, -0.12436676025390625, -0.1165618896484375, -0.10875701904296875, -0.1009521484375, -0.09314727783203125, -0.0853424072265625, -0.07753753662109375, -0.069732666015625, -0.06192779541015625, -0.0541229248046875, -0.04631805419921875, -0.03851318359375, -0.03070831298828125, -0.0229034423828125, -0.01509857177734375, -0.007293701171875, 0.00051116943359375, 0.0083160400390625, 0.01612091064453125, 0.02392578125, 0.03173065185546875, 0.0395355224609375, 0.04734039306640625, 0.055145263671875, 0.06295013427734375, 0.0707550048828125, 0.07855987548828125, 0.08636474609375, 0.09416961669921875, 0.1019744873046875, 0.10977935791015625, 0.117584228515625, 0.12538909912109375, 0.1331939697265625, 0.14099884033203125, 0.1488037109375, 0.15660858154296875, 0.1644134521484375, 0.17221832275390625, 0.180023193359375, 0.18782806396484375, 0.1956329345703125, 0.20343780517578125, 0.21124267578125, 0.21904754638671875, 0.2268524169921875, 0.23465728759765625, 0.242462158203125, 0.25026702880859375, 0.2580718994140625, 0.26587677001953125, 0.273681640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 13.0, 9.0, 9.0, 11.0, 11.0, 8.0, 16.0, 15.0, 14.0, 14.0, 26.0, 22.0, 25.0, 36.0, 25.0, 24.0, 29.0, 33.0, 33.0, 30.0, 41.0, 35.0, 30.0, 47.0, 39.0, 40.0, 30.0, 26.0, 32.0, 21.0, 27.0, 30.0, 23.0, 20.0, 17.0, 19.0, 12.0, 16.0, 9.0, 14.0, 14.0, 8.0, 7.0, 6.0, 5.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.1827392578125, -0.17677688598632812, -0.17081451416015625, -0.16485214233398438, -0.1588897705078125, -0.15292739868164062, -0.14696502685546875, -0.14100265502929688, -0.135040283203125, -0.12907791137695312, -0.12311553955078125, -0.11715316772460938, -0.1111907958984375, -0.10522842407226562, -0.09926605224609375, -0.09330368041992188, -0.08734130859375, -0.08137893676757812, -0.07541656494140625, -0.06945419311523438, -0.0634918212890625, -0.057529449462890625, -0.05156707763671875, -0.045604705810546875, -0.039642333984375, -0.033679962158203125, -0.02771759033203125, -0.021755218505859375, -0.0157928466796875, -0.009830474853515625, -0.00386810302734375, 0.002094268798828125, 0.008056640625, 0.014019012451171875, 0.01998138427734375, 0.025943756103515625, 0.0319061279296875, 0.037868499755859375, 0.04383087158203125, 0.049793243408203125, 0.055755615234375, 0.061717987060546875, 0.06768035888671875, 0.07364273071289062, 0.0796051025390625, 0.08556747436523438, 0.09152984619140625, 0.09749221801757812, 0.10345458984375, 0.10941696166992188, 0.11537933349609375, 0.12134170532226562, 0.1273040771484375, 0.13326644897460938, 0.13922882080078125, 0.14519119262695312, 0.151153564453125, 0.15711593627929688, 0.16307830810546875, 0.16904067993164062, 0.1750030517578125, 0.18096542358398438, 0.18692779541015625, 0.19289016723632812, 0.1988525390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 5.0, 5.0, 15.0, 12.0, 15.0, 19.0, 41.0, 59.0, 103.0, 197.0, 572.0, 2089.0, 26256.0, 1006044.0, 10960.0, 1366.0, 418.0, 152.0, 76.0, 44.0, 31.0, 17.0, 14.0, 11.0, 12.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3192901611328125, -1.277252197265625, -1.2352142333984375, -1.19317626953125, -1.1511383056640625, -1.109100341796875, -1.0670623779296875, -1.0250244140625, -0.9829864501953125, -0.940948486328125, -0.8989105224609375, -0.85687255859375, -0.8148345947265625, -0.772796630859375, -0.7307586669921875, -0.688720703125, -0.6466827392578125, -0.604644775390625, -0.5626068115234375, -0.52056884765625, -0.4785308837890625, -0.436492919921875, -0.3944549560546875, -0.3524169921875, -0.3103790283203125, -0.268341064453125, -0.2263031005859375, -0.18426513671875, -0.1422271728515625, -0.100189208984375, -0.0581512451171875, -0.01611328125, 0.0259246826171875, 0.067962646484375, 0.1100006103515625, 0.15203857421875, 0.1940765380859375, 0.236114501953125, 0.2781524658203125, 0.3201904296875, 0.3622283935546875, 0.404266357421875, 0.4463043212890625, 0.48834228515625, 0.5303802490234375, 0.572418212890625, 0.6144561767578125, 0.656494140625, 0.6985321044921875, 0.740570068359375, 0.7826080322265625, 0.82464599609375, 0.8666839599609375, 0.908721923828125, 0.9507598876953125, 0.9927978515625, 1.0348358154296875, 1.076873779296875, 1.1189117431640625, 1.16094970703125, 1.2029876708984375, 1.245025634765625, 1.2870635986328125, 1.3291015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 3.0, 8.0, 5.0, 11.0, 15.0, 18.0, 17.0, 31.0, 34.0, 73.0, 85.0, 98.0, 119.0, 117.0, 103.0, 54.0, 44.0, 29.0, 32.0, 18.0, 26.0, 9.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.479024887084961e-05, -6.268173456192017e-05, -6.057322025299072e-05, -5.846470594406128e-05, -5.6356191635131836e-05, -5.424767732620239e-05, -5.213916301727295e-05, -5.0030648708343506e-05, -4.792213439941406e-05, -4.581362009048462e-05, -4.3705105781555176e-05, -4.159659147262573e-05, -3.948807716369629e-05, -3.7379562854766846e-05, -3.52710485458374e-05, -3.316253423690796e-05, -3.1054019927978516e-05, -2.8945505619049072e-05, -2.683699131011963e-05, -2.4728477001190186e-05, -2.2619962692260742e-05, -2.05114483833313e-05, -1.8402934074401855e-05, -1.6294419765472412e-05, -1.4185905456542969e-05, -1.2077391147613525e-05, -9.968876838684082e-06, -7.860362529754639e-06, -5.751848220825195e-06, -3.643333911895752e-06, -1.5348196029663086e-06, 5.736947059631348e-07, 2.682209014892578e-06, 4.7907233238220215e-06, 6.899237632751465e-06, 9.007751941680908e-06, 1.1116266250610352e-05, 1.3224780559539795e-05, 1.5333294868469238e-05, 1.744180917739868e-05, 1.9550323486328125e-05, 2.165883779525757e-05, 2.3767352104187012e-05, 2.5875866413116455e-05, 2.79843807220459e-05, 3.0092895030975342e-05, 3.2201409339904785e-05, 3.430992364883423e-05, 3.641843795776367e-05, 3.8526952266693115e-05, 4.063546657562256e-05, 4.2743980884552e-05, 4.4852495193481445e-05, 4.696100950241089e-05, 4.906952381134033e-05, 5.1178038120269775e-05, 5.328655242919922e-05, 5.539506673812866e-05, 5.7503581047058105e-05, 5.961209535598755e-05, 6.172060966491699e-05, 6.382912397384644e-05, 6.593763828277588e-05, 6.804615259170532e-05, 7.015466690063477e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 6.0, 19.0, 24.0, 24.0, 54.0, 68.0, 93.0, 145.0, 196.0, 254.0, 458.0, 656.0, 997.0, 1659.0, 2670.0, 4762.0, 9175.0, 22628.0, 170903.0, 732382.0, 69011.0, 15628.0, 7165.0, 3706.0, 2121.0, 1272.0, 826.0, 533.0, 342.0, 235.0, 147.0, 130.0, 80.0, 43.0, 30.0, 31.0, 16.0, 16.0, 12.0, 7.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.402099609375, -0.3892631530761719, -0.37642669677734375, -0.3635902404785156, -0.3507537841796875, -0.3379173278808594, -0.32508087158203125, -0.3122444152832031, -0.299407958984375, -0.2865715026855469, -0.27373504638671875, -0.2608985900878906, -0.2480621337890625, -0.23522567749023438, -0.22238922119140625, -0.20955276489257812, -0.19671630859375, -0.18387985229492188, -0.17104339599609375, -0.15820693969726562, -0.1453704833984375, -0.13253402709960938, -0.11969757080078125, -0.10686111450195312, -0.094024658203125, -0.08118820190429688, -0.06835174560546875, -0.055515289306640625, -0.0426788330078125, -0.029842376708984375, -0.01700592041015625, -0.004169464111328125, 0.0086669921875, 0.021503448486328125, 0.03433990478515625, 0.047176361083984375, 0.0600128173828125, 0.07284927368164062, 0.08568572998046875, 0.09852218627929688, 0.111358642578125, 0.12419509887695312, 0.13703155517578125, 0.14986801147460938, 0.1627044677734375, 0.17554092407226562, 0.18837738037109375, 0.20121383666992188, 0.21405029296875, 0.22688674926757812, 0.23972320556640625, 0.2525596618652344, 0.2653961181640625, 0.2782325744628906, 0.29106903076171875, 0.3039054870605469, 0.316741943359375, 0.3295783996582031, 0.34241485595703125, 0.3552513122558594, 0.3680877685546875, 0.3809242248535156, 0.39376068115234375, 0.4065971374511719, 0.41943359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 6.0, 14.0, 15.0, 26.0, 64.0, 124.0, 211.0, 201.0, 151.0, 72.0, 20.0, 15.0, 12.0, 10.0, 5.0, 6.0, 8.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.4139518737792969, -0.39968109130859375, -0.3854103088378906, -0.3711395263671875, -0.3568687438964844, -0.34259796142578125, -0.3283271789550781, -0.314056396484375, -0.2997856140136719, -0.28551483154296875, -0.2712440490722656, -0.2569732666015625, -0.24270248413085938, -0.22843170166015625, -0.21416091918945312, -0.19989013671875, -0.18561935424804688, -0.17134857177734375, -0.15707778930664062, -0.1428070068359375, -0.12853622436523438, -0.11426544189453125, -0.09999465942382812, -0.085723876953125, -0.07145309448242188, -0.05718231201171875, -0.042911529541015625, -0.0286407470703125, -0.014369964599609375, -9.918212890625e-05, 0.014171600341796875, 0.0284423828125, 0.042713165283203125, 0.05698394775390625, 0.07125473022460938, 0.0855255126953125, 0.09979629516601562, 0.11406707763671875, 0.12833786010742188, 0.142608642578125, 0.15687942504882812, 0.17115020751953125, 0.18542098999023438, 0.1996917724609375, 0.21396255493164062, 0.22823333740234375, 0.24250411987304688, 0.25677490234375, 0.2710456848144531, 0.28531646728515625, 0.2995872497558594, 0.3138580322265625, 0.3281288146972656, 0.34239959716796875, 0.3566703796386719, 0.370941162109375, 0.3852119445800781, 0.39948272705078125, 0.4137535095214844, 0.4280242919921875, 0.4422950744628906, 0.45656585693359375, 0.4708366394042969, 0.485107421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 13.0, 14.0, 18.0, 41.0, 88.0, 172.0, 232.0, 189.0, 87.0, 48.0, 39.0, 15.0, 6.0, 10.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7499608993530273, -1.6612286567687988, -1.5724964141845703, -1.4837641716003418, -1.3950319290161133, -1.3062996864318848, -1.2175674438476562, -1.1288352012634277, -1.0401029586791992, -0.9513707160949707, -0.8626384735107422, -0.7739062309265137, -0.6851739883422852, -0.5964417457580566, -0.5077094435691833, -0.41897720098495483, -0.33024489879608154, -0.24151265621185303, -0.15278039872646332, -0.06404814124107361, 0.024684101343154907, 0.11341634392738342, 0.20214861631393433, 0.29088085889816284, 0.37961310148239136, 0.4683453440666199, 0.5570775866508484, 0.6458098888397217, 0.7345421314239502, 0.8232743740081787, 0.9120066165924072, 1.0007388591766357, 1.0894711017608643, 1.1782033443450928, 1.2669355869293213, 1.3556678295135498, 1.4444000720977783, 1.5331323146820068, 1.6218645572662354, 1.7105967998504639, 1.7993290424346924, 1.888061285018921, 1.9767935276031494, 2.065525770187378, 2.1542580127716064, 2.242990255355835, 2.3317224979400635, 2.420454740524292, 2.5091872215270996, 2.597919464111328, 2.6866517066955566, 2.775383949279785, 2.8641161918640137, 2.952848434448242, 3.0415806770324707, 3.130312919616699, 3.2190451622009277, 3.3077774047851562, 3.3965096473693848, 3.4852418899536133, 3.573974132537842, 3.6627063751220703, 3.751438617706299, 3.8401708602905273, 3.928903102874756]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 12.0, 7.0, 12.0, 17.0, 35.0, 38.0, 43.0, 78.0, 84.0, 97.0, 95.0, 112.0, 95.0, 68.0, 46.0, 39.0, 31.0, 21.0, 14.0, 11.0, 10.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0156478881835938, -2.9194695949554443, -2.823291301727295, -2.7271127700805664, -2.630934476852417, -2.5347561836242676, -2.438577890396118, -2.3423995971679688, -2.2462210655212402, -2.150042772293091, -2.0538644790649414, -1.9576860666275024, -1.8615076541900635, -1.765329360961914, -1.6691510677337646, -1.5729726552963257, -1.4767943620681763, -1.3806160688400269, -1.284437656402588, -1.1882593631744385, -1.0920809507369995, -0.9959026575088501, -0.8997243046760559, -0.8035459518432617, -0.7073675990104675, -0.6111892461776733, -0.5150108933448792, -0.41883257031440735, -0.32265421748161316, -0.22647586464881897, -0.13029754161834717, -0.03411918878555298, 0.06205916404724121, 0.1582375168800354, 0.2544158697128296, 0.3505941927433014, 0.4467725455760956, 0.5429508686065674, 0.6391292214393616, 0.7353075742721558, 0.83148592710495, 0.9276642799377441, 1.0238425731658936, 1.1200209856033325, 1.216199278831482, 1.312377691268921, 1.4085559844970703, 1.5047342777252197, 1.6009126901626587, 1.697090983390808, 1.793269395828247, 1.8894476890563965, 1.9856261014938354, 2.0818045139312744, 2.177982807159424, 2.2741611003875732, 2.3703393936157227, 2.466517686843872, 2.5626959800720215, 2.65887451171875, 2.7550528049468994, 2.851231098175049, 2.9474093914031982, 3.0435876846313477, 3.139766216278076]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 8.0, 8.0, 8.0, 15.0, 22.0, 23.0, 42.0, 45.0, 63.0, 73.0, 120.0, 138.0, 225.0, 271.0, 404.0, 514.0, 802.0, 1154.0, 1748.0, 2934.0, 5463.0, 11340.0, 29159.0, 127369.0, 3656487.0, 281260.0, 42271.0, 14787.0, 6792.0, 3657.0, 2175.0, 1383.0, 970.0, 695.0, 486.0, 374.0, 278.0, 195.0, 129.0, 109.0, 78.0, 49.0, 46.0, 35.0, 24.0, 12.0, 10.0, 5.0, 8.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7509765625, -0.7279815673828125, -0.704986572265625, -0.6819915771484375, -0.65899658203125, -0.6360015869140625, -0.613006591796875, -0.5900115966796875, -0.5670166015625, -0.5440216064453125, -0.521026611328125, -0.4980316162109375, -0.47503662109375, -0.4520416259765625, -0.429046630859375, -0.4060516357421875, -0.383056640625, -0.3600616455078125, -0.337066650390625, -0.3140716552734375, -0.29107666015625, -0.2680816650390625, -0.245086669921875, -0.2220916748046875, -0.1990966796875, -0.1761016845703125, -0.153106689453125, -0.1301116943359375, -0.10711669921875, -0.0841217041015625, -0.061126708984375, -0.0381317138671875, -0.01513671875, 0.0078582763671875, 0.030853271484375, 0.0538482666015625, 0.07684326171875, 0.0998382568359375, 0.122833251953125, 0.1458282470703125, 0.1688232421875, 0.1918182373046875, 0.214813232421875, 0.2378082275390625, 0.26080322265625, 0.2837982177734375, 0.306793212890625, 0.3297882080078125, 0.352783203125, 0.3757781982421875, 0.398773193359375, 0.4217681884765625, 0.44476318359375, 0.4677581787109375, 0.490753173828125, 0.5137481689453125, 0.5367431640625, 0.5597381591796875, 0.582733154296875, 0.6057281494140625, 0.62872314453125, 0.6517181396484375, 0.674713134765625, 0.6977081298828125, 0.720703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 8.0, 10.0, 7.0, 7.0, 17.0, 15.0, 23.0, 45.0, 46.0, 75.0, 73.0, 89.0, 99.0, 100.0, 80.0, 68.0, 54.0, 26.0, 30.0, 15.0, 14.0, 14.0, 15.0, 5.0, 8.0, 4.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0604248046875, -0.05862998962402344, -0.056835174560546875, -0.05504035949707031, -0.05324554443359375, -0.05145072937011719, -0.049655914306640625, -0.04786109924316406, -0.0460662841796875, -0.04427146911621094, -0.042476654052734375, -0.04068183898925781, -0.03888702392578125, -0.03709220886230469, -0.035297393798828125, -0.03350257873535156, -0.031707763671875, -0.029912948608398438, -0.028118133544921875, -0.026323318481445312, -0.02452850341796875, -0.022733688354492188, -0.020938873291015625, -0.019144058227539062, -0.0173492431640625, -0.015554428100585938, -0.013759613037109375, -0.011964797973632812, -0.01016998291015625, -0.008375167846679688, -0.006580352783203125, -0.0047855377197265625, -0.00299072265625, -0.0011959075927734375, 0.000598907470703125, 0.0023937225341796875, 0.00418853759765625, 0.0059833526611328125, 0.007778167724609375, 0.009572982788085938, 0.0113677978515625, 0.013162612915039062, 0.014957427978515625, 0.016752243041992188, 0.01854705810546875, 0.020341873168945312, 0.022136688232421875, 0.023931503295898438, 0.025726318359375, 0.027521133422851562, 0.029315948486328125, 0.031110763549804688, 0.03290557861328125, 0.03470039367675781, 0.036495208740234375, 0.03829002380371094, 0.0400848388671875, 0.04187965393066406, 0.043674468994140625, 0.04546928405761719, 0.04726409912109375, 0.04905891418457031, 0.050853729248046875, 0.05264854431152344, 0.054443359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 6.0, 7.0, 17.0, 21.0, 48.0, 78.0, 189.0, 707.0, 6484.0, 4006361.0, 177178.0, 2511.0, 396.0, 122.0, 73.0, 31.0, 11.0, 15.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.1962890625, -2.095703125, -1.9951171875, -1.89453125, -1.7939453125, -1.693359375, -1.5927734375, -1.4921875, -1.3916015625, -1.291015625, -1.1904296875, -1.08984375, -0.9892578125, -0.888671875, -0.7880859375, -0.6875, -0.5869140625, -0.486328125, -0.3857421875, -0.28515625, -0.1845703125, -0.083984375, 0.0166015625, 0.1171875, 0.2177734375, 0.318359375, 0.4189453125, 0.51953125, 0.6201171875, 0.720703125, 0.8212890625, 0.921875, 1.0224609375, 1.123046875, 1.2236328125, 1.32421875, 1.4248046875, 1.525390625, 1.6259765625, 1.7265625, 1.8271484375, 1.927734375, 2.0283203125, 2.12890625, 2.2294921875, 2.330078125, 2.4306640625, 2.53125, 2.6318359375, 2.732421875, 2.8330078125, 2.93359375, 3.0341796875, 3.134765625, 3.2353515625, 3.3359375, 3.4365234375, 3.537109375, 3.6376953125, 3.73828125, 3.8388671875, 3.939453125, 4.0400390625, 4.140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 14.0, 17.0, 21.0, 49.0, 93.0, 179.0, 503.0, 2112.0, 636.0, 191.0, 99.0, 56.0, 33.0, 20.0, 8.0, 10.0, 5.0, 6.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.300537109375, -0.2936420440673828, -0.2867469787597656, -0.27985191345214844, -0.27295684814453125, -0.26606178283691406, -0.2591667175292969, -0.2522716522216797, -0.2453765869140625, -0.2384815216064453, -0.23158645629882812, -0.22469139099121094, -0.21779632568359375, -0.21090126037597656, -0.20400619506835938, -0.1971111297607422, -0.190216064453125, -0.1833209991455078, -0.17642593383789062, -0.16953086853027344, -0.16263580322265625, -0.15574073791503906, -0.14884567260742188, -0.1419506072998047, -0.1350555419921875, -0.1281604766845703, -0.12126541137695312, -0.11437034606933594, -0.10747528076171875, -0.10058021545410156, -0.09368515014648438, -0.08679008483886719, -0.07989501953125, -0.07299995422363281, -0.06610488891601562, -0.05920982360839844, -0.05231475830078125, -0.04541969299316406, -0.038524627685546875, -0.03162956237792969, -0.0247344970703125, -0.017839431762695312, -0.010944366455078125, -0.0040493011474609375, 0.00284576416015625, 0.009740829467773438, 0.016635894775390625, 0.023530960083007812, 0.030426025390625, 0.03732109069824219, 0.044216156005859375, 0.05111122131347656, 0.05800628662109375, 0.06490135192871094, 0.07179641723632812, 0.07869148254394531, 0.0855865478515625, 0.09248161315917969, 0.09937667846679688, 0.10627174377441406, 0.11316680908203125, 0.12006187438964844, 0.12695693969726562, 0.1338520050048828, 0.1407470703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 15.0, 32.0, 49.0, 103.0, 197.0, 264.0, 181.0, 85.0, 30.0, 16.0, 4.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7906152606010437, -0.7568397521972656, -0.7230641841888428, -0.6892886757850647, -0.6555131673812866, -0.6217376589775085, -0.5879621505737305, -0.5541865825653076, -0.5204110741615295, -0.48663556575775146, -0.452860027551651, -0.41908448934555054, -0.38530898094177246, -0.3515334725379944, -0.3177579343318939, -0.28398239612579346, -0.2502068877220154, -0.2164313644170761, -0.18265584111213684, -0.14888031780719757, -0.1151047945022583, -0.08132927119731903, -0.04755374789237976, -0.01377822458744049, 0.01999729871749878, 0.05377282202243805, 0.08754834532737732, 0.12132386863231659, 0.15509939193725586, 0.18887491524219513, 0.2226504385471344, 0.25642597675323486, 0.29020142555236816, 0.32397693395614624, 0.3577524721622467, 0.39152801036834717, 0.42530351877212524, 0.4590790271759033, 0.4928545653820038, 0.5266301035881042, 0.5604056119918823, 0.5941811203956604, 0.6279566287994385, 0.6617321968078613, 0.6955077052116394, 0.7292832136154175, 0.7630587816238403, 0.7968342900276184, 0.8306097984313965, 0.8643853068351746, 0.8981608152389526, 0.9319363832473755, 0.9657118916511536, 0.9994874000549316, 1.0332629680633545, 1.0670384168624878, 1.1008139848709106, 1.1345895528793335, 1.1683650016784668, 1.2021405696868896, 1.2359161376953125, 1.2696915864944458, 1.3034671545028687, 1.337242603302002, 1.3710181713104248]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 8.0, 15.0, 17.0, 28.0, 29.0, 42.0, 56.0, 77.0, 85.0, 109.0, 98.0, 75.0, 73.0, 75.0, 57.0, 36.0, 35.0, 20.0, 14.0, 12.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0533130168914795, -1.0257294178009033, -0.9981458187103271, -0.970562219619751, -0.9429786205291748, -0.9153950214385986, -0.8878114223480225, -0.8602278232574463, -0.8326442241668701, -0.805060625076294, -0.7774770259857178, -0.7498934268951416, -0.7223098278045654, -0.6947262287139893, -0.6671426296234131, -0.6395590305328369, -0.6119754910469055, -0.5843918919563293, -0.5568082928657532, -0.529224693775177, -0.5016410946846008, -0.47405749559402466, -0.4464739263057709, -0.4188903272151947, -0.39130672812461853, -0.36372312903404236, -0.3361395299434662, -0.3085559606552124, -0.28097236156463623, -0.25338876247406006, -0.2258051633834839, -0.19822156429290771, -0.17063796520233154, -0.14305436611175537, -0.1154707744717598, -0.08788718283176422, -0.06030358374118805, -0.03271998465061188, -0.005136400461196899, 0.022447198629379272, 0.050030797719955444, 0.07761439681053162, 0.10519798845052719, 0.13278158009052277, 0.16036517918109894, 0.1879487782716751, 0.2155323624610901, 0.24311596155166626, 0.27069956064224243, 0.2982831597328186, 0.3258667588233948, 0.35345035791397095, 0.3810339570045471, 0.4086175560951233, 0.4362011253833771, 0.46378472447395325, 0.4913683235645294, 0.5189518928527832, 0.5465354919433594, 0.5741190910339355, 0.6017026901245117, 0.6292862892150879, 0.6568698883056641, 0.6844534873962402, 0.7120370864868164]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 5.0, 7.0, 6.0, 7.0, 15.0, 20.0, 18.0, 12.0, 20.0, 28.0, 22.0, 36.0, 36.0, 43.0, 68.0, 128.0, 480.0, 4972.0, 621346.0, 416257.0, 4107.0, 487.0, 117.0, 58.0, 46.0, 26.0, 32.0, 30.0, 30.0, 25.0, 15.0, 10.0, 8.0, 9.0, 8.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7392578125, -1.68121337890625, -1.6231689453125, -1.56512451171875, -1.507080078125, -1.44903564453125, -1.3909912109375, -1.33294677734375, -1.27490234375, -1.21685791015625, -1.1588134765625, -1.10076904296875, -1.042724609375, -0.98468017578125, -0.9266357421875, -0.86859130859375, -0.810546875, -0.75250244140625, -0.6944580078125, -0.63641357421875, -0.578369140625, -0.52032470703125, -0.4622802734375, -0.40423583984375, -0.34619140625, -0.28814697265625, -0.2301025390625, -0.17205810546875, -0.114013671875, -0.05596923828125, 0.0020751953125, 0.06011962890625, 0.1181640625, 0.17620849609375, 0.2342529296875, 0.29229736328125, 0.350341796875, 0.40838623046875, 0.4664306640625, 0.52447509765625, 0.58251953125, 0.64056396484375, 0.6986083984375, 0.75665283203125, 0.814697265625, 0.87274169921875, 0.9307861328125, 0.98883056640625, 1.046875, 1.10491943359375, 1.1629638671875, 1.22100830078125, 1.279052734375, 1.33709716796875, 1.3951416015625, 1.45318603515625, 1.51123046875, 1.56927490234375, 1.6273193359375, 1.68536376953125, 1.743408203125, 1.80145263671875, 1.8594970703125, 1.91754150390625, 1.9755859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 11.0, 52.0, 126.0, 271.0, 307.0, 157.0, 51.0, 18.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.32373046875, -0.3176288604736328, -0.3115272521972656, -0.30542564392089844, -0.29932403564453125, -0.29322242736816406, -0.2871208190917969, -0.2810192108154297, -0.2749176025390625, -0.2688159942626953, -0.2627143859863281, -0.25661277770996094, -0.25051116943359375, -0.24440956115722656, -0.23830795288085938, -0.2322063446044922, -0.226104736328125, -0.2200031280517578, -0.21390151977539062, -0.20779991149902344, -0.20169830322265625, -0.19559669494628906, -0.18949508666992188, -0.1833934783935547, -0.1772918701171875, -0.1711902618408203, -0.16508865356445312, -0.15898704528808594, -0.15288543701171875, -0.14678382873535156, -0.14068222045898438, -0.1345806121826172, -0.12847900390625, -0.12237739562988281, -0.11627578735351562, -0.11017417907714844, -0.10407257080078125, -0.09797096252441406, -0.09186935424804688, -0.08576774597167969, -0.0796661376953125, -0.07356452941894531, -0.06746292114257812, -0.06136131286621094, -0.05525970458984375, -0.04915809631347656, -0.043056488037109375, -0.03695487976074219, -0.030853271484375, -0.024751663208007812, -0.018650054931640625, -0.012548446655273438, -0.00644683837890625, -0.0003452301025390625, 0.005756378173828125, 0.011857986450195312, 0.0179595947265625, 0.024061203002929688, 0.030162811279296875, 0.03626441955566406, 0.04236602783203125, 0.04846763610839844, 0.054569244384765625, 0.06067085266113281, 0.0667724609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 11.0, 11.0, 13.0, 11.0, 23.0, 30.0, 39.0, 64.0, 58.0, 90.0, 159.0, 271.0, 457.0, 962.0, 2161.0, 5278.0, 14657.0, 44481.0, 168924.0, 480036.0, 239904.0, 60565.0, 18618.0, 6506.0, 2618.0, 1225.0, 542.0, 294.0, 165.0, 99.0, 79.0, 46.0, 39.0, 32.0, 27.0, 15.0, 10.0, 9.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455322265625, -0.4399528503417969, -0.42458343505859375, -0.4092140197753906, -0.3938446044921875, -0.3784751892089844, -0.36310577392578125, -0.3477363586425781, -0.332366943359375, -0.3169975280761719, -0.30162811279296875, -0.2862586975097656, -0.2708892822265625, -0.2555198669433594, -0.24015045166015625, -0.22478103637695312, -0.20941162109375, -0.19404220581054688, -0.17867279052734375, -0.16330337524414062, -0.1479339599609375, -0.13256454467773438, -0.11719512939453125, -0.10182571411132812, -0.086456298828125, -0.07108688354492188, -0.05571746826171875, -0.040348052978515625, -0.0249786376953125, -0.009609222412109375, 0.00576019287109375, 0.021129608154296875, 0.0364990234375, 0.051868438720703125, 0.06723785400390625, 0.08260726928710938, 0.0979766845703125, 0.11334609985351562, 0.12871551513671875, 0.14408493041992188, 0.159454345703125, 0.17482376098632812, 0.19019317626953125, 0.20556259155273438, 0.2209320068359375, 0.23630142211914062, 0.25167083740234375, 0.2670402526855469, 0.28240966796875, 0.2977790832519531, 0.31314849853515625, 0.3285179138183594, 0.3438873291015625, 0.3592567443847656, 0.37462615966796875, 0.3899955749511719, 0.405364990234375, 0.4207344055175781, 0.43610382080078125, 0.4514732360839844, 0.4668426513671875, 0.4822120666503906, 0.49758148193359375, 0.5129508972167969, 0.5283203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 5.0, 6.0, 10.0, 5.0, 13.0, 11.0, 13.0, 9.0, 21.0, 24.0, 25.0, 31.0, 40.0, 35.0, 28.0, 37.0, 46.0, 53.0, 43.0, 49.0, 41.0, 47.0, 45.0, 40.0, 44.0, 43.0, 31.0, 37.0, 26.0, 26.0, 27.0, 15.0, 14.0, 12.0, 12.0, 12.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.303466796875, -0.2940330505371094, -0.28459930419921875, -0.2751655578613281, -0.2657318115234375, -0.2562980651855469, -0.24686431884765625, -0.23743057250976562, -0.227996826171875, -0.21856307983398438, -0.20912933349609375, -0.19969558715820312, -0.1902618408203125, -0.18082809448242188, -0.17139434814453125, -0.16196060180664062, -0.15252685546875, -0.14309310913085938, -0.13365936279296875, -0.12422561645507812, -0.1147918701171875, -0.10535812377929688, -0.09592437744140625, -0.08649063110351562, -0.077056884765625, -0.06762313842773438, -0.05818939208984375, -0.048755645751953125, -0.0393218994140625, -0.029888153076171875, -0.02045440673828125, -0.011020660400390625, -0.0015869140625, 0.007846832275390625, 0.01728057861328125, 0.026714324951171875, 0.0361480712890625, 0.045581817626953125, 0.05501556396484375, 0.06444931030273438, 0.073883056640625, 0.08331680297851562, 0.09275054931640625, 0.10218429565429688, 0.1116180419921875, 0.12105178833007812, 0.13048553466796875, 0.13991928100585938, 0.14935302734375, 0.15878677368164062, 0.16822052001953125, 0.17765426635742188, 0.1870880126953125, 0.19652175903320312, 0.20595550537109375, 0.21538925170898438, 0.224822998046875, 0.23425674438476562, 0.24369049072265625, 0.2531242370605469, 0.2625579833984375, 0.2719917297363281, 0.28142547607421875, 0.2908592224121094, 0.30029296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 6.0, 4.0, 15.0, 18.0, 24.0, 39.0, 71.0, 126.0, 206.0, 372.0, 811.0, 2125.0, 7493.0, 39120.0, 376623.0, 548305.0, 58624.0, 9966.0, 2592.0, 1003.0, 452.0, 247.0, 107.0, 81.0, 35.0, 34.0, 14.0, 12.0, 8.0, 6.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.44873046875, -0.4338226318359375, -0.418914794921875, -0.4040069580078125, -0.38909912109375, -0.3741912841796875, -0.359283447265625, -0.3443756103515625, -0.3294677734375, -0.3145599365234375, -0.299652099609375, -0.2847442626953125, -0.26983642578125, -0.2549285888671875, -0.240020751953125, -0.2251129150390625, -0.210205078125, -0.1952972412109375, -0.180389404296875, -0.1654815673828125, -0.15057373046875, -0.1356658935546875, -0.120758056640625, -0.1058502197265625, -0.0909423828125, -0.0760345458984375, -0.061126708984375, -0.0462188720703125, -0.03131103515625, -0.0164031982421875, -0.001495361328125, 0.0134124755859375, 0.0283203125, 0.0432281494140625, 0.058135986328125, 0.0730438232421875, 0.08795166015625, 0.1028594970703125, 0.117767333984375, 0.1326751708984375, 0.1475830078125, 0.1624908447265625, 0.177398681640625, 0.1923065185546875, 0.20721435546875, 0.2221221923828125, 0.237030029296875, 0.2519378662109375, 0.266845703125, 0.2817535400390625, 0.296661376953125, 0.3115692138671875, 0.32647705078125, 0.3413848876953125, 0.356292724609375, 0.3712005615234375, 0.3861083984375, 0.4010162353515625, 0.415924072265625, 0.4308319091796875, 0.44573974609375, 0.4606475830078125, 0.475555419921875, 0.4904632568359375, 0.50537109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 8.0, 14.0, 11.0, 13.0, 15.0, 27.0, 36.0, 37.0, 48.0, 65.0, 68.0, 72.0, 75.0, 74.0, 69.0, 49.0, 57.0, 43.0, 40.0, 22.0, 33.0, 28.0, 19.0, 10.0, 13.0, 10.0, 6.0, 9.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.266334533691406e-05, -3.144238144159317e-05, -3.0221417546272278e-05, -2.9000453650951385e-05, -2.7779489755630493e-05, -2.65585258603096e-05, -2.533756196498871e-05, -2.4116598069667816e-05, -2.2895634174346924e-05, -2.167467027902603e-05, -2.045370638370514e-05, -1.9232742488384247e-05, -1.8011778593063354e-05, -1.6790814697742462e-05, -1.556985080242157e-05, -1.4348886907100677e-05, -1.3127923011779785e-05, -1.1906959116458893e-05, -1.0685995221138e-05, -9.465031325817108e-06, -8.244067430496216e-06, -7.0231035351753235e-06, -5.802139639854431e-06, -4.581175744533539e-06, -3.3602118492126465e-06, -2.139247953891754e-06, -9.182840585708618e-07, 3.026798367500305e-07, 1.5236437320709229e-06, 2.744607627391815e-06, 3.9655715227127075e-06, 5.1865354180336e-06, 6.407499313354492e-06, 7.6284632086753845e-06, 8.849427103996277e-06, 1.007039099931717e-05, 1.1291354894638062e-05, 1.2512318789958954e-05, 1.3733282685279846e-05, 1.4954246580600739e-05, 1.617521047592163e-05, 1.7396174371242523e-05, 1.8617138266563416e-05, 1.9838102161884308e-05, 2.10590660572052e-05, 2.2280029952526093e-05, 2.3500993847846985e-05, 2.4721957743167877e-05, 2.594292163848877e-05, 2.7163885533809662e-05, 2.8384849429130554e-05, 2.9605813324451447e-05, 3.082677721977234e-05, 3.204774111509323e-05, 3.3268705010414124e-05, 3.4489668905735016e-05, 3.571063280105591e-05, 3.69315966963768e-05, 3.815256059169769e-05, 3.9373524487018585e-05, 4.059448838233948e-05, 4.181545227766037e-05, 4.303641617298126e-05, 4.4257380068302155e-05, 4.547834396362305e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 10.0, 7.0, 17.0, 23.0, 37.0, 59.0, 106.0, 219.0, 402.0, 769.0, 1852.0, 4938.0, 16722.0, 88881.0, 640518.0, 246410.0, 33682.0, 8567.0, 2928.0, 1226.0, 536.0, 276.0, 151.0, 89.0, 41.0, 36.0, 16.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.68115234375, -0.6644287109375, -0.647705078125, -0.6309814453125, -0.6142578125, -0.5975341796875, -0.580810546875, -0.5640869140625, -0.54736328125, -0.5306396484375, -0.513916015625, -0.4971923828125, -0.48046875, -0.4637451171875, -0.447021484375, -0.4302978515625, -0.41357421875, -0.3968505859375, -0.380126953125, -0.3634033203125, -0.3466796875, -0.3299560546875, -0.313232421875, -0.2965087890625, -0.27978515625, -0.2630615234375, -0.246337890625, -0.2296142578125, -0.212890625, -0.1961669921875, -0.179443359375, -0.1627197265625, -0.14599609375, -0.1292724609375, -0.112548828125, -0.0958251953125, -0.0791015625, -0.0623779296875, -0.045654296875, -0.0289306640625, -0.01220703125, 0.0045166015625, 0.021240234375, 0.0379638671875, 0.0546875, 0.0714111328125, 0.088134765625, 0.1048583984375, 0.12158203125, 0.1383056640625, 0.155029296875, 0.1717529296875, 0.1884765625, 0.2052001953125, 0.221923828125, 0.2386474609375, 0.25537109375, 0.2720947265625, 0.288818359375, 0.3055419921875, 0.322265625, 0.3389892578125, 0.355712890625, 0.3724365234375, 0.38916015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 8.0, 4.0, 8.0, 11.0, 15.0, 21.0, 41.0, 60.0, 86.0, 100.0, 92.0, 108.0, 121.0, 99.0, 72.0, 42.0, 32.0, 19.0, 19.0, 14.0, 8.0, 9.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349853515625, -0.3402214050292969, -0.33058929443359375, -0.3209571838378906, -0.3113250732421875, -0.3016929626464844, -0.29206085205078125, -0.2824287414550781, -0.272796630859375, -0.2631645202636719, -0.25353240966796875, -0.24390029907226562, -0.2342681884765625, -0.22463607788085938, -0.21500396728515625, -0.20537185668945312, -0.19573974609375, -0.18610763549804688, -0.17647552490234375, -0.16684341430664062, -0.1572113037109375, -0.14757919311523438, -0.13794708251953125, -0.12831497192382812, -0.118682861328125, -0.10905075073242188, -0.09941864013671875, -0.08978652954101562, -0.0801544189453125, -0.07052230834960938, -0.06089019775390625, -0.051258087158203125, -0.0416259765625, -0.031993865966796875, -0.02236175537109375, -0.012729644775390625, -0.0030975341796875, 0.006534576416015625, 0.01616668701171875, 0.025798797607421875, 0.035430908203125, 0.045063018798828125, 0.05469512939453125, 0.06432723999023438, 0.0739593505859375, 0.08359146118164062, 0.09322357177734375, 0.10285568237304688, 0.11248779296875, 0.12211990356445312, 0.13175201416015625, 0.14138412475585938, 0.1510162353515625, 0.16064834594726562, 0.17028045654296875, 0.17991256713867188, 0.189544677734375, 0.19917678833007812, 0.20880889892578125, 0.21844100952148438, 0.2280731201171875, 0.23770523071289062, 0.24733734130859375, 0.2569694519042969, 0.2666015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 15.0, 56.0, 285.0, 366.0, 167.0, 63.0, 20.0, 9.0, 10.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.080022811889648, -9.851767539978027, -9.623512268066406, -9.395256996154785, -9.167001724243164, -8.93874740600586, -8.710491180419922, -8.482236862182617, -8.253981590270996, -8.025726318359375, -7.797471046447754, -7.569215774536133, -7.34096097946167, -7.112705707550049, -6.884450435638428, -6.656195163726807, -6.4279398918151855, -6.1996846199035645, -5.971429347991943, -5.7431745529174805, -5.514919281005859, -5.286664009094238, -5.058408737182617, -4.830153465270996, -4.601898193359375, -4.373642921447754, -4.145387649536133, -3.917132616043091, -3.688877582550049, -3.4606223106384277, -3.2323670387268066, -3.0041117668151855, -2.775857448577881, -2.5476021766662598, -2.3193471431732178, -2.0910918712615967, -1.8628367185592651, -1.6345815658569336, -1.4063262939453125, -1.178071141242981, -0.9498159885406494, -0.7215608358383179, -0.49330562353134155, -0.26505041122436523, -0.03679525852203369, 0.19145989418029785, 0.41971516609191895, 0.6479703187942505, 0.876225471496582, 1.1044806241989136, 1.3327357769012451, 1.5609910488128662, 1.7892462015151978, 2.0175013542175293, 2.2457566261291504, 2.4740118980407715, 2.7022669315338135, 2.9305222034454346, 3.1587772369384766, 3.3870325088500977, 3.6152877807617188, 3.8435428142547607, 4.071798324584961, 4.300053119659424, 4.528308391571045]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 9.0, 5.0, 9.0, 11.0, 23.0, 25.0, 34.0, 42.0, 51.0, 48.0, 58.0, 53.0, 57.0, 68.0, 67.0, 66.0, 68.0, 42.0, 49.0, 31.0, 35.0, 38.0, 20.0, 15.0, 18.0, 17.0, 12.0, 7.0, 6.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3112001419067383, -3.2188661098480225, -3.1265320777893066, -3.034198045730591, -2.941864013671875, -2.849529981613159, -2.7571959495544434, -2.6648621559143066, -2.5725278854370117, -2.480193853378296, -2.38785982131958, -2.2955257892608643, -2.2031917572021484, -2.1108577251434326, -2.018523693084717, -1.9261897802352905, -1.8338558673858643, -1.7415218353271484, -1.6491878032684326, -1.5568537712097168, -1.464519739151001, -1.3721857070922852, -1.2798517942428589, -1.187517762184143, -1.0951837301254272, -1.0028496980667114, -0.9105156660079956, -0.8181816935539246, -0.7258476614952087, -0.6335136294364929, -0.5411796569824219, -0.44884562492370605, -0.35651159286499023, -0.2641775608062744, -0.17184355854988098, -0.07950955629348755, 0.012824475765228271, 0.10515850782394409, 0.19749248027801514, 0.28982651233673096, 0.3821605443954468, 0.4744945764541626, 0.5668286085128784, 0.6591625809669495, 0.7514966130256653, 0.8438306450843811, 0.9361646175384521, 1.028498649597168, 1.1208326816558838, 1.2131667137145996, 1.3055007457733154, 1.3978347778320312, 1.490168809890747, 1.582502841949463, 1.6748367547988892, 1.767170786857605, 1.8595048189163208, 1.9518388509750366, 2.044172763824463, 2.1365067958831787, 2.2288408279418945, 2.3211748600006104, 2.413508892059326, 2.505842924118042, 2.598176956176758]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 13.0, 9.0, 16.0, 10.0, 8.0, 12.0, 15.0, 28.0, 32.0, 13.0, 41.0, 50.0, 43.0, 62.0, 85.0, 176.0, 299.0, 772.0, 3283.0, 34103.0, 4096432.0, 52742.0, 4391.0, 973.0, 308.0, 166.0, 65.0, 41.0, 27.0, 16.0, 13.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.177734375, -3.095306396484375, -3.01287841796875, -2.930450439453125, -2.8480224609375, -2.765594482421875, -2.68316650390625, -2.600738525390625, -2.518310546875, -2.435882568359375, -2.35345458984375, -2.271026611328125, -2.1885986328125, -2.106170654296875, -2.02374267578125, -1.941314697265625, -1.85888671875, -1.776458740234375, -1.69403076171875, -1.611602783203125, -1.5291748046875, -1.446746826171875, -1.36431884765625, -1.281890869140625, -1.199462890625, -1.117034912109375, -1.03460693359375, -0.952178955078125, -0.8697509765625, -0.787322998046875, -0.70489501953125, -0.622467041015625, -0.5400390625, -0.457611083984375, -0.37518310546875, -0.292755126953125, -0.2103271484375, -0.127899169921875, -0.04547119140625, 0.036956787109375, 0.119384765625, 0.201812744140625, 0.28424072265625, 0.366668701171875, 0.4490966796875, 0.531524658203125, 0.61395263671875, 0.696380615234375, 0.77880859375, 0.861236572265625, 0.94366455078125, 1.026092529296875, 1.1085205078125, 1.190948486328125, 1.27337646484375, 1.355804443359375, 1.438232421875, 1.520660400390625, 1.60308837890625, 1.685516357421875, 1.7679443359375, 1.850372314453125, 1.93280029296875, 2.015228271484375, 2.09765625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 9.0, 12.0, 33.0, 61.0, 89.0, 132.0, 175.0, 199.0, 125.0, 77.0, 46.0, 26.0, 10.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.266357421875, -0.26067066192626953, -0.25498390197753906, -0.2492971420288086, -0.24361038208007812, -0.23792362213134766, -0.2322368621826172, -0.22655010223388672, -0.22086334228515625, -0.21517658233642578, -0.2094898223876953, -0.20380306243896484, -0.19811630249023438, -0.1924295425415039, -0.18674278259277344, -0.18105602264404297, -0.1753692626953125, -0.16968250274658203, -0.16399574279785156, -0.1583089828491211, -0.15262222290039062, -0.14693546295166016, -0.1412487030029297, -0.13556194305419922, -0.12987518310546875, -0.12418842315673828, -0.11850166320800781, -0.11281490325927734, -0.10712814331054688, -0.1014413833618164, -0.09575462341308594, -0.09006786346435547, -0.084381103515625, -0.07869434356689453, -0.07300758361816406, -0.0673208236694336, -0.061634063720703125, -0.055947303771972656, -0.05026054382324219, -0.04457378387451172, -0.03888702392578125, -0.03320026397705078, -0.027513504028320312, -0.021826744079589844, -0.016139984130859375, -0.010453224182128906, -0.0047664642333984375, 0.0009202957153320312, 0.0066070556640625, 0.012293815612792969, 0.017980575561523438, 0.023667335510253906, 0.029354095458984375, 0.035040855407714844, 0.04072761535644531, 0.04641437530517578, 0.05210113525390625, 0.05778789520263672, 0.06347465515136719, 0.06916141510009766, 0.07484817504882812, 0.0805349349975586, 0.08622169494628906, 0.09190845489501953, 0.09759521484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 4.0, 10.0, 7.0, 7.0, 13.0, 8.0, 18.0, 13.0, 11.0, 27.0, 24.0, 34.0, 29.0, 31.0, 37.0, 56.0, 79.0, 109.0, 198.0, 299.0, 927.0, 10919.0, 4112000.0, 66101.0, 2218.0, 468.0, 190.0, 113.0, 74.0, 46.0, 30.0, 28.0, 20.0, 21.0, 19.0, 16.0, 10.0, 12.0, 9.0, 9.0, 9.0, 4.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.375, -4.2451171875, -4.115234375, -3.9853515625, -3.85546875, -3.7255859375, -3.595703125, -3.4658203125, -3.3359375, -3.2060546875, -3.076171875, -2.9462890625, -2.81640625, -2.6865234375, -2.556640625, -2.4267578125, -2.296875, -2.1669921875, -2.037109375, -1.9072265625, -1.77734375, -1.6474609375, -1.517578125, -1.3876953125, -1.2578125, -1.1279296875, -0.998046875, -0.8681640625, -0.73828125, -0.6083984375, -0.478515625, -0.3486328125, -0.21875, -0.0888671875, 0.041015625, 0.1708984375, 0.30078125, 0.4306640625, 0.560546875, 0.6904296875, 0.8203125, 0.9501953125, 1.080078125, 1.2099609375, 1.33984375, 1.4697265625, 1.599609375, 1.7294921875, 1.859375, 1.9892578125, 2.119140625, 2.2490234375, 2.37890625, 2.5087890625, 2.638671875, 2.7685546875, 2.8984375, 3.0283203125, 3.158203125, 3.2880859375, 3.41796875, 3.5478515625, 3.677734375, 3.8076171875, 3.9375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 24.0, 94.0, 595.0, 2933.0, 298.0, 85.0, 27.0, 11.0, 7.0, 6.0, 1.0, 2.0], "bins": [-1.3115234375, -1.2878150939941406, -1.2641067504882812, -1.2403984069824219, -1.2166900634765625, -1.1929817199707031, -1.1692733764648438, -1.1455650329589844, -1.121856689453125, -1.0981483459472656, -1.0744400024414062, -1.0507316589355469, -1.0270233154296875, -1.0033149719238281, -0.9796066284179688, -0.9558982849121094, -0.93218994140625, -0.9084815979003906, -0.8847732543945312, -0.8610649108886719, -0.8373565673828125, -0.8136482238769531, -0.7899398803710938, -0.7662315368652344, -0.742523193359375, -0.7188148498535156, -0.6951065063476562, -0.6713981628417969, -0.6476898193359375, -0.6239814758300781, -0.6002731323242188, -0.5765647888183594, -0.5528564453125, -0.5291481018066406, -0.5054397583007812, -0.4817314147949219, -0.4580230712890625, -0.4343147277832031, -0.41060638427734375, -0.3868980407714844, -0.363189697265625, -0.3394813537597656, -0.31577301025390625, -0.2920646667480469, -0.2683563232421875, -0.24464797973632812, -0.22093963623046875, -0.19723129272460938, -0.17352294921875, -0.14981460571289062, -0.12610626220703125, -0.10239791870117188, -0.0786895751953125, -0.054981231689453125, -0.03127288818359375, -0.007564544677734375, 0.016143798828125, 0.039852142333984375, 0.06356048583984375, 0.08726882934570312, 0.1109771728515625, 0.13468551635742188, 0.15839385986328125, 0.18210220336914062, 0.205810546875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 41.0, 788.0, 162.0, 12.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.56743049621582, -9.027774810791016, -8.488119125366211, -7.94846248626709, -7.408806800842285, -6.8691511154174805, -6.329494953155518, -5.789838790893555, -5.25018310546875, -4.710527420043945, -4.170871257781982, -3.6312153339385986, -3.091559410095215, -2.551903486251831, -2.0122475624084473, -1.4725916385650635, -0.9329357147216797, -0.3932797908782959, 0.1463761329650879, 0.6860320568084717, 1.2256879806518555, 1.7653439044952393, 2.304999828338623, 2.844655752182007, 3.3843116760253906, 3.9239675998687744, 4.463623523712158, 5.003279685974121, 5.542935371398926, 6.0825910568237305, 6.622247219085693, 7.161903381347656, 7.701560974121094, 8.241216659545898, 8.780872344970703, 9.320528984069824, 9.860184669494629, 10.399840354919434, 10.939496994018555, 11.47915267944336, 12.018808364868164, 12.558464050292969, 13.098119735717773, 13.637776374816895, 14.1774320602417, 14.717087745666504, 15.256744384765625, 15.79640007019043, 16.336055755615234, 16.87571144104004, 17.415367126464844, 17.95502281188965, 18.494678497314453, 19.03433609008789, 19.573991775512695, 20.1136474609375, 20.653303146362305, 21.19295883178711, 21.732614517211914, 22.27227020263672, 22.811927795410156, 23.35158348083496, 23.891239166259766, 24.43089485168457, 24.970550537109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 7.0, 11.0, 25.0, 30.0, 48.0, 85.0, 121.0, 119.0, 130.0, 105.0, 113.0, 80.0, 54.0, 37.0, 21.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1875815391540527, -3.0876879692077637, -2.9877943992614746, -2.8879008293151855, -2.7880072593688965, -2.6881136894226074, -2.5882201194763184, -2.4883265495300293, -2.3884329795837402, -2.288539409637451, -2.188645839691162, -2.088752269744873, -1.988858699798584, -1.888965129852295, -1.7890715599060059, -1.6891779899597168, -1.5892845392227173, -1.4893909692764282, -1.3894973993301392, -1.28960382938385, -1.189710259437561, -1.089816689491272, -0.9899231791496277, -0.8900296092033386, -0.7901360392570496, -0.6902424693107605, -0.5903488993644714, -0.49045535922050476, -0.3905617892742157, -0.29066821932792664, -0.19077467918395996, -0.0908811092376709, 0.009012460708618164, 0.10890602320432663, 0.2087995857000351, 0.30869314074516296, 0.408586710691452, 0.5084803104400635, 0.6083738207817078, 0.7082673907279968, 0.8081609606742859, 0.908054530620575, 1.0079480409622192, 1.1078416109085083, 1.2077351808547974, 1.3076287508010864, 1.4075223207473755, 1.5074158906936646, 1.6073094606399536, 1.7072030305862427, 1.8070966005325317, 1.9069901704788208, 2.0068836212158203, 2.1067771911621094, 2.2066707611083984, 2.3065643310546875, 2.4064579010009766, 2.5063514709472656, 2.6062450408935547, 2.7061386108398438, 2.806032180786133, 2.905925750732422, 3.005819320678711, 3.105712890625, 3.205606460571289]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 10.0, 14.0, 22.0, 19.0, 25.0, 33.0, 51.0, 50.0, 99.0, 310.0, 1166.0, 8578.0, 355019.0, 668276.0, 12803.0, 1397.0, 333.0, 121.0, 60.0, 45.0, 40.0, 16.0, 18.0, 18.0, 5.0, 8.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.937225341796875, -2.85101318359375, -2.764801025390625, -2.6785888671875, -2.592376708984375, -2.50616455078125, -2.419952392578125, -2.333740234375, -2.247528076171875, -2.16131591796875, -2.075103759765625, -1.9888916015625, -1.902679443359375, -1.81646728515625, -1.730255126953125, -1.64404296875, -1.557830810546875, -1.47161865234375, -1.385406494140625, -1.2991943359375, -1.212982177734375, -1.12677001953125, -1.040557861328125, -0.954345703125, -0.868133544921875, -0.78192138671875, -0.695709228515625, -0.6094970703125, -0.523284912109375, -0.43707275390625, -0.350860595703125, -0.2646484375, -0.178436279296875, -0.09222412109375, -0.006011962890625, 0.0802001953125, 0.166412353515625, 0.25262451171875, 0.338836669921875, 0.425048828125, 0.511260986328125, 0.59747314453125, 0.683685302734375, 0.7698974609375, 0.856109619140625, 0.94232177734375, 1.028533935546875, 1.11474609375, 1.200958251953125, 1.28717041015625, 1.373382568359375, 1.4595947265625, 1.545806884765625, 1.63201904296875, 1.718231201171875, 1.804443359375, 1.890655517578125, 1.97686767578125, 2.063079833984375, 2.1492919921875, 2.235504150390625, 2.32171630859375, 2.407928466796875, 2.494140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 11.0, 19.0, 37.0, 77.0, 123.0, 160.0, 195.0, 155.0, 84.0, 69.0, 38.0, 16.0, 15.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.3994140625, -0.39132118225097656, -0.3832283020019531, -0.3751354217529297, -0.36704254150390625, -0.3589496612548828, -0.3508567810058594, -0.34276390075683594, -0.3346710205078125, -0.32657814025878906, -0.3184852600097656, -0.3103923797607422, -0.30229949951171875, -0.2942066192626953, -0.2861137390136719, -0.27802085876464844, -0.269927978515625, -0.26183509826660156, -0.2537422180175781, -0.2456493377685547, -0.23755645751953125, -0.2294635772705078, -0.22137069702148438, -0.21327781677246094, -0.2051849365234375, -0.19709205627441406, -0.18899917602539062, -0.1809062957763672, -0.17281341552734375, -0.1647205352783203, -0.15662765502929688, -0.14853477478027344, -0.14044189453125, -0.13234901428222656, -0.12425613403320312, -0.11616325378417969, -0.10807037353515625, -0.09997749328613281, -0.09188461303710938, -0.08379173278808594, -0.0756988525390625, -0.06760597229003906, -0.059513092041015625, -0.05142021179199219, -0.04332733154296875, -0.03523445129394531, -0.027141571044921875, -0.019048690795898438, -0.010955810546875, -0.0028629302978515625, 0.005229949951171875, 0.013322830200195312, 0.02141571044921875, 0.029508590698242188, 0.037601470947265625, 0.04569435119628906, 0.0537872314453125, 0.06188011169433594, 0.06997299194335938, 0.07806587219238281, 0.08615875244140625, 0.09425163269042969, 0.10234451293945312, 0.11043739318847656, 0.1185302734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 10.0, 10.0, 12.0, 13.0, 30.0, 42.0, 42.0, 79.0, 89.0, 145.0, 195.0, 391.0, 677.0, 1262.0, 2447.0, 5535.0, 14266.0, 41198.0, 142844.0, 465026.0, 266369.0, 70055.0, 22394.0, 8285.0, 3408.0, 1501.0, 847.0, 481.0, 255.0, 193.0, 133.0, 84.0, 76.0, 47.0, 30.0, 23.0, 16.0, 11.0, 7.0, 5.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6298828125, -0.6106338500976562, -0.5913848876953125, -0.5721359252929688, -0.552886962890625, -0.5336380004882812, -0.5143890380859375, -0.49514007568359375, -0.47589111328125, -0.45664215087890625, -0.4373931884765625, -0.41814422607421875, -0.398895263671875, -0.37964630126953125, -0.3603973388671875, -0.34114837646484375, -0.3218994140625, -0.30265045166015625, -0.2834014892578125, -0.26415252685546875, -0.244903564453125, -0.22565460205078125, -0.2064056396484375, -0.18715667724609375, -0.16790771484375, -0.14865875244140625, -0.1294097900390625, -0.11016082763671875, -0.090911865234375, -0.07166290283203125, -0.0524139404296875, -0.03316497802734375, -0.013916015625, 0.00533294677734375, 0.0245819091796875, 0.04383087158203125, 0.063079833984375, 0.08232879638671875, 0.1015777587890625, 0.12082672119140625, 0.14007568359375, 0.15932464599609375, 0.1785736083984375, 0.19782257080078125, 0.217071533203125, 0.23632049560546875, 0.2555694580078125, 0.27481842041015625, 0.2940673828125, 0.31331634521484375, 0.3325653076171875, 0.35181427001953125, 0.371063232421875, 0.39031219482421875, 0.4095611572265625, 0.42881011962890625, 0.44805908203125, 0.46730804443359375, 0.4865570068359375, 0.5058059692382812, 0.525054931640625, 0.5443038940429688, 0.5635528564453125, 0.5828018188476562, 0.60205078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 7.0, 2.0, 8.0, 5.0, 8.0, 16.0, 13.0, 11.0, 24.0, 23.0, 42.0, 19.0, 35.0, 36.0, 40.0, 55.0, 50.0, 47.0, 51.0, 54.0, 44.0, 48.0, 34.0, 41.0, 42.0, 30.0, 39.0, 26.0, 28.0, 24.0, 23.0, 16.0, 13.0, 15.0, 5.0, 11.0, 6.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.4886436462402344, -0.47435760498046875, -0.4600715637207031, -0.4457855224609375, -0.4314994812011719, -0.41721343994140625, -0.4029273986816406, -0.388641357421875, -0.3743553161621094, -0.36006927490234375, -0.3457832336425781, -0.3314971923828125, -0.3172111511230469, -0.30292510986328125, -0.2886390686035156, -0.27435302734375, -0.2600669860839844, -0.24578094482421875, -0.23149490356445312, -0.2172088623046875, -0.20292282104492188, -0.18863677978515625, -0.17435073852539062, -0.160064697265625, -0.14577865600585938, -0.13149261474609375, -0.11720657348632812, -0.1029205322265625, -0.08863449096679688, -0.07434844970703125, -0.060062408447265625, -0.0457763671875, -0.031490325927734375, -0.01720428466796875, -0.002918243408203125, 0.0113677978515625, 0.025653839111328125, 0.03993988037109375, 0.054225921630859375, 0.068511962890625, 0.08279800415039062, 0.09708404541015625, 0.11137008666992188, 0.1256561279296875, 0.13994216918945312, 0.15422821044921875, 0.16851425170898438, 0.18280029296875, 0.19708633422851562, 0.21137237548828125, 0.22565841674804688, 0.2399444580078125, 0.2542304992675781, 0.26851654052734375, 0.2828025817871094, 0.297088623046875, 0.3113746643066406, 0.32566070556640625, 0.3399467468261719, 0.3542327880859375, 0.3685188293457031, 0.38280487060546875, 0.3970909118652344, 0.411376953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 13.0, 8.0, 11.0, 24.0, 32.0, 60.0, 79.0, 143.0, 278.0, 577.0, 1268.0, 3097.0, 9703.0, 61933.0, 879486.0, 75487.0, 10412.0, 3312.0, 1305.0, 608.0, 284.0, 156.0, 85.0, 62.0, 24.0, 23.0, 20.0, 20.0, 11.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0458984375, -1.0104827880859375, -0.975067138671875, -0.9396514892578125, -0.90423583984375, -0.8688201904296875, -0.833404541015625, -0.7979888916015625, -0.7625732421875, -0.7271575927734375, -0.691741943359375, -0.6563262939453125, -0.62091064453125, -0.5854949951171875, -0.550079345703125, -0.5146636962890625, -0.479248046875, -0.4438323974609375, -0.408416748046875, -0.3730010986328125, -0.33758544921875, -0.3021697998046875, -0.266754150390625, -0.2313385009765625, -0.1959228515625, -0.1605072021484375, -0.125091552734375, -0.0896759033203125, -0.05426025390625, -0.0188446044921875, 0.016571044921875, 0.0519866943359375, 0.08740234375, 0.1228179931640625, 0.158233642578125, 0.1936492919921875, 0.22906494140625, 0.2644805908203125, 0.299896240234375, 0.3353118896484375, 0.3707275390625, 0.4061431884765625, 0.441558837890625, 0.4769744873046875, 0.51239013671875, 0.5478057861328125, 0.583221435546875, 0.6186370849609375, 0.654052734375, 0.6894683837890625, 0.724884033203125, 0.7602996826171875, 0.79571533203125, 0.8311309814453125, 0.866546630859375, 0.9019622802734375, 0.9373779296875, 0.9727935791015625, 1.008209228515625, 1.0436248779296875, 1.07904052734375, 1.1144561767578125, 1.149871826171875, 1.1852874755859375, 1.220703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 7.0, 18.0, 35.0, 45.0, 112.0, 208.0, 221.0, 160.0, 82.0, 49.0, 17.0, 12.0, 13.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020051002502441406, -0.00019514933228492737, -0.00018978863954544067, -0.00018442794680595398, -0.00017906725406646729, -0.0001737065613269806, -0.0001683458685874939, -0.0001629851758480072, -0.0001576244831085205, -0.0001522637903690338, -0.00014690309762954712, -0.00014154240489006042, -0.00013618171215057373, -0.00013082101941108704, -0.00012546032667160034, -0.00012009963393211365, -0.00011473894119262695, -0.00010937824845314026, -0.00010401755571365356, -9.865686297416687e-05, -9.329617023468018e-05, -8.793547749519348e-05, -8.257478475570679e-05, -7.721409201622009e-05, -7.18533992767334e-05, -6.64927065372467e-05, -6.113201379776001e-05, -5.5771321058273315e-05, -5.041062831878662e-05, -4.504993557929993e-05, -3.968924283981323e-05, -3.432855010032654e-05, -2.8967857360839844e-05, -2.360716462135315e-05, -1.8246471881866455e-05, -1.288577914237976e-05, -7.525086402893066e-06, -2.164393663406372e-06, 3.1962990760803223e-06, 8.556991815567017e-06, 1.3917684555053711e-05, 1.9278377294540405e-05, 2.46390700340271e-05, 2.9999762773513794e-05, 3.536045551300049e-05, 4.072114825248718e-05, 4.608184099197388e-05, 5.144253373146057e-05, 5.6803226470947266e-05, 6.216391921043396e-05, 6.752461194992065e-05, 7.288530468940735e-05, 7.824599742889404e-05, 8.360669016838074e-05, 8.896738290786743e-05, 9.432807564735413e-05, 9.968876838684082e-05, 0.00010504946112632751, 0.00011041015386581421, 0.0001157708466053009, 0.0001211315393447876, 0.0001264922320842743, 0.00013185292482376099, 0.00013721361756324768, 0.00014257431030273438]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 12.0, 21.0, 33.0, 38.0, 57.0, 90.0, 168.0, 218.0, 493.0, 843.0, 1708.0, 3633.0, 9871.0, 39291.0, 461478.0, 473434.0, 39772.0, 9754.0, 3737.0, 1754.0, 913.0, 490.0, 267.0, 163.0, 102.0, 57.0, 39.0, 30.0, 18.0, 16.0, 10.0, 8.0, 8.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.974609375, -0.948272705078125, -0.92193603515625, -0.895599365234375, -0.8692626953125, -0.842926025390625, -0.81658935546875, -0.790252685546875, -0.763916015625, -0.737579345703125, -0.71124267578125, -0.684906005859375, -0.6585693359375, -0.632232666015625, -0.60589599609375, -0.579559326171875, -0.55322265625, -0.526885986328125, -0.50054931640625, -0.474212646484375, -0.4478759765625, -0.421539306640625, -0.39520263671875, -0.368865966796875, -0.342529296875, -0.316192626953125, -0.28985595703125, -0.263519287109375, -0.2371826171875, -0.210845947265625, -0.18450927734375, -0.158172607421875, -0.1318359375, -0.105499267578125, -0.07916259765625, -0.052825927734375, -0.0264892578125, -0.000152587890625, 0.02618408203125, 0.052520751953125, 0.078857421875, 0.105194091796875, 0.13153076171875, 0.157867431640625, 0.1842041015625, 0.210540771484375, 0.23687744140625, 0.263214111328125, 0.28955078125, 0.315887451171875, 0.34222412109375, 0.368560791015625, 0.3948974609375, 0.421234130859375, 0.44757080078125, 0.473907470703125, 0.500244140625, 0.526580810546875, 0.55291748046875, 0.579254150390625, 0.6055908203125, 0.631927490234375, 0.65826416015625, 0.684600830078125, 0.7109375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 3.0, 5.0, 6.0, 10.0, 6.0, 17.0, 24.0, 39.0, 61.0, 52.0, 74.0, 84.0, 108.0, 103.0, 88.0, 73.0, 55.0, 54.0, 28.0, 29.0, 19.0, 9.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.316162109375, -0.3053016662597656, -0.29444122314453125, -0.2835807800292969, -0.2727203369140625, -0.2618598937988281, -0.25099945068359375, -0.24013900756835938, -0.229278564453125, -0.21841812133789062, -0.20755767822265625, -0.19669723510742188, -0.1858367919921875, -0.17497634887695312, -0.16411590576171875, -0.15325546264648438, -0.14239501953125, -0.13153457641601562, -0.12067413330078125, -0.10981369018554688, -0.0989532470703125, -0.08809280395507812, -0.07723236083984375, -0.06637191772460938, -0.055511474609375, -0.044651031494140625, -0.03379058837890625, -0.022930145263671875, -0.0120697021484375, -0.001209259033203125, 0.00965118408203125, 0.020511627197265625, 0.0313720703125, 0.042232513427734375, 0.05309295654296875, 0.06395339965820312, 0.0748138427734375, 0.08567428588867188, 0.09653472900390625, 0.10739517211914062, 0.118255615234375, 0.12911605834960938, 0.13997650146484375, 0.15083694458007812, 0.1616973876953125, 0.17255783081054688, 0.18341827392578125, 0.19427871704101562, 0.20513916015625, 0.21599960327148438, 0.22686004638671875, 0.23772048950195312, 0.2485809326171875, 0.2594413757324219, 0.27030181884765625, 0.2811622619628906, 0.292022705078125, 0.3028831481933594, 0.31374359130859375, 0.3246040344238281, 0.3354644775390625, 0.3463249206542969, 0.35718536376953125, 0.3680458068847656, 0.37890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 11.0, 7.0, 24.0, 37.0, 84.0, 191.0, 234.0, 177.0, 108.0, 52.0, 29.0, 14.0, 14.0, 6.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.231497764587402, -7.038308143615723, -6.845118045806885, -6.651928424835205, -6.458738803863525, -6.2655487060546875, -6.072359085083008, -5.879169464111328, -5.68597936630249, -5.4927897453308105, -5.299599647521973, -5.106410026550293, -4.913220405578613, -4.720030307769775, -4.526840686798096, -4.333650588989258, -4.140460968017578, -3.9472711086273193, -3.7540814876556396, -3.560891628265381, -3.367701768875122, -3.1745119094848633, -2.9813222885131836, -2.788132429122925, -2.594943046569824, -2.4017531871795654, -2.2085635662078857, -2.015373706817627, -1.8221838474273682, -1.628994107246399, -1.4358043670654297, -1.242614507675171, -1.049424648284912, -0.8562348484992981, -0.6630450487136841, -0.46985530853271484, -0.27666550874710083, -0.08347570896148682, 0.10971403121948242, 0.3029038906097412, 0.49609363079071045, 0.6892834305763245, 0.8824732303619385, 1.0756629705429077, 1.268852710723877, 1.4620425701141357, 1.655232310295105, 1.8484221696853638, 2.041611909866333, 2.234801769256592, 2.4279913902282715, 2.6211812496185303, 2.814371109008789, 3.0075607299804688, 3.2007505893707275, 3.3939404487609863, 3.587130069732666, 3.780319929122925, 3.9735095500946045, 4.166699409484863, 4.359889030456543, 4.553079128265381, 4.7462687492370605, 4.939458847045898, 5.132648468017578]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 13.0, 9.0, 10.0, 14.0, 20.0, 16.0, 39.0, 42.0, 30.0, 41.0, 49.0, 63.0, 50.0, 46.0, 56.0, 54.0, 42.0, 44.0, 41.0, 45.0, 44.0, 24.0, 36.0, 30.0, 27.0, 25.0, 13.0, 9.0, 9.0, 18.0, 12.0, 7.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.9997143745422363, -3.894901752471924, -3.7900888919830322, -3.6852762699127197, -3.5804636478424072, -3.4756507873535156, -3.370838165283203, -3.2660255432128906, -3.161212921142578, -3.0564002990722656, -2.951587438583374, -2.8467748165130615, -2.741962194442749, -2.6371493339538574, -2.532336711883545, -2.4275240898132324, -2.32271146774292, -2.2178988456726074, -2.113085985183716, -2.0082733631134033, -1.9034607410430908, -1.7986479997634888, -1.6938352584838867, -1.5890226364135742, -1.4842097759246826, -1.3793970346450806, -1.274584412574768, -1.169771671295166, -1.0649590492248535, -0.9601463079452515, -0.8553336262702942, -0.7505209445953369, -0.6457083225250244, -0.5408956408500671, -0.43608295917510986, -0.3312702476978302, -0.22645756602287292, -0.12164485454559326, -0.016832172870635986, 0.08798050880432129, 0.19279319047927856, 0.29760587215423584, 0.4024185538291931, 0.5072312355041504, 0.6120439767837524, 0.7168566584587097, 0.821669340133667, 0.9264820218086243, 1.0312947034835815, 1.1361074447631836, 1.240920066833496, 1.3457328081130981, 1.4505454301834106, 1.5553581714630127, 1.6601707935333252, 1.7649835348129272, 1.8697962760925293, 1.9746090173721313, 2.0794217586517334, 2.184234380722046, 2.2890470027923584, 2.39385986328125, 2.4986724853515625, 2.603485107421875, 2.7082977294921875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 8.0, 2.0, 6.0, 7.0, 2.0, 6.0, 8.0, 9.0, 3.0, 6.0, 17.0, 9.0, 10.0, 11.0, 14.0, 26.0, 22.0, 28.0, 29.0, 46.0, 53.0, 86.0, 93.0, 141.0, 312.0, 524.0, 1119.0, 3005.0, 9602.0, 51533.0, 3799528.0, 295582.0, 23896.0, 5595.0, 1765.0, 648.0, 266.0, 141.0, 60.0, 31.0, 16.0, 9.0, 4.0, 3.0, 3.0], "bins": [-3.408203125, -3.3397369384765625, -3.271270751953125, -3.2028045654296875, -3.13433837890625, -3.0658721923828125, -2.997406005859375, -2.9289398193359375, -2.8604736328125, -2.7920074462890625, -2.723541259765625, -2.6550750732421875, -2.58660888671875, -2.5181427001953125, -2.449676513671875, -2.3812103271484375, -2.312744140625, -2.2442779541015625, -2.175811767578125, -2.1073455810546875, -2.03887939453125, -1.9704132080078125, -1.901947021484375, -1.8334808349609375, -1.7650146484375, -1.6965484619140625, -1.628082275390625, -1.5596160888671875, -1.49114990234375, -1.4226837158203125, -1.354217529296875, -1.2857513427734375, -1.21728515625, -1.1488189697265625, -1.080352783203125, -1.0118865966796875, -0.94342041015625, -0.8749542236328125, -0.806488037109375, -0.7380218505859375, -0.6695556640625, -0.6010894775390625, -0.532623291015625, -0.4641571044921875, -0.39569091796875, -0.3272247314453125, -0.258758544921875, -0.1902923583984375, -0.121826171875, -0.0533599853515625, 0.015106201171875, 0.0835723876953125, 0.15203857421875, 0.2205047607421875, 0.288970947265625, 0.3574371337890625, 0.4259033203125, 0.4943695068359375, 0.562835693359375, 0.6313018798828125, 0.69976806640625, 0.7682342529296875, 0.836700439453125, 0.9051666259765625, 0.9736328125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 10.0, 22.0, 37.0, 57.0, 102.0, 127.0, 154.0, 125.0, 123.0, 104.0, 60.0, 36.0, 18.0, 12.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.391357421875, -0.3835258483886719, -0.37569427490234375, -0.3678627014160156, -0.3600311279296875, -0.3521995544433594, -0.34436798095703125, -0.3365364074707031, -0.328704833984375, -0.3208732604980469, -0.31304168701171875, -0.3052101135253906, -0.2973785400390625, -0.2895469665527344, -0.28171539306640625, -0.2738838195800781, -0.26605224609375, -0.2582206726074219, -0.25038909912109375, -0.24255752563476562, -0.2347259521484375, -0.22689437866210938, -0.21906280517578125, -0.21123123168945312, -0.203399658203125, -0.19556808471679688, -0.18773651123046875, -0.17990493774414062, -0.1720733642578125, -0.16424179077148438, -0.15641021728515625, -0.14857864379882812, -0.1407470703125, -0.13291549682617188, -0.12508392333984375, -0.11725234985351562, -0.1094207763671875, -0.10158920288085938, -0.09375762939453125, -0.08592605590820312, -0.078094482421875, -0.07026290893554688, -0.06243133544921875, -0.054599761962890625, -0.0467681884765625, -0.038936614990234375, -0.03110504150390625, -0.023273468017578125, -0.01544189453125, -0.007610321044921875, 0.00022125244140625, 0.008052825927734375, 0.0158843994140625, 0.023715972900390625, 0.03154754638671875, 0.039379119873046875, 0.047210693359375, 0.055042266845703125, 0.06287384033203125, 0.07070541381835938, 0.0785369873046875, 0.08636856079101562, 0.09420013427734375, 0.10203170776367188, 0.10986328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 10.0, 13.0, 23.0, 25.0, 46.0, 54.0, 90.0, 133.0, 173.0, 243.0, 422.0, 752.0, 1589.0, 4762.0, 25408.0, 667425.0, 3442101.0, 41114.0, 6367.0, 1683.0, 725.0, 421.0, 215.0, 154.0, 94.0, 55.0, 56.0, 48.0, 22.0, 17.0, 13.0, 10.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.7834625244140625, -1.712432861328125, -1.6414031982421875, -1.57037353515625, -1.4993438720703125, -1.428314208984375, -1.3572845458984375, -1.2862548828125, -1.2152252197265625, -1.144195556640625, -1.0731658935546875, -1.00213623046875, -0.9311065673828125, -0.860076904296875, -0.7890472412109375, -0.718017578125, -0.6469879150390625, -0.575958251953125, -0.5049285888671875, -0.43389892578125, -0.3628692626953125, -0.291839599609375, -0.2208099365234375, -0.1497802734375, -0.0787506103515625, -0.007720947265625, 0.0633087158203125, 0.13433837890625, 0.2053680419921875, 0.276397705078125, 0.3474273681640625, 0.41845703125, 0.4894866943359375, 0.560516357421875, 0.6315460205078125, 0.70257568359375, 0.7736053466796875, 0.844635009765625, 0.9156646728515625, 0.9866943359375, 1.0577239990234375, 1.128753662109375, 1.1997833251953125, 1.27081298828125, 1.3418426513671875, 1.412872314453125, 1.4839019775390625, 1.554931640625, 1.6259613037109375, 1.696990966796875, 1.7680206298828125, 1.83905029296875, 1.9100799560546875, 1.981109619140625, 2.0521392822265625, 2.1231689453125, 2.1941986083984375, 2.265228271484375, 2.3362579345703125, 2.40728759765625, 2.4783172607421875, 2.549346923828125, 2.6203765869140625, 2.69140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 14.0, 31.0, 48.0, 80.0, 157.0, 318.0, 1355.0, 1387.0, 341.0, 128.0, 61.0, 44.0, 36.0, 18.0, 15.0, 10.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.4935188293457031, -0.48117828369140625, -0.4688377380371094, -0.4564971923828125, -0.4441566467285156, -0.43181610107421875, -0.4194755554199219, -0.407135009765625, -0.3947944641113281, -0.38245391845703125, -0.3701133728027344, -0.3577728271484375, -0.3454322814941406, -0.33309173583984375, -0.3207511901855469, -0.30841064453125, -0.2960700988769531, -0.28372955322265625, -0.2713890075683594, -0.2590484619140625, -0.24670791625976562, -0.23436737060546875, -0.22202682495117188, -0.209686279296875, -0.19734573364257812, -0.18500518798828125, -0.17266464233398438, -0.1603240966796875, -0.14798355102539062, -0.13564300537109375, -0.12330245971679688, -0.1109619140625, -0.09862136840820312, -0.08628082275390625, -0.07394027709960938, -0.0615997314453125, -0.049259185791015625, -0.03691864013671875, -0.024578094482421875, -0.012237548828125, 0.000102996826171875, 0.01244354248046875, 0.024784088134765625, 0.0371246337890625, 0.049465179443359375, 0.06180572509765625, 0.07414627075195312, 0.08648681640625, 0.09882736206054688, 0.11116790771484375, 0.12350845336914062, 0.1358489990234375, 0.14818954467773438, 0.16053009033203125, 0.17287063598632812, 0.185211181640625, 0.19755172729492188, 0.20989227294921875, 0.22223281860351562, 0.2345733642578125, 0.24691390991210938, 0.25925445556640625, 0.2715950012207031, 0.283935546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 7.0, 10.0, 12.0, 28.0, 66.0, 171.0, 290.0, 245.0, 101.0, 43.0, 17.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7197020053863525, -3.5946264266967773, -3.4695510864257812, -3.344475507736206, -3.219399929046631, -3.0943245887756348, -2.9692490100860596, -2.8441734313964844, -2.7190980911254883, -2.594022512435913, -2.468947172164917, -2.343871593475342, -2.2187960147857666, -2.0937204360961914, -1.9686450958251953, -1.8435695171356201, -1.718493938446045, -1.5934184789657593, -1.468342900276184, -1.3432674407958984, -1.2181918621063232, -1.0931164026260376, -0.968040943145752, -0.8429654240608215, -0.7178899049758911, -0.5928143858909607, -0.46773889660835266, -0.34266340732574463, -0.2175878882408142, -0.09251236915588379, 0.032563090324401855, 0.15763860940933228, 0.2827138900756836, 0.407789409160614, 0.5328649282455444, 0.6579403877258301, 0.7830159068107605, 0.9080914258956909, 1.0331668853759766, 1.1582424640655518, 1.2833179235458374, 1.408393383026123, 1.5334689617156982, 1.6585444211959839, 1.7836198806762695, 1.9086954593658447, 2.03377103805542, 2.158846378326416, 2.283921957015991, 2.4089975357055664, 2.5340728759765625, 2.6591484546661377, 2.784224033355713, 2.909299373626709, 3.034374952316284, 3.1594505310058594, 3.2845258712768555, 3.4096014499664307, 3.5346767902374268, 3.659752368927002, 3.784827947616577, 3.9099035263061523, 4.034978866577148, 4.1600542068481445, 4.285130023956299]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 11.0, 15.0, 23.0, 42.0, 58.0, 80.0, 89.0, 85.0, 88.0, 106.0, 88.0, 71.0, 64.0, 58.0, 43.0, 24.0, 22.0, 12.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2537894248962402, -2.189366102218628, -2.1249430179595947, -2.0605196952819824, -1.9960963726043701, -1.9316731691360474, -1.8672499656677246, -1.8028266429901123, -1.7384034395217896, -1.6739802360534668, -1.6095569133758545, -1.5451337099075317, -1.480710506439209, -1.4162871837615967, -1.351863980293274, -1.2874407768249512, -1.2230174541473389, -1.1585942506790161, -1.0941709280014038, -1.029747724533081, -0.9653244614601135, -0.900901198387146, -0.8364779949188232, -0.7720547318458557, -0.7076314687728882, -0.6432082056999207, -0.5787849426269531, -0.5143617391586304, -0.44993847608566284, -0.3855152130126953, -0.32109197974205017, -0.25666874647140503, -0.1922457218170166, -0.12782247364521027, -0.06339922547340393, 0.0010240226984024048, 0.06544727087020874, 0.12987053394317627, 0.1942937672138214, 0.25871700048446655, 0.3231402635574341, 0.3875635266304016, 0.45198675990104675, 0.5164099931716919, 0.5808332562446594, 0.645256519317627, 0.7096797227859497, 0.7741029858589172, 0.8385262489318848, 0.9029495120048523, 0.9673727750778198, 1.0317959785461426, 1.0962193012237549, 1.1606425046920776, 1.2250657081604004, 1.2894890308380127, 1.3539122343063354, 1.4183354377746582, 1.4827587604522705, 1.5471819639205933, 1.611605167388916, 1.6760284900665283, 1.740451693534851, 1.8048748970031738, 1.8692982196807861]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 5.0, 6.0, 15.0, 12.0, 30.0, 35.0, 42.0, 66.0, 102.0, 166.0, 350.0, 846.0, 2815.0, 14088.0, 167482.0, 783526.0, 67942.0, 7856.0, 1807.0, 610.0, 263.0, 154.0, 88.0, 47.0, 58.0, 29.0, 25.0, 23.0, 13.0, 9.0, 6.0, 7.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6875, -1.6318817138671875, -1.576263427734375, -1.5206451416015625, -1.46502685546875, -1.4094085693359375, -1.353790283203125, -1.2981719970703125, -1.2425537109375, -1.1869354248046875, -1.131317138671875, -1.0756988525390625, -1.02008056640625, -0.9644622802734375, -0.908843994140625, -0.8532257080078125, -0.797607421875, -0.7419891357421875, -0.686370849609375, -0.6307525634765625, -0.57513427734375, -0.5195159912109375, -0.463897705078125, -0.4082794189453125, -0.3526611328125, -0.2970428466796875, -0.241424560546875, -0.1858062744140625, -0.13018798828125, -0.0745697021484375, -0.018951416015625, 0.0366668701171875, 0.09228515625, 0.1479034423828125, 0.203521728515625, 0.2591400146484375, 0.31475830078125, 0.3703765869140625, 0.425994873046875, 0.4816131591796875, 0.5372314453125, 0.5928497314453125, 0.648468017578125, 0.7040863037109375, 0.75970458984375, 0.8153228759765625, 0.870941162109375, 0.9265594482421875, 0.982177734375, 1.0377960205078125, 1.093414306640625, 1.1490325927734375, 1.20465087890625, 1.2602691650390625, 1.315887451171875, 1.3715057373046875, 1.4271240234375, 1.4827423095703125, 1.538360595703125, 1.5939788818359375, 1.64959716796875, 1.7052154541015625, 1.760833740234375, 1.8164520263671875, 1.8720703125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 21.0, 33.0, 58.0, 80.0, 109.0, 154.0, 133.0, 123.0, 114.0, 77.0, 45.0, 28.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.41300010681152344, -0.4038810729980469, -0.3947620391845703, -0.38564300537109375, -0.3765239715576172, -0.3674049377441406, -0.35828590393066406, -0.3491668701171875, -0.34004783630371094, -0.3309288024902344, -0.3218097686767578, -0.31269073486328125, -0.3035717010498047, -0.2944526672363281, -0.28533363342285156, -0.276214599609375, -0.26709556579589844, -0.2579765319824219, -0.2488574981689453, -0.23973846435546875, -0.2306194305419922, -0.22150039672851562, -0.21238136291503906, -0.2032623291015625, -0.19414329528808594, -0.18502426147460938, -0.1759052276611328, -0.16678619384765625, -0.1576671600341797, -0.14854812622070312, -0.13942909240722656, -0.13031005859375, -0.12119102478027344, -0.11207199096679688, -0.10295295715332031, -0.09383392333984375, -0.08471488952636719, -0.07559585571289062, -0.06647682189941406, -0.0573577880859375, -0.04823875427246094, -0.039119720458984375, -0.030000686645507812, -0.02088165283203125, -0.011762619018554688, -0.002643585205078125, 0.0064754486083984375, 0.015594482421875, 0.024713516235351562, 0.033832550048828125, 0.04295158386230469, 0.05207061767578125, 0.06118965148925781, 0.07030868530273438, 0.07942771911621094, 0.0885467529296875, 0.09766578674316406, 0.10678482055664062, 0.11590385437011719, 0.12502288818359375, 0.1341419219970703, 0.14326095581054688, 0.15237998962402344, 0.1614990234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 3.0, 14.0, 11.0, 31.0, 26.0, 33.0, 54.0, 93.0, 119.0, 223.0, 383.0, 687.0, 1306.0, 2809.0, 6630.0, 18638.0, 63160.0, 282790.0, 496197.0, 124273.0, 32291.0, 10512.0, 4152.0, 1897.0, 901.0, 502.0, 282.0, 174.0, 113.0, 69.0, 53.0, 36.0, 24.0, 17.0, 10.0, 15.0, 6.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76123046875, -0.736053466796875, -0.71087646484375, -0.685699462890625, -0.6605224609375, -0.635345458984375, -0.61016845703125, -0.584991455078125, -0.559814453125, -0.534637451171875, -0.50946044921875, -0.484283447265625, -0.4591064453125, -0.433929443359375, -0.40875244140625, -0.383575439453125, -0.3583984375, -0.333221435546875, -0.30804443359375, -0.282867431640625, -0.2576904296875, -0.232513427734375, -0.20733642578125, -0.182159423828125, -0.156982421875, -0.131805419921875, -0.10662841796875, -0.081451416015625, -0.0562744140625, -0.031097412109375, -0.00592041015625, 0.019256591796875, 0.04443359375, 0.069610595703125, 0.09478759765625, 0.119964599609375, 0.1451416015625, 0.170318603515625, 0.19549560546875, 0.220672607421875, 0.245849609375, 0.271026611328125, 0.29620361328125, 0.321380615234375, 0.3465576171875, 0.371734619140625, 0.39691162109375, 0.422088623046875, 0.447265625, 0.472442626953125, 0.49761962890625, 0.522796630859375, 0.5479736328125, 0.573150634765625, 0.59832763671875, 0.623504638671875, 0.648681640625, 0.673858642578125, 0.69903564453125, 0.724212646484375, 0.7493896484375, 0.774566650390625, 0.79974365234375, 0.824920654296875, 0.85009765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 4.0, 7.0, 11.0, 11.0, 13.0, 19.0, 20.0, 21.0, 23.0, 34.0, 49.0, 43.0, 40.0, 52.0, 44.0, 52.0, 36.0, 53.0, 42.0, 47.0, 39.0, 49.0, 34.0, 29.0, 32.0, 25.0, 27.0, 33.0, 17.0, 11.0, 20.0, 10.0, 12.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5576171875, -0.5404129028320312, -0.5232086181640625, -0.5060043334960938, -0.488800048828125, -0.47159576416015625, -0.4543914794921875, -0.43718719482421875, -0.41998291015625, -0.40277862548828125, -0.3855743408203125, -0.36837005615234375, -0.351165771484375, -0.33396148681640625, -0.3167572021484375, -0.29955291748046875, -0.2823486328125, -0.26514434814453125, -0.2479400634765625, -0.23073577880859375, -0.213531494140625, -0.19632720947265625, -0.1791229248046875, -0.16191864013671875, -0.14471435546875, -0.12751007080078125, -0.1103057861328125, -0.09310150146484375, -0.075897216796875, -0.05869293212890625, -0.0414886474609375, -0.02428436279296875, -0.007080078125, 0.01012420654296875, 0.0273284912109375, 0.04453277587890625, 0.061737060546875, 0.07894134521484375, 0.0961456298828125, 0.11334991455078125, 0.13055419921875, 0.14775848388671875, 0.1649627685546875, 0.18216705322265625, 0.199371337890625, 0.21657562255859375, 0.2337799072265625, 0.25098419189453125, 0.2681884765625, 0.28539276123046875, 0.3025970458984375, 0.31980133056640625, 0.337005615234375, 0.35420989990234375, 0.3714141845703125, 0.38861846923828125, 0.40582275390625, 0.42302703857421875, 0.4402313232421875, 0.45743560791015625, 0.474639892578125, 0.49184417724609375, 0.5090484619140625, 0.5262527465820312, 0.54345703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 15.0, 15.0, 20.0, 51.0, 84.0, 140.0, 262.0, 485.0, 1007.0, 2429.0, 8195.0, 67860.0, 872101.0, 81818.0, 9387.0, 2614.0, 996.0, 458.0, 215.0, 135.0, 77.0, 50.0, 32.0, 20.0, 23.0, 14.0, 8.0, 5.0, 10.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.95849609375, -0.9271011352539062, -0.8957061767578125, -0.8643112182617188, -0.832916259765625, -0.8015213012695312, -0.7701263427734375, -0.7387313842773438, -0.70733642578125, -0.6759414672851562, -0.6445465087890625, -0.6131515502929688, -0.581756591796875, -0.5503616333007812, -0.5189666748046875, -0.48757171630859375, -0.4561767578125, -0.42478179931640625, -0.3933868408203125, -0.36199188232421875, -0.330596923828125, -0.29920196533203125, -0.2678070068359375, -0.23641204833984375, -0.20501708984375, -0.17362213134765625, -0.1422271728515625, -0.11083221435546875, -0.079437255859375, -0.04804229736328125, -0.0166473388671875, 0.01474761962890625, 0.046142578125, 0.07753753662109375, 0.1089324951171875, 0.14032745361328125, 0.171722412109375, 0.20311737060546875, 0.2345123291015625, 0.26590728759765625, 0.29730224609375, 0.32869720458984375, 0.3600921630859375, 0.39148712158203125, 0.422882080078125, 0.45427703857421875, 0.4856719970703125, 0.5170669555664062, 0.5484619140625, 0.5798568725585938, 0.6112518310546875, 0.6426467895507812, 0.674041748046875, 0.7054367065429688, 0.7368316650390625, 0.7682266235351562, 0.79962158203125, 0.8310165405273438, 0.8624114990234375, 0.8938064575195312, 0.925201416015625, 0.9565963745117188, 0.9879913330078125, 1.0193862915039062, 1.05078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 6.0, 9.0, 11.0, 16.0, 15.0, 27.0, 38.0, 76.0, 125.0, 201.0, 186.0, 111.0, 73.0, 32.0, 21.0, 11.0, 9.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016689300537109375, -0.00016224384307861328, -0.0001575946807861328, -0.00015294551849365234, -0.00014829635620117188, -0.0001436471939086914, -0.00013899803161621094, -0.00013434886932373047, -0.00012969970703125, -0.00012505054473876953, -0.00012040138244628906, -0.0001157522201538086, -0.00011110305786132812, -0.00010645389556884766, -0.00010180473327636719, -9.715557098388672e-05, -9.250640869140625e-05, -8.785724639892578e-05, -8.320808410644531e-05, -7.855892181396484e-05, -7.390975952148438e-05, -6.92605972290039e-05, -6.461143493652344e-05, -5.996227264404297e-05, -5.53131103515625e-05, -5.066394805908203e-05, -4.601478576660156e-05, -4.1365623474121094e-05, -3.6716461181640625e-05, -3.2067298889160156e-05, -2.7418136596679688e-05, -2.276897430419922e-05, -1.811981201171875e-05, -1.3470649719238281e-05, -8.821487426757812e-06, -4.172325134277344e-06, 4.76837158203125e-07, 5.125999450683594e-06, 9.775161743164062e-06, 1.4424324035644531e-05, 1.9073486328125e-05, 2.372264862060547e-05, 2.8371810913085938e-05, 3.3020973205566406e-05, 3.7670135498046875e-05, 4.2319297790527344e-05, 4.696846008300781e-05, 5.161762237548828e-05, 5.626678466796875e-05, 6.091594696044922e-05, 6.556510925292969e-05, 7.021427154541016e-05, 7.486343383789062e-05, 7.95125961303711e-05, 8.416175842285156e-05, 8.881092071533203e-05, 9.34600830078125e-05, 9.810924530029297e-05, 0.00010275840759277344, 0.0001074075698852539, 0.00011205673217773438, 0.00011670589447021484, 0.00012135505676269531, 0.00012600421905517578, 0.00013065338134765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 26.0, 30.0, 48.0, 61.0, 117.0, 196.0, 297.0, 638.0, 1168.0, 2605.0, 7464.0, 57696.0, 904222.0, 61162.0, 7619.0, 2639.0, 1193.0, 542.0, 322.0, 172.0, 108.0, 62.0, 45.0, 24.0, 14.0, 20.0, 6.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2158203125, -1.1731719970703125, -1.130523681640625, -1.0878753662109375, -1.04522705078125, -1.0025787353515625, -0.959930419921875, -0.9172821044921875, -0.8746337890625, -0.8319854736328125, -0.789337158203125, -0.7466888427734375, -0.70404052734375, -0.6613922119140625, -0.618743896484375, -0.5760955810546875, -0.533447265625, -0.4907989501953125, -0.448150634765625, -0.4055023193359375, -0.36285400390625, -0.3202056884765625, -0.277557373046875, -0.2349090576171875, -0.1922607421875, -0.1496124267578125, -0.106964111328125, -0.0643157958984375, -0.02166748046875, 0.0209808349609375, 0.063629150390625, 0.1062774658203125, 0.14892578125, 0.1915740966796875, 0.234222412109375, 0.2768707275390625, 0.31951904296875, 0.3621673583984375, 0.404815673828125, 0.4474639892578125, 0.4901123046875, 0.5327606201171875, 0.575408935546875, 0.6180572509765625, 0.66070556640625, 0.7033538818359375, 0.746002197265625, 0.7886505126953125, 0.831298828125, 0.8739471435546875, 0.916595458984375, 0.9592437744140625, 1.00189208984375, 1.0445404052734375, 1.087188720703125, 1.1298370361328125, 1.1724853515625, 1.2151336669921875, 1.257781982421875, 1.3004302978515625, 1.34307861328125, 1.3857269287109375, 1.428375244140625, 1.4710235595703125, 1.513671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 13.0, 20.0, 27.0, 53.0, 92.0, 176.0, 194.0, 153.0, 95.0, 66.0, 40.0, 18.0, 14.0, 5.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.740234375, -0.7210884094238281, -0.7019424438476562, -0.6827964782714844, -0.6636505126953125, -0.6445045471191406, -0.6253585815429688, -0.6062126159667969, -0.587066650390625, -0.5679206848144531, -0.5487747192382812, -0.5296287536621094, -0.5104827880859375, -0.4913368225097656, -0.47219085693359375, -0.4530448913574219, -0.43389892578125, -0.4147529602050781, -0.39560699462890625, -0.3764610290527344, -0.3573150634765625, -0.3381690979003906, -0.31902313232421875, -0.2998771667480469, -0.280731201171875, -0.2615852355957031, -0.24243927001953125, -0.22329330444335938, -0.2041473388671875, -0.18500137329101562, -0.16585540771484375, -0.14670944213867188, -0.1275634765625, -0.10841751098632812, -0.08927154541015625, -0.07012557983398438, -0.0509796142578125, -0.031833648681640625, -0.01268768310546875, 0.006458282470703125, 0.025604248046875, 0.044750213623046875, 0.06389617919921875, 0.08304214477539062, 0.1021881103515625, 0.12133407592773438, 0.14048004150390625, 0.15962600708007812, 0.17877197265625, 0.19791793823242188, 0.21706390380859375, 0.23620986938476562, 0.2553558349609375, 0.2745018005371094, 0.29364776611328125, 0.3127937316894531, 0.331939697265625, 0.3510856628417969, 0.37023162841796875, 0.3893775939941406, 0.4085235595703125, 0.4276695251464844, 0.44681549072265625, 0.4659614562988281, 0.485107421875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 9.0, 44.0, 119.0, 286.0, 321.0, 129.0, 48.0, 17.0, 10.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.310275554656982, -4.956239700317383, -4.602204322814941, -4.2481689453125, -3.8941330909729004, -3.54009747505188, -3.1860618591308594, -2.832026243209839, -2.4779906272888184, -2.123955011367798, -1.7699193954467773, -1.4158837795257568, -1.0618481636047363, -0.7078125476837158, -0.3537769317626953, 0.0002586841583251953, 0.3542943000793457, 0.7083299160003662, 1.0623655319213867, 1.4164011478424072, 1.7704367637634277, 2.1244723796844482, 2.4785079956054688, 2.8325436115264893, 3.1865792274475098, 3.5406148433685303, 3.894650459289551, 4.248685836791992, 4.602721691131592, 4.956757545471191, 5.310792922973633, 5.664828300476074, 6.018863677978516, 6.372899055480957, 6.726934909820557, 7.080970764160156, 7.435006141662598, 7.789041519165039, 8.143077850341797, 8.497113227844238, 8.85114860534668, 9.205183982849121, 9.559219360351562, 9.91325569152832, 10.267291069030762, 10.621326446533203, 10.975362777709961, 11.329398155212402, 11.683433532714844, 12.037468910217285, 12.391504287719727, 12.745540618896484, 13.099575996398926, 13.453611373901367, 13.807647705078125, 14.161683082580566, 14.515718460083008, 14.86975383758545, 15.22378921508789, 15.577825546264648, 15.93186092376709, 16.28589630126953, 16.63993263244629, 16.993967056274414, 17.348003387451172]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 7.0, 5.0, 3.0, 8.0, 9.0, 15.0, 14.0, 21.0, 20.0, 30.0, 34.0, 35.0, 45.0, 50.0, 41.0, 40.0, 53.0, 64.0, 37.0, 49.0, 56.0, 56.0, 45.0, 55.0, 40.0, 24.0, 28.0, 17.0, 24.0, 10.0, 11.0, 9.0, 9.0, 12.0, 2.0, 7.0, 5.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.445357322692871, -3.3283238410949707, -3.2112903594970703, -3.094256639480591, -2.9772231578826904, -2.86018967628479, -2.7431559562683105, -2.62612247467041, -2.5090889930725098, -2.3920555114746094, -2.275022029876709, -2.1579883098602295, -2.040954828262329, -1.9239213466644287, -1.8068877458572388, -1.6898541450500488, -1.5728206634521484, -1.455787181854248, -1.338753581047058, -1.2217199802398682, -1.1046864986419678, -0.9876529574394226, -0.8706194162368774, -0.7535858750343323, -0.6365523338317871, -0.5195187926292419, -0.4024852514266968, -0.2854517102241516, -0.16841816902160645, -0.05138462781906128, 0.06564891338348389, 0.18268245458602905, 0.2997159957885742, 0.4167495369911194, 0.5337830781936646, 0.6508166193962097, 0.7678501605987549, 0.8848837018013, 1.0019172430038452, 1.1189508438110352, 1.2359843254089355, 1.353017807006836, 1.4700514078140259, 1.5870850086212158, 1.7041184902191162, 1.8211519718170166, 1.9381855726242065, 2.0552191734313965, 2.172252655029297, 2.2892861366271973, 2.4063196182250977, 2.523353338241577, 2.6403868198394775, 2.757420301437378, 2.8744540214538574, 2.991487503051758, 3.108520984649658, 3.2255544662475586, 3.342587947845459, 3.4596216678619385, 3.576655149459839, 3.6936886310577393, 3.8107223510742188, 3.927755832672119, 4.0447893142700195]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 5.0, 6.0, 3.0, 9.0, 11.0, 10.0, 15.0, 11.0, 14.0, 29.0, 20.0, 32.0, 56.0, 57.0, 108.0, 141.0, 170.0, 337.0, 848.0, 2155.0, 7698.0, 44170.0, 3970659.0, 147342.0, 14489.0, 3608.0, 1225.0, 496.0, 261.0, 121.0, 69.0, 37.0, 23.0, 14.0, 14.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.232666015625, -3.15869140625, -3.084716796875, -3.0107421875, -2.936767578125, -2.86279296875, -2.788818359375, -2.71484375, -2.640869140625, -2.56689453125, -2.492919921875, -2.4189453125, -2.344970703125, -2.27099609375, -2.197021484375, -2.123046875, -2.049072265625, -1.97509765625, -1.901123046875, -1.8271484375, -1.753173828125, -1.67919921875, -1.605224609375, -1.53125, -1.457275390625, -1.38330078125, -1.309326171875, -1.2353515625, -1.161376953125, -1.08740234375, -1.013427734375, -0.939453125, -0.865478515625, -0.79150390625, -0.717529296875, -0.6435546875, -0.569580078125, -0.49560546875, -0.421630859375, -0.34765625, -0.273681640625, -0.19970703125, -0.125732421875, -0.0517578125, 0.022216796875, 0.09619140625, 0.170166015625, 0.244140625, 0.318115234375, 0.39208984375, 0.466064453125, 0.5400390625, 0.614013671875, 0.68798828125, 0.761962890625, 0.8359375, 0.909912109375, 0.98388671875, 1.057861328125, 1.1318359375, 1.205810546875, 1.27978515625, 1.353759765625, 1.427734375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 20.0, 31.0, 60.0, 82.0, 126.0, 133.0, 152.0, 118.0, 117.0, 63.0, 37.0, 21.0, 17.0, 7.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.454345703125, -0.44472503662109375, -0.4351043701171875, -0.42548370361328125, -0.415863037109375, -0.40624237060546875, -0.3966217041015625, -0.38700103759765625, -0.37738037109375, -0.36775970458984375, -0.3581390380859375, -0.34851837158203125, -0.338897705078125, -0.32927703857421875, -0.3196563720703125, -0.31003570556640625, -0.3004150390625, -0.29079437255859375, -0.2811737060546875, -0.27155303955078125, -0.261932373046875, -0.25231170654296875, -0.2426910400390625, -0.23307037353515625, -0.22344970703125, -0.21382904052734375, -0.2042083740234375, -0.19458770751953125, -0.184967041015625, -0.17534637451171875, -0.1657257080078125, -0.15610504150390625, -0.146484375, -0.13686370849609375, -0.1272430419921875, -0.11762237548828125, -0.108001708984375, -0.09838104248046875, -0.0887603759765625, -0.07913970947265625, -0.06951904296875, -0.05989837646484375, -0.0502777099609375, -0.04065704345703125, -0.031036376953125, -0.02141571044921875, -0.0117950439453125, -0.00217437744140625, 0.0074462890625, 0.01706695556640625, 0.0266876220703125, 0.03630828857421875, 0.045928955078125, 0.05554962158203125, 0.0651702880859375, 0.07479095458984375, 0.08441162109375, 0.09403228759765625, 0.1036529541015625, 0.11327362060546875, 0.122894287109375, 0.13251495361328125, 0.1421356201171875, 0.15175628662109375, 0.161376953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 7.0, 19.0, 18.0, 29.0, 41.0, 69.0, 66.0, 115.0, 160.0, 274.0, 496.0, 942.0, 2405.0, 6932.0, 26970.0, 336917.0, 3738463.0, 61306.0, 12078.0, 3523.0, 1490.0, 704.0, 421.0, 266.0, 175.0, 126.0, 72.0, 57.0, 47.0, 20.0, 17.0, 15.0, 6.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.548828125, -2.482147216796875, -2.41546630859375, -2.348785400390625, -2.2821044921875, -2.215423583984375, -2.14874267578125, -2.082061767578125, -2.015380859375, -1.948699951171875, -1.88201904296875, -1.815338134765625, -1.7486572265625, -1.681976318359375, -1.61529541015625, -1.548614501953125, -1.48193359375, -1.415252685546875, -1.34857177734375, -1.281890869140625, -1.2152099609375, -1.148529052734375, -1.08184814453125, -1.015167236328125, -0.948486328125, -0.881805419921875, -0.81512451171875, -0.748443603515625, -0.6817626953125, -0.615081787109375, -0.54840087890625, -0.481719970703125, -0.4150390625, -0.348358154296875, -0.28167724609375, -0.214996337890625, -0.1483154296875, -0.081634521484375, -0.01495361328125, 0.051727294921875, 0.118408203125, 0.185089111328125, 0.25177001953125, 0.318450927734375, 0.3851318359375, 0.451812744140625, 0.51849365234375, 0.585174560546875, 0.65185546875, 0.718536376953125, 0.78521728515625, 0.851898193359375, 0.9185791015625, 0.985260009765625, 1.05194091796875, 1.118621826171875, 1.185302734375, 1.251983642578125, 1.31866455078125, 1.385345458984375, 1.4520263671875, 1.518707275390625, 1.58538818359375, 1.652069091796875, 1.71875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 6.0, 8.0, 12.0, 18.0, 39.0, 50.0, 90.0, 222.0, 865.0, 2026.0, 400.0, 127.0, 60.0, 47.0, 25.0, 16.0, 18.0, 11.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4677734375, -0.4532661437988281, -0.43875885009765625, -0.4242515563964844, -0.4097442626953125, -0.3952369689941406, -0.38072967529296875, -0.3662223815917969, -0.351715087890625, -0.3372077941894531, -0.32270050048828125, -0.3081932067871094, -0.2936859130859375, -0.2791786193847656, -0.26467132568359375, -0.2501640319824219, -0.23565673828125, -0.22114944458007812, -0.20664215087890625, -0.19213485717773438, -0.1776275634765625, -0.16312026977539062, -0.14861297607421875, -0.13410568237304688, -0.119598388671875, -0.10509109497070312, -0.09058380126953125, -0.07607650756835938, -0.0615692138671875, -0.047061920166015625, -0.03255462646484375, -0.018047332763671875, -0.0035400390625, 0.010967254638671875, 0.02547454833984375, 0.039981842041015625, 0.0544891357421875, 0.06899642944335938, 0.08350372314453125, 0.09801101684570312, 0.112518310546875, 0.12702560424804688, 0.14153289794921875, 0.15604019165039062, 0.1705474853515625, 0.18505477905273438, 0.19956207275390625, 0.21406936645507812, 0.22857666015625, 0.24308395385742188, 0.25759124755859375, 0.2720985412597656, 0.2866058349609375, 0.3011131286621094, 0.31562042236328125, 0.3301277160644531, 0.344635009765625, 0.3591423034667969, 0.37364959716796875, 0.3881568908691406, 0.4026641845703125, 0.4171714782714844, 0.43167877197265625, 0.4461860656738281, 0.460693359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 8.0, 15.0, 24.0, 31.0, 61.0, 84.0, 87.0, 126.0, 142.0, 125.0, 90.0, 67.0, 48.0, 34.0, 10.0, 15.0, 9.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994015455245972, -1.8349367380142212, -1.7704719305038452, -1.7060070037841797, -1.6415421962738037, -1.5770773887634277, -1.5126125812530518, -1.4481477737426758, -1.3836829662322998, -1.3192181587219238, -1.2547533512115479, -1.1902885437011719, -1.1258236169815063, -1.0613588094711304, -0.9968940019607544, -0.9324291944503784, -0.8679642677307129, -0.8034994602203369, -0.7390345931053162, -0.6745697855949402, -0.6101049184799194, -0.5456401109695435, -0.4811753034591675, -0.4167104661464691, -0.35224562883377075, -0.2877807915210724, -0.22331596910953522, -0.15885114669799805, -0.09438630938529968, -0.02992147207260132, 0.03454333543777466, 0.09900817275047302, 0.16347289085388184, 0.2279377281665802, 0.29240256547927856, 0.35686737298965454, 0.4213322103023529, 0.48579704761505127, 0.5502618551254272, 0.6147266626358032, 0.679191529750824, 0.7436563372612, 0.8081212043762207, 0.8725860118865967, 0.9370508193969727, 1.0015156269073486, 1.0659804344177246, 1.1304453611373901, 1.1949101686477661, 1.259374976158142, 1.323839783668518, 1.3883047103881836, 1.4527695178985596, 1.5172343254089355, 1.5816991329193115, 1.6461639404296875, 1.7106287479400635, 1.7750935554504395, 1.8395583629608154, 1.9040231704711914, 1.968488097190857, 2.0329527854919434, 2.0974178314208984, 2.1618826389312744, 2.2263474464416504]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 9.0, 4.0, 14.0, 27.0, 20.0, 27.0, 33.0, 21.0, 37.0, 29.0, 59.0, 46.0, 45.0, 54.0, 48.0, 49.0, 52.0, 53.0, 34.0, 40.0, 54.0, 36.0, 23.0, 35.0, 30.0, 27.0, 19.0, 13.0, 11.0, 10.0, 7.0, 7.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.325851559638977, -1.289284110069275, -1.2527167797088623, -1.2161493301391602, -1.1795819997787476, -1.1430145502090454, -1.1064472198486328, -1.0698797702789307, -1.0333123207092285, -0.9967449307441711, -0.9601775407791138, -0.9236101508140564, -0.887042760848999, -0.8504753112792969, -0.8139079213142395, -0.7773405313491821, -0.7407732009887695, -0.7042058110237122, -0.6676384210586548, -0.6310710310935974, -0.59450364112854, -0.5579361915588379, -0.5213688015937805, -0.48480141162872314, -0.44823402166366577, -0.4116666316986084, -0.375099241733551, -0.33853182196617126, -0.3019644320011139, -0.2653970420360565, -0.22882963716983795, -0.19226223230361938, -0.15569496154785156, -0.11912756413221359, -0.08256016671657562, -0.04599276930093765, -0.009425371885299683, 0.02714201807975769, 0.06370942294597626, 0.10027682781219482, 0.1368442177772522, 0.17341160774230957, 0.20997901260852814, 0.2465464174747467, 0.2831138074398041, 0.31968119740486145, 0.3562486171722412, 0.3928160071372986, 0.42938339710235596, 0.46595078706741333, 0.5025181770324707, 0.5390855669975281, 0.5756529569625854, 0.6122204065322876, 0.648787796497345, 0.6853551864624023, 0.7219225764274597, 0.7584899663925171, 0.7950573563575745, 0.8316247463226318, 0.868192195892334, 0.9047595262527466, 0.9413269758224487, 0.9778943657875061, 1.0144617557525635]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 7.0, 11.0, 12.0, 11.0, 16.0, 21.0, 27.0, 26.0, 56.0, 86.0, 111.0, 185.0, 371.0, 753.0, 2040.0, 6712.0, 30572.0, 236052.0, 662803.0, 87210.0, 15211.0, 3783.0, 1223.0, 502.0, 271.0, 138.0, 89.0, 51.0, 41.0, 33.0, 32.0, 8.0, 19.0, 13.0, 5.0, 8.0, 6.0, 5.0, 6.0, 2.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0], "bins": [-1.623046875, -1.57830810546875, -1.5335693359375, -1.48883056640625, -1.444091796875, -1.39935302734375, -1.3546142578125, -1.30987548828125, -1.26513671875, -1.22039794921875, -1.1756591796875, -1.13092041015625, -1.086181640625, -1.04144287109375, -0.9967041015625, -0.95196533203125, -0.9072265625, -0.86248779296875, -0.8177490234375, -0.77301025390625, -0.728271484375, -0.68353271484375, -0.6387939453125, -0.59405517578125, -0.54931640625, -0.50457763671875, -0.4598388671875, -0.41510009765625, -0.370361328125, -0.32562255859375, -0.2808837890625, -0.23614501953125, -0.19140625, -0.14666748046875, -0.1019287109375, -0.05718994140625, -0.012451171875, 0.03228759765625, 0.0770263671875, 0.12176513671875, 0.16650390625, 0.21124267578125, 0.2559814453125, 0.30072021484375, 0.345458984375, 0.39019775390625, 0.4349365234375, 0.47967529296875, 0.5244140625, 0.56915283203125, 0.6138916015625, 0.65863037109375, 0.703369140625, 0.74810791015625, 0.7928466796875, 0.83758544921875, 0.88232421875, 0.92706298828125, 0.9718017578125, 1.01654052734375, 1.061279296875, 1.10601806640625, 1.1507568359375, 1.19549560546875, 1.240234375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 16.0, 20.0, 42.0, 69.0, 90.0, 119.0, 147.0, 120.0, 118.0, 92.0, 50.0, 42.0, 32.0, 14.0, 12.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.463623046875, -0.45354461669921875, -0.4434661865234375, -0.43338775634765625, -0.423309326171875, -0.41323089599609375, -0.4031524658203125, -0.39307403564453125, -0.38299560546875, -0.37291717529296875, -0.3628387451171875, -0.35276031494140625, -0.342681884765625, -0.33260345458984375, -0.3225250244140625, -0.31244659423828125, -0.3023681640625, -0.29228973388671875, -0.2822113037109375, -0.27213287353515625, -0.262054443359375, -0.25197601318359375, -0.2418975830078125, -0.23181915283203125, -0.22174072265625, -0.21166229248046875, -0.2015838623046875, -0.19150543212890625, -0.181427001953125, -0.17134857177734375, -0.1612701416015625, -0.15119171142578125, -0.14111328125, -0.13103485107421875, -0.1209564208984375, -0.11087799072265625, -0.100799560546875, -0.09072113037109375, -0.0806427001953125, -0.07056427001953125, -0.06048583984375, -0.05040740966796875, -0.0403289794921875, -0.03025054931640625, -0.020172119140625, -0.01009368896484375, -1.52587890625e-05, 0.01006317138671875, 0.0201416015625, 0.03022003173828125, 0.0402984619140625, 0.05037689208984375, 0.060455322265625, 0.07053375244140625, 0.0806121826171875, 0.09069061279296875, 0.10076904296875, 0.11084747314453125, 0.1209259033203125, 0.13100433349609375, 0.141082763671875, 0.15116119384765625, 0.1612396240234375, 0.17131805419921875, 0.181396484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 5.0, 7.0, 11.0, 11.0, 23.0, 32.0, 52.0, 63.0, 96.0, 163.0, 312.0, 530.0, 963.0, 2073.0, 4773.0, 13472.0, 45806.0, 226686.0, 574669.0, 131366.0, 30521.0, 9683.0, 3648.0, 1675.0, 785.0, 446.0, 261.0, 145.0, 93.0, 53.0, 49.0, 27.0, 20.0, 9.0, 3.0, 10.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1025390625, -1.07220458984375, -1.0418701171875, -1.01153564453125, -0.981201171875, -0.95086669921875, -0.9205322265625, -0.89019775390625, -0.85986328125, -0.82952880859375, -0.7991943359375, -0.76885986328125, -0.738525390625, -0.70819091796875, -0.6778564453125, -0.64752197265625, -0.6171875, -0.58685302734375, -0.5565185546875, -0.52618408203125, -0.495849609375, -0.46551513671875, -0.4351806640625, -0.40484619140625, -0.37451171875, -0.34417724609375, -0.3138427734375, -0.28350830078125, -0.253173828125, -0.22283935546875, -0.1925048828125, -0.16217041015625, -0.1318359375, -0.10150146484375, -0.0711669921875, -0.04083251953125, -0.010498046875, 0.01983642578125, 0.0501708984375, 0.08050537109375, 0.11083984375, 0.14117431640625, 0.1715087890625, 0.20184326171875, 0.232177734375, 0.26251220703125, 0.2928466796875, 0.32318115234375, 0.353515625, 0.38385009765625, 0.4141845703125, 0.44451904296875, 0.474853515625, 0.50518798828125, 0.5355224609375, 0.56585693359375, 0.59619140625, 0.62652587890625, 0.6568603515625, 0.68719482421875, 0.717529296875, 0.74786376953125, 0.7781982421875, 0.80853271484375, 0.8388671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 9.0, 7.0, 14.0, 22.0, 26.0, 22.0, 35.0, 48.0, 51.0, 63.0, 80.0, 57.0, 75.0, 70.0, 60.0, 62.0, 60.0, 58.0, 39.0, 28.0, 35.0, 19.0, 15.0, 8.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1252517700195312, -1.0962066650390625, -1.0671615600585938, -1.038116455078125, -1.0090713500976562, -0.9800262451171875, -0.9509811401367188, -0.92193603515625, -0.8928909301757812, -0.8638458251953125, -0.8348007202148438, -0.805755615234375, -0.7767105102539062, -0.7476654052734375, -0.7186203002929688, -0.6895751953125, -0.6605300903320312, -0.6314849853515625, -0.6024398803710938, -0.573394775390625, -0.5443496704101562, -0.5153045654296875, -0.48625946044921875, -0.45721435546875, -0.42816925048828125, -0.3991241455078125, -0.37007904052734375, -0.341033935546875, -0.31198883056640625, -0.2829437255859375, -0.25389862060546875, -0.224853515625, -0.19580841064453125, -0.1667633056640625, -0.13771820068359375, -0.108673095703125, -0.07962799072265625, -0.0505828857421875, -0.02153778076171875, 0.00750732421875, 0.03655242919921875, 0.0655975341796875, 0.09464263916015625, 0.123687744140625, 0.15273284912109375, 0.1817779541015625, 0.21082305908203125, 0.2398681640625, 0.26891326904296875, 0.2979583740234375, 0.32700347900390625, 0.356048583984375, 0.38509368896484375, 0.4141387939453125, 0.44318389892578125, 0.47222900390625, 0.5012741088867188, 0.5303192138671875, 0.5593643188476562, 0.588409423828125, 0.6174545288085938, 0.6464996337890625, 0.6755447387695312, 0.70458984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 8.0, 10.0, 10.0, 12.0, 20.0, 26.0, 40.0, 60.0, 72.0, 121.0, 212.0, 352.0, 588.0, 1104.0, 2234.0, 5428.0, 17745.0, 105174.0, 696754.0, 180767.0, 25097.0, 6992.0, 2663.0, 1323.0, 668.0, 404.0, 230.0, 149.0, 99.0, 54.0, 34.0, 22.0, 20.0, 15.0, 9.0, 12.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64501953125, -0.6258316040039062, -0.6066436767578125, -0.5874557495117188, -0.568267822265625, -0.5490798950195312, -0.5298919677734375, -0.5107040405273438, -0.49151611328125, -0.47232818603515625, -0.4531402587890625, -0.43395233154296875, -0.414764404296875, -0.39557647705078125, -0.3763885498046875, -0.35720062255859375, -0.3380126953125, -0.31882476806640625, -0.2996368408203125, -0.28044891357421875, -0.261260986328125, -0.24207305908203125, -0.2228851318359375, -0.20369720458984375, -0.18450927734375, -0.16532135009765625, -0.1461334228515625, -0.12694549560546875, -0.107757568359375, -0.08856964111328125, -0.0693817138671875, -0.05019378662109375, -0.031005859375, -0.01181793212890625, 0.0073699951171875, 0.02655792236328125, 0.045745849609375, 0.06493377685546875, 0.0841217041015625, 0.10330963134765625, 0.12249755859375, 0.14168548583984375, 0.1608734130859375, 0.18006134033203125, 0.199249267578125, 0.21843719482421875, 0.2376251220703125, 0.25681304931640625, 0.2760009765625, 0.29518890380859375, 0.3143768310546875, 0.33356475830078125, 0.352752685546875, 0.37194061279296875, 0.3911285400390625, 0.41031646728515625, 0.42950439453125, 0.44869232177734375, 0.4678802490234375, 0.48706817626953125, 0.506256103515625, 0.5254440307617188, 0.5446319580078125, 0.5638198852539062, 0.5830078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 2.0, 7.0, 9.0, 22.0, 33.0, 54.0, 71.0, 141.0, 190.0, 159.0, 123.0, 68.0, 42.0, 24.0, 10.0, 14.0, 11.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00016057491302490234, -0.0001559574156999588, -0.00015133991837501526, -0.00014672242105007172, -0.00014210492372512817, -0.00013748742640018463, -0.0001328699290752411, -0.00012825243175029755, -0.000123634934425354, -0.00011901743710041046, -0.00011439993977546692, -0.00010978244245052338, -0.00010516494512557983, -0.00010054744780063629, -9.592995047569275e-05, -9.13124531507492e-05, -8.669495582580566e-05, -8.207745850086212e-05, -7.745996117591858e-05, -7.284246385097504e-05, -6.82249665260315e-05, -6.360746920108795e-05, -5.898997187614441e-05, -5.437247455120087e-05, -4.9754977226257324e-05, -4.513747990131378e-05, -4.051998257637024e-05, -3.59024852514267e-05, -3.1284987926483154e-05, -2.6667490601539612e-05, -2.204999327659607e-05, -1.7432495951652527e-05, -1.2814998626708984e-05, -8.197501301765442e-06, -3.5800039768218994e-06, 1.037493348121643e-06, 5.6549906730651855e-06, 1.0272487998008728e-05, 1.488998532295227e-05, 1.9507482647895813e-05, 2.4124979972839355e-05, 2.8742477297782898e-05, 3.335997462272644e-05, 3.797747194766998e-05, 4.2594969272613525e-05, 4.721246659755707e-05, 5.182996392250061e-05, 5.644746124744415e-05, 6.10649585723877e-05, 6.568245589733124e-05, 7.029995322227478e-05, 7.491745054721832e-05, 7.953494787216187e-05, 8.415244519710541e-05, 8.876994252204895e-05, 9.338743984699249e-05, 9.800493717193604e-05, 0.00010262243449687958, 0.00010723993182182312, 0.00011185742914676666, 0.0001164749264717102, 0.00012109242379665375, 0.0001257099211215973, 0.00013032741844654083, 0.00013494491577148438]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 8.0, 5.0, 17.0, 17.0, 17.0, 17.0, 42.0, 45.0, 68.0, 83.0, 146.0, 206.0, 332.0, 555.0, 1044.0, 1927.0, 4128.0, 10042.0, 31976.0, 197884.0, 649514.0, 112787.0, 22721.0, 7743.0, 3327.0, 1665.0, 865.0, 450.0, 309.0, 173.0, 128.0, 102.0, 64.0, 33.0, 33.0, 18.0, 15.0, 11.0, 11.0, 7.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.572265625, -0.5534210205078125, -0.534576416015625, -0.5157318115234375, -0.49688720703125, -0.4780426025390625, -0.459197998046875, -0.4403533935546875, -0.4215087890625, -0.4026641845703125, -0.383819580078125, -0.3649749755859375, -0.34613037109375, -0.3272857666015625, -0.308441162109375, -0.2895965576171875, -0.270751953125, -0.2519073486328125, -0.233062744140625, -0.2142181396484375, -0.19537353515625, -0.1765289306640625, -0.157684326171875, -0.1388397216796875, -0.1199951171875, -0.1011505126953125, -0.082305908203125, -0.0634613037109375, -0.04461669921875, -0.0257720947265625, -0.006927490234375, 0.0119171142578125, 0.03076171875, 0.0496063232421875, 0.068450927734375, 0.0872955322265625, 0.10614013671875, 0.1249847412109375, 0.143829345703125, 0.1626739501953125, 0.1815185546875, 0.2003631591796875, 0.219207763671875, 0.2380523681640625, 0.25689697265625, 0.2757415771484375, 0.294586181640625, 0.3134307861328125, 0.332275390625, 0.3511199951171875, 0.369964599609375, 0.3888092041015625, 0.40765380859375, 0.4264984130859375, 0.445343017578125, 0.4641876220703125, 0.4830322265625, 0.5018768310546875, 0.520721435546875, 0.5395660400390625, 0.55841064453125, 0.5772552490234375, 0.596099853515625, 0.6149444580078125, 0.6337890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 5.0, 6.0, 10.0, 13.0, 12.0, 24.0, 31.0, 54.0, 69.0, 103.0, 116.0, 121.0, 117.0, 83.0, 59.0, 41.0, 31.0, 28.0, 14.0, 18.0, 8.0, 5.0, 7.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.447265625, -0.4346122741699219, -0.42195892333984375, -0.4093055725097656, -0.3966522216796875, -0.3839988708496094, -0.37134552001953125, -0.3586921691894531, -0.346038818359375, -0.3333854675292969, -0.32073211669921875, -0.3080787658691406, -0.2954254150390625, -0.2827720642089844, -0.27011871337890625, -0.2574653625488281, -0.24481201171875, -0.23215866088867188, -0.21950531005859375, -0.20685195922851562, -0.1941986083984375, -0.18154525756835938, -0.16889190673828125, -0.15623855590820312, -0.143585205078125, -0.13093185424804688, -0.11827850341796875, -0.10562515258789062, -0.0929718017578125, -0.08031845092773438, -0.06766510009765625, -0.055011749267578125, -0.0423583984375, -0.029705047607421875, -0.01705169677734375, -0.004398345947265625, 0.0082550048828125, 0.020908355712890625, 0.03356170654296875, 0.046215057373046875, 0.058868408203125, 0.07152175903320312, 0.08417510986328125, 0.09682846069335938, 0.1094818115234375, 0.12213516235351562, 0.13478851318359375, 0.14744186401367188, 0.16009521484375, 0.17274856567382812, 0.18540191650390625, 0.19805526733398438, 0.2107086181640625, 0.22336196899414062, 0.23601531982421875, 0.24866867065429688, 0.261322021484375, 0.2739753723144531, 0.28662872314453125, 0.2992820739746094, 0.3119354248046875, 0.3245887756347656, 0.33724212646484375, 0.3498954772949219, 0.362548828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 20.0, 18.0, 25.0, 62.0, 114.0, 222.0, 245.0, 141.0, 60.0, 41.0, 22.0, 15.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.541660308837891, -4.260741233825684, -3.9798223972320557, -3.6989035606384277, -3.4179844856262207, -3.1370654106140137, -2.8561465740203857, -2.575227737426758, -2.294308662414551, -2.0133895874023438, -1.7324707508087158, -1.4515517950057983, -1.1706328392028809, -0.8897138833999634, -0.6087949275970459, -0.3278759717941284, -0.04695701599121094, 0.23396193981170654, 0.514880895614624, 0.7957998514175415, 1.076718807220459, 1.3576377630233765, 1.638556718826294, 1.9194756746292114, 2.200394630432129, 2.481313705444336, 2.762232542037964, 3.043151378631592, 3.324070453643799, 3.604989528656006, 3.885908365249634, 4.166827201843262, 4.447747230529785, 4.728666305541992, 5.009585380554199, 5.290503978729248, 5.571423053741455, 5.852342128753662, 6.133260726928711, 6.414179801940918, 6.695098876953125, 6.976017951965332, 7.256937026977539, 7.537855625152588, 7.818774700164795, 8.099693298339844, 8.38061237335205, 8.661531448364258, 8.942450523376465, 9.223369598388672, 9.504288673400879, 9.785207748413086, 10.066125869750977, 10.347044944763184, 10.62796401977539, 10.908883094787598, 11.189802169799805, 11.470721244812012, 11.751640319824219, 12.032559394836426, 12.313478469848633, 12.594396591186523, 12.87531566619873, 13.156234741210938, 13.437153816223145]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 7.0, 8.0, 16.0, 17.0, 10.0, 29.0, 34.0, 25.0, 36.0, 25.0, 37.0, 41.0, 63.0, 51.0, 80.0, 61.0, 68.0, 58.0, 59.0, 45.0, 36.0, 44.0, 33.0, 27.0, 19.0, 15.0, 14.0, 10.0, 7.0, 8.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.831258773803711, -5.677872180938721, -5.5244855880737305, -5.371099472045898, -5.217712879180908, -5.064326286315918, -4.910939693450928, -4.7575531005859375, -4.6041669845581055, -4.450780391693115, -4.297393798828125, -4.144007682800293, -3.9906210899353027, -3.8372344970703125, -3.6838479042053223, -3.530461311340332, -3.377074718475342, -3.2236881256103516, -3.0703017711639404, -2.91691517829895, -2.763528823852539, -2.610142230987549, -2.4567556381225586, -2.3033690452575684, -2.1499826908111572, -1.9965962171554565, -1.8432097434997559, -1.6898231506347656, -1.536436676979065, -1.3830502033233643, -1.229663610458374, -1.0762771368026733, -0.9228904247283936, -0.7695039510726929, -0.6161174178123474, -0.46273091435432434, -0.30934441089630127, -0.15595793724060059, -0.002571403980255127, 0.15081512928009033, 0.304201602935791, 0.4575881063938141, 0.6109746098518372, 0.7643611431121826, 0.9177476167678833, 1.071134090423584, 1.2245206832885742, 1.377907156944275, 1.5312936305999756, 1.6846801042556763, 1.838066577911377, 1.9914531707763672, 2.1448397636413574, 2.2982261180877686, 2.451612710952759, 2.60499906539917, 2.75838565826416, 2.9117722511291504, 3.0651586055755615, 3.2185451984405518, 3.371931552886963, 3.525318145751953, 3.6787047386169434, 3.8320913314819336, 3.9854776859283447]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 5.0, 6.0, 8.0, 14.0, 25.0, 21.0, 32.0, 38.0, 57.0, 80.0, 115.0, 209.0, 429.0, 1034.0, 3710.0, 19981.0, 1239259.0, 2899306.0, 23521.0, 4350.0, 1236.0, 461.0, 182.0, 88.0, 50.0, 24.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0], "bins": [-4.80078125, -4.702850341796875, -4.60491943359375, -4.506988525390625, -4.4090576171875, -4.311126708984375, -4.21319580078125, -4.115264892578125, -4.017333984375, -3.919403076171875, -3.82147216796875, -3.723541259765625, -3.6256103515625, -3.527679443359375, -3.42974853515625, -3.331817626953125, -3.23388671875, -3.135955810546875, -3.03802490234375, -2.940093994140625, -2.8421630859375, -2.744232177734375, -2.64630126953125, -2.548370361328125, -2.450439453125, -2.352508544921875, -2.25457763671875, -2.156646728515625, -2.0587158203125, -1.960784912109375, -1.86285400390625, -1.764923095703125, -1.6669921875, -1.569061279296875, -1.47113037109375, -1.373199462890625, -1.2752685546875, -1.177337646484375, -1.07940673828125, -0.981475830078125, -0.883544921875, -0.785614013671875, -0.68768310546875, -0.589752197265625, -0.4918212890625, -0.393890380859375, -0.29595947265625, -0.198028564453125, -0.10009765625, -0.002166748046875, 0.09576416015625, 0.193695068359375, 0.2916259765625, 0.389556884765625, 0.48748779296875, 0.585418701171875, 0.683349609375, 0.781280517578125, 0.87921142578125, 0.977142333984375, 1.0750732421875, 1.173004150390625, 1.27093505859375, 1.368865966796875, 1.466796875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 3.0, 9.0, 15.0, 26.0, 44.0, 64.0, 95.0, 103.0, 110.0, 131.0, 129.0, 85.0, 57.0, 47.0, 26.0, 19.0, 11.0, 13.0, 3.0, 6.0, 6.0, 2.0, 3.0, 1.0], "bins": [-0.47607421875, -0.46637916564941406, -0.4566841125488281, -0.4469890594482422, -0.43729400634765625, -0.4275989532470703, -0.4179039001464844, -0.40820884704589844, -0.3985137939453125, -0.38881874084472656, -0.3791236877441406, -0.3694286346435547, -0.35973358154296875, -0.3500385284423828, -0.3403434753417969, -0.33064842224121094, -0.320953369140625, -0.31125831604003906, -0.3015632629394531, -0.2918682098388672, -0.28217315673828125, -0.2724781036376953, -0.2627830505371094, -0.25308799743652344, -0.2433929443359375, -0.23369789123535156, -0.22400283813476562, -0.2143077850341797, -0.20461273193359375, -0.1949176788330078, -0.18522262573242188, -0.17552757263183594, -0.16583251953125, -0.15613746643066406, -0.14644241333007812, -0.1367473602294922, -0.12705230712890625, -0.11735725402832031, -0.10766220092773438, -0.09796714782714844, -0.0882720947265625, -0.07857704162597656, -0.06888198852539062, -0.05918693542480469, -0.04949188232421875, -0.03979682922363281, -0.030101776123046875, -0.020406723022460938, -0.010711669921875, -0.0010166168212890625, 0.008678436279296875, 0.018373489379882812, 0.02806854248046875, 0.03776359558105469, 0.047458648681640625, 0.05715370178222656, 0.0668487548828125, 0.07654380798339844, 0.08623886108398438, 0.09593391418457031, 0.10562896728515625, 0.11532402038574219, 0.12501907348632812, 0.13471412658691406, 0.1444091796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 10.0, 13.0, 13.0, 28.0, 40.0, 96.0, 149.0, 396.0, 1080.0, 4751.0, 79962.0, 4087992.0, 16522.0, 2119.0, 559.0, 229.0, 119.0, 75.0, 38.0, 39.0, 11.0, 15.0, 7.0, 11.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.03125, -8.8177490234375, -8.604248046875, -8.3907470703125, -8.17724609375, -7.9637451171875, -7.750244140625, -7.5367431640625, -7.3232421875, -7.1097412109375, -6.896240234375, -6.6827392578125, -6.46923828125, -6.2557373046875, -6.042236328125, -5.8287353515625, -5.615234375, -5.4017333984375, -5.188232421875, -4.9747314453125, -4.76123046875, -4.5477294921875, -4.334228515625, -4.1207275390625, -3.9072265625, -3.6937255859375, -3.480224609375, -3.2667236328125, -3.05322265625, -2.8397216796875, -2.626220703125, -2.4127197265625, -2.19921875, -1.9857177734375, -1.772216796875, -1.5587158203125, -1.34521484375, -1.1317138671875, -0.918212890625, -0.7047119140625, -0.4912109375, -0.2777099609375, -0.064208984375, 0.1492919921875, 0.36279296875, 0.5762939453125, 0.789794921875, 1.0032958984375, 1.216796875, 1.4302978515625, 1.643798828125, 1.8572998046875, 2.07080078125, 2.2843017578125, 2.497802734375, 2.7113037109375, 2.9248046875, 3.1383056640625, 3.351806640625, 3.5653076171875, 3.77880859375, 3.9923095703125, 4.205810546875, 4.4193115234375, 4.6328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 4.0, 4.0, 12.0, 18.0, 39.0, 58.0, 103.0, 275.0, 1692.0, 1343.0, 294.0, 100.0, 46.0, 26.0, 21.0, 11.0, 7.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9540023803710938, -0.9221649169921875, -0.8903274536132812, -0.858489990234375, -0.8266525268554688, -0.7948150634765625, -0.7629776000976562, -0.73114013671875, -0.6993026733398438, -0.6674652099609375, -0.6356277465820312, -0.603790283203125, -0.5719528198242188, -0.5401153564453125, -0.5082778930664062, -0.4764404296875, -0.44460296630859375, -0.4127655029296875, -0.38092803955078125, -0.349090576171875, -0.31725311279296875, -0.2854156494140625, -0.25357818603515625, -0.22174072265625, -0.18990325927734375, -0.1580657958984375, -0.12622833251953125, -0.094390869140625, -0.06255340576171875, -0.0307159423828125, 0.00112152099609375, 0.032958984375, 0.06479644775390625, 0.0966339111328125, 0.12847137451171875, 0.160308837890625, 0.19214630126953125, 0.2239837646484375, 0.25582122802734375, 0.28765869140625, 0.31949615478515625, 0.3513336181640625, 0.38317108154296875, 0.415008544921875, 0.44684600830078125, 0.4786834716796875, 0.5105209350585938, 0.5423583984375, 0.5741958618164062, 0.6060333251953125, 0.6378707885742188, 0.669708251953125, 0.7015457153320312, 0.7333831787109375, 0.7652206420898438, 0.79705810546875, 0.8288955688476562, 0.8607330322265625, 0.8925704956054688, 0.924407958984375, 0.9562454223632812, 0.9880828857421875, 1.0199203491210938, 1.0517578125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 21.0, 107.0, 653.0, 192.0, 26.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.709108352661133, -16.95880889892578, -16.208507537841797, -15.458208084106445, -14.707908630371094, -13.957608222961426, -13.207307815551758, -12.457008361816406, -11.706707954406738, -10.95640754699707, -10.206108093261719, -9.45580768585205, -8.705507278442383, -7.955207824707031, -7.204907417297363, -6.4546074867248535, -5.704307556152344, -4.954007625579834, -4.203707695007324, -3.4534072875976562, -2.7031073570251465, -1.9528074264526367, -1.2025070190429688, -0.452207088470459, 0.2980928421020508, 1.04839289188385, 1.7986929416656494, 2.5489931106567383, 3.299293041229248, 4.049592971801758, 4.799893379211426, 5.5501933097839355, 6.3004913330078125, 7.050791263580322, 7.801091194152832, 8.5513916015625, 9.301691055297852, 10.05199146270752, 10.802291870117188, 11.552591323852539, 12.302891731262207, 13.053192138671875, 13.803491592407227, 14.553791999816895, 15.304092407226562, 16.054391860961914, 16.804691314697266, 17.55499267578125, 18.3052921295166, 19.055591583251953, 19.805892944335938, 20.55619239807129, 21.30649185180664, 22.056793212890625, 22.807092666625977, 23.557392120361328, 24.307693481445312, 25.057992935180664, 25.80829429626465, 26.55859375, 27.30889320373535, 28.059192657470703, 28.809494018554688, 29.55979347229004, 30.31009292602539]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 10.0, 13.0, 15.0, 37.0, 54.0, 65.0, 78.0, 100.0, 107.0, 124.0, 117.0, 94.0, 57.0, 58.0, 35.0, 16.0, 12.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.502362251281738, -4.349108695983887, -4.195854663848877, -4.042601108551025, -3.889347553253174, -3.736093759536743, -3.5828399658203125, -3.429586410522461, -3.2763326168060303, -3.1230788230895996, -2.969825267791748, -2.8165714740753174, -2.6633176803588867, -2.510064125061035, -2.3568103313446045, -2.203556537628174, -2.0503029823303223, -1.8970493078231812, -1.74379563331604, -1.5905418395996094, -1.4372881650924683, -1.2840344905853271, -1.1307806968688965, -0.9775270223617554, -0.8242733478546143, -0.6710196733474731, -0.5177659392356873, -0.36451223492622375, -0.21125853061676025, -0.05800485610961914, 0.09524887800216675, 0.24850261211395264, 0.40175580978393555, 0.5550094842910767, 0.7082632184028625, 0.8615169525146484, 1.0147706270217896, 1.1680243015289307, 1.3212780952453613, 1.4745317697525024, 1.6277854442596436, 1.7810391187667847, 1.9342927932739258, 2.0875465869903564, 2.240800380706787, 2.3940539360046387, 2.5473077297210693, 2.7005615234375, 2.8538150787353516, 3.0070688724517822, 3.160322427749634, 3.3135762214660645, 3.466829776763916, 3.6200835704803467, 3.7733373641967773, 3.926590919494629, 4.0798444747924805, 4.233098030090332, 4.386352062225342, 4.539605617523193, 4.692859172821045, 4.846113204956055, 4.999366760253906, 5.152620315551758, 5.305874347686768]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 7.0, 7.0, 9.0, 9.0, 15.0, 22.0, 24.0, 37.0, 41.0, 67.0, 114.0, 164.0, 233.0, 409.0, 669.0, 1240.0, 2370.0, 5496.0, 15633.0, 62301.0, 423833.0, 443037.0, 65335.0, 16283.0, 5660.0, 2449.0, 1229.0, 660.0, 412.0, 236.0, 169.0, 99.0, 77.0, 51.0, 48.0, 28.0, 23.0, 12.0, 14.0, 9.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.283203125, -1.237396240234375, -1.19158935546875, -1.145782470703125, -1.0999755859375, -1.054168701171875, -1.00836181640625, -0.962554931640625, -0.916748046875, -0.870941162109375, -0.82513427734375, -0.779327392578125, -0.7335205078125, -0.687713623046875, -0.64190673828125, -0.596099853515625, -0.55029296875, -0.504486083984375, -0.45867919921875, -0.412872314453125, -0.3670654296875, -0.321258544921875, -0.27545166015625, -0.229644775390625, -0.183837890625, -0.138031005859375, -0.09222412109375, -0.046417236328125, -0.0006103515625, 0.045196533203125, 0.09100341796875, 0.136810302734375, 0.1826171875, 0.228424072265625, 0.27423095703125, 0.320037841796875, 0.3658447265625, 0.411651611328125, 0.45745849609375, 0.503265380859375, 0.549072265625, 0.594879150390625, 0.64068603515625, 0.686492919921875, 0.7322998046875, 0.778106689453125, 0.82391357421875, 0.869720458984375, 0.91552734375, 0.961334228515625, 1.00714111328125, 1.052947998046875, 1.0987548828125, 1.144561767578125, 1.19036865234375, 1.236175537109375, 1.281982421875, 1.327789306640625, 1.37359619140625, 1.419403076171875, 1.4652099609375, 1.511016845703125, 1.55682373046875, 1.602630615234375, 1.6484375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 9.0, 17.0, 33.0, 46.0, 56.0, 73.0, 116.0, 117.0, 111.0, 82.0, 105.0, 79.0, 44.0, 27.0, 25.0, 16.0, 13.0, 6.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30419921875, -0.294158935546875, -0.28411865234375, -0.274078369140625, -0.2640380859375, -0.253997802734375, -0.24395751953125, -0.233917236328125, -0.223876953125, -0.213836669921875, -0.20379638671875, -0.193756103515625, -0.1837158203125, -0.173675537109375, -0.16363525390625, -0.153594970703125, -0.1435546875, -0.133514404296875, -0.12347412109375, -0.113433837890625, -0.1033935546875, -0.093353271484375, -0.08331298828125, -0.073272705078125, -0.063232421875, -0.053192138671875, -0.04315185546875, -0.033111572265625, -0.0230712890625, -0.013031005859375, -0.00299072265625, 0.007049560546875, 0.01708984375, 0.027130126953125, 0.03717041015625, 0.047210693359375, 0.0572509765625, 0.067291259765625, 0.07733154296875, 0.087371826171875, 0.097412109375, 0.107452392578125, 0.11749267578125, 0.127532958984375, 0.1375732421875, 0.147613525390625, 0.15765380859375, 0.167694091796875, 0.177734375, 0.187774658203125, 0.19781494140625, 0.207855224609375, 0.2178955078125, 0.227935791015625, 0.23797607421875, 0.248016357421875, 0.258056640625, 0.268096923828125, 0.27813720703125, 0.288177490234375, 0.2982177734375, 0.308258056640625, 0.31829833984375, 0.328338623046875, 0.33837890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 15.0, 15.0, 20.0, 23.0, 41.0, 75.0, 114.0, 209.0, 308.0, 564.0, 1087.0, 2262.0, 5005.0, 11738.0, 30222.0, 90948.0, 322703.0, 400145.0, 119530.0, 37960.0, 14199.0, 5825.0, 2674.0, 1326.0, 644.0, 345.0, 196.0, 102.0, 77.0, 53.0, 41.0, 21.0, 20.0, 8.0, 9.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.79541015625, -0.7733840942382812, -0.7513580322265625, -0.7293319702148438, -0.707305908203125, -0.6852798461914062, -0.6632537841796875, -0.6412277221679688, -0.61920166015625, -0.5971755981445312, -0.5751495361328125, -0.5531234741210938, -0.531097412109375, -0.5090713500976562, -0.4870452880859375, -0.46501922607421875, -0.4429931640625, -0.42096710205078125, -0.3989410400390625, -0.37691497802734375, -0.354888916015625, -0.33286285400390625, -0.3108367919921875, -0.28881072998046875, -0.26678466796875, -0.24475860595703125, -0.2227325439453125, -0.20070648193359375, -0.178680419921875, -0.15665435791015625, -0.1346282958984375, -0.11260223388671875, -0.090576171875, -0.06855010986328125, -0.0465240478515625, -0.02449798583984375, -0.002471923828125, 0.01955413818359375, 0.0415802001953125, 0.06360626220703125, 0.08563232421875, 0.10765838623046875, 0.1296844482421875, 0.15171051025390625, 0.173736572265625, 0.19576263427734375, 0.2177886962890625, 0.23981475830078125, 0.2618408203125, 0.28386688232421875, 0.3058929443359375, 0.32791900634765625, 0.349945068359375, 0.37197113037109375, 0.3939971923828125, 0.41602325439453125, 0.43804931640625, 0.46007537841796875, 0.4821014404296875, 0.5041275024414062, 0.526153564453125, 0.5481796264648438, 0.5702056884765625, 0.5922317504882812, 0.6142578125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 8.0, 8.0, 10.0, 8.0, 15.0, 17.0, 17.0, 27.0, 26.0, 33.0, 32.0, 35.0, 48.0, 34.0, 53.0, 51.0, 44.0, 48.0, 50.0, 48.0, 53.0, 44.0, 38.0, 34.0, 28.0, 27.0, 37.0, 19.0, 21.0, 20.0, 16.0, 10.0, 14.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.72412109375, -0.7038803100585938, -0.6836395263671875, -0.6633987426757812, -0.643157958984375, -0.6229171752929688, -0.6026763916015625, -0.5824356079101562, -0.56219482421875, -0.5419540405273438, -0.5217132568359375, -0.5014724731445312, -0.481231689453125, -0.46099090576171875, -0.4407501220703125, -0.42050933837890625, -0.4002685546875, -0.38002777099609375, -0.3597869873046875, -0.33954620361328125, -0.319305419921875, -0.29906463623046875, -0.2788238525390625, -0.25858306884765625, -0.23834228515625, -0.21810150146484375, -0.1978607177734375, -0.17761993408203125, -0.157379150390625, -0.13713836669921875, -0.1168975830078125, -0.09665679931640625, -0.076416015625, -0.05617523193359375, -0.0359344482421875, -0.01569366455078125, 0.004547119140625, 0.02478790283203125, 0.0450286865234375, 0.06526947021484375, 0.08551025390625, 0.10575103759765625, 0.1259918212890625, 0.14623260498046875, 0.166473388671875, 0.18671417236328125, 0.2069549560546875, 0.22719573974609375, 0.2474365234375, 0.26767730712890625, 0.2879180908203125, 0.30815887451171875, 0.328399658203125, 0.34864044189453125, 0.3688812255859375, 0.38912200927734375, 0.40936279296875, 0.42960357666015625, 0.4498443603515625, 0.47008514404296875, 0.490325927734375, 0.5105667114257812, 0.5308074951171875, 0.5510482788085938, 0.5712890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 8.0, 5.0, 10.0, 16.0, 18.0, 49.0, 68.0, 94.0, 127.0, 246.0, 361.0, 601.0, 971.0, 1692.0, 3034.0, 5765.0, 12546.0, 31145.0, 95906.0, 338862.0, 381927.0, 111785.0, 35553.0, 13715.0, 6368.0, 3322.0, 1732.0, 992.0, 560.0, 357.0, 219.0, 141.0, 113.0, 71.0, 55.0, 30.0, 25.0, 20.0, 12.0, 14.0, 11.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.26581573486328125, -0.2569732666015625, -0.24813079833984375, -0.239288330078125, -0.23044586181640625, -0.2216033935546875, -0.21276092529296875, -0.20391845703125, -0.19507598876953125, -0.1862335205078125, -0.17739105224609375, -0.168548583984375, -0.15970611572265625, -0.1508636474609375, -0.14202117919921875, -0.1331787109375, -0.12433624267578125, -0.1154937744140625, -0.10665130615234375, -0.097808837890625, -0.08896636962890625, -0.0801239013671875, -0.07128143310546875, -0.06243896484375, -0.05359649658203125, -0.0447540283203125, -0.03591156005859375, -0.027069091796875, -0.01822662353515625, -0.0093841552734375, -0.00054168701171875, 0.00830078125, 0.01714324951171875, 0.0259857177734375, 0.03482818603515625, 0.043670654296875, 0.05251312255859375, 0.0613555908203125, 0.07019805908203125, 0.07904052734375, 0.08788299560546875, 0.0967254638671875, 0.10556793212890625, 0.114410400390625, 0.12325286865234375, 0.1320953369140625, 0.14093780517578125, 0.1497802734375, 0.15862274169921875, 0.1674652099609375, 0.17630767822265625, 0.185150146484375, 0.19399261474609375, 0.2028350830078125, 0.21167755126953125, 0.22052001953125, 0.22936248779296875, 0.2382049560546875, 0.24704742431640625, 0.255889892578125, 0.26473236083984375, 0.2735748291015625, 0.28241729736328125, 0.291259765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 3.0, 10.0, 20.0, 14.0, 32.0, 49.0, 104.0, 166.0, 194.0, 159.0, 89.0, 65.0, 24.0, 20.0, 9.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014352798461914062, -0.00013868138194084167, -0.00013383477926254272, -0.00012898817658424377, -0.00012414157390594482, -0.00011929497122764587, -0.00011444836854934692, -0.00010960176587104797, -0.00010475516319274902, -9.990856051445007e-05, -9.506195783615112e-05, -9.021535515785217e-05, -8.536875247955322e-05, -8.052214980125427e-05, -7.567554712295532e-05, -7.082894444465637e-05, -6.598234176635742e-05, -6.113573908805847e-05, -5.628913640975952e-05, -5.144253373146057e-05, -4.659593105316162e-05, -4.174932837486267e-05, -3.690272569656372e-05, -3.205612301826477e-05, -2.720952033996582e-05, -2.236291766166687e-05, -1.751631498336792e-05, -1.266971230506897e-05, -7.82310962677002e-06, -2.9765069484710693e-06, 1.8700957298278809e-06, 6.716698408126831e-06, 1.1563301086425781e-05, 1.640990376472473e-05, 2.125650644302368e-05, 2.6103109121322632e-05, 3.094971179962158e-05, 3.579631447792053e-05, 4.064291715621948e-05, 4.548951983451843e-05, 5.033612251281738e-05, 5.518272519111633e-05, 6.002932786941528e-05, 6.487593054771423e-05, 6.972253322601318e-05, 7.456913590431213e-05, 7.941573858261108e-05, 8.426234126091003e-05, 8.910894393920898e-05, 9.395554661750793e-05, 9.880214929580688e-05, 0.00010364875197410583, 0.00010849535465240479, 0.00011334195733070374, 0.00011818856000900269, 0.00012303516268730164, 0.00012788176536560059, 0.00013272836804389954, 0.00013757497072219849, 0.00014242157340049744, 0.0001472681760787964, 0.00015211477875709534, 0.0001569613814353943, 0.00016180798411369324, 0.0001666545867919922]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 11.0, 15.0, 15.0, 38.0, 34.0, 61.0, 86.0, 138.0, 230.0, 369.0, 661.0, 1097.0, 2043.0, 4198.0, 9645.0, 25478.0, 81229.0, 355227.0, 422951.0, 95323.0, 29080.0, 10751.0, 4799.0, 2183.0, 1200.0, 664.0, 361.0, 222.0, 155.0, 96.0, 55.0, 32.0, 36.0, 12.0, 15.0, 5.0, 9.0, 4.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.41357421875, -0.4017791748046875, -0.389984130859375, -0.3781890869140625, -0.36639404296875, -0.3545989990234375, -0.342803955078125, -0.3310089111328125, -0.3192138671875, -0.3074188232421875, -0.295623779296875, -0.2838287353515625, -0.27203369140625, -0.2602386474609375, -0.248443603515625, -0.2366485595703125, -0.224853515625, -0.2130584716796875, -0.201263427734375, -0.1894683837890625, -0.17767333984375, -0.1658782958984375, -0.154083251953125, -0.1422882080078125, -0.1304931640625, -0.1186981201171875, -0.106903076171875, -0.0951080322265625, -0.08331298828125, -0.0715179443359375, -0.059722900390625, -0.0479278564453125, -0.0361328125, -0.0243377685546875, -0.012542724609375, -0.0007476806640625, 0.01104736328125, 0.0228424072265625, 0.034637451171875, 0.0464324951171875, 0.0582275390625, 0.0700225830078125, 0.081817626953125, 0.0936126708984375, 0.10540771484375, 0.1172027587890625, 0.128997802734375, 0.1407928466796875, 0.152587890625, 0.1643829345703125, 0.176177978515625, 0.1879730224609375, 0.19976806640625, 0.2115631103515625, 0.223358154296875, 0.2351531982421875, 0.2469482421875, 0.2587432861328125, 0.270538330078125, 0.2823333740234375, 0.29412841796875, 0.3059234619140625, 0.317718505859375, 0.3295135498046875, 0.34130859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 9.0, 7.0, 10.0, 13.0, 20.0, 26.0, 24.0, 33.0, 45.0, 53.0, 69.0, 68.0, 104.0, 81.0, 76.0, 76.0, 57.0, 34.0, 30.0, 38.0, 19.0, 16.0, 21.0, 15.0, 10.0, 7.0, 9.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2369384765625, -0.22908973693847656, -0.22124099731445312, -0.2133922576904297, -0.20554351806640625, -0.1976947784423828, -0.18984603881835938, -0.18199729919433594, -0.1741485595703125, -0.16629981994628906, -0.15845108032226562, -0.1506023406982422, -0.14275360107421875, -0.1349048614501953, -0.12705612182617188, -0.11920738220214844, -0.111358642578125, -0.10350990295410156, -0.09566116333007812, -0.08781242370605469, -0.07996368408203125, -0.07211494445800781, -0.06426620483398438, -0.05641746520996094, -0.0485687255859375, -0.04071998596191406, -0.032871246337890625, -0.025022506713867188, -0.01717376708984375, -0.009325027465820312, -0.001476287841796875, 0.0063724517822265625, 0.01422119140625, 0.022069931030273438, 0.029918670654296875, 0.03776741027832031, 0.04561614990234375, 0.05346488952636719, 0.061313629150390625, 0.06916236877441406, 0.0770111083984375, 0.08485984802246094, 0.09270858764648438, 0.10055732727050781, 0.10840606689453125, 0.11625480651855469, 0.12410354614257812, 0.13195228576660156, 0.139801025390625, 0.14764976501464844, 0.15549850463867188, 0.1633472442626953, 0.17119598388671875, 0.1790447235107422, 0.18689346313476562, 0.19474220275878906, 0.2025909423828125, 0.21043968200683594, 0.21828842163085938, 0.2261371612548828, 0.23398590087890625, 0.2418346405029297, 0.24968338012695312, 0.25753211975097656, 0.265380859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 6.0, 13.0, 18.0, 32.0, 56.0, 111.0, 161.0, 176.0, 172.0, 100.0, 64.0, 36.0, 11.0, 13.0, 12.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4878716468811035, -5.288812160491943, -5.089752197265625, -4.890692710876465, -4.691633224487305, -4.4925737380981445, -4.293514251708984, -4.094454288482666, -3.895394802093506, -3.6963353157043457, -3.4972755908966064, -3.298215866088867, -3.099156379699707, -2.900096893310547, -2.7010371685028076, -2.5019774436950684, -2.302917957305908, -2.103858470916748, -1.9047987461090088, -1.705739140510559, -1.5066795349121094, -1.3076199293136597, -1.10856032371521, -0.9095007181167603, -0.7104411125183105, -0.5113815069198608, -0.31232190132141113, -0.11326229572296143, 0.08579730987548828, 0.284856915473938, 0.4839165210723877, 0.6829761266708374, 0.8820362091064453, 1.081095814704895, 1.2801554203033447, 1.4792150259017944, 1.6782746315002441, 1.8773342370986938, 2.0763938426971436, 2.275453567504883, 2.474513053894043, 2.673572540283203, 2.8726322650909424, 3.0716919898986816, 3.270751476287842, 3.469810962677002, 3.668870687484741, 3.8679304122924805, 4.066989898681641, 4.266049385070801, 4.465108871459961, 4.664168834686279, 4.8632283210754395, 5.0622878074646, 5.261347770690918, 5.460407257080078, 5.659466743469238, 5.858526229858398, 6.057585716247559, 6.256645679473877, 6.455705165863037, 6.654764652252197, 6.853824615478516, 7.052884101867676, 7.251943588256836]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 3.0, 6.0, 5.0, 10.0, 9.0, 5.0, 9.0, 11.0, 23.0, 15.0, 20.0, 24.0, 37.0, 40.0, 23.0, 40.0, 46.0, 45.0, 34.0, 44.0, 45.0, 57.0, 41.0, 37.0, 41.0, 38.0, 42.0, 43.0, 23.0, 29.0, 23.0, 24.0, 24.0, 13.0, 17.0, 8.0, 6.0, 10.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5036134719848633, -3.3969221115112305, -3.2902307510375977, -3.183539390563965, -3.076848030090332, -2.970156669616699, -2.8634653091430664, -2.7567739486694336, -2.650082588195801, -2.543391227722168, -2.436699867248535, -2.3300085067749023, -2.2233171463012695, -2.1166257858276367, -2.009934425354004, -1.9032431840896606, -1.7965519428253174, -1.6898605823516846, -1.5831692218780518, -1.476477861404419, -1.3697865009307861, -1.2630951404571533, -1.15640389919281, -1.0497125387191772, -0.9430211782455444, -0.8363298177719116, -0.7296384572982788, -0.6229471564292908, -0.516255795955658, -0.40956443548202515, -0.3028731346130371, -0.1961817741394043, -0.08949017524719238, 0.017201170325279236, 0.12389251589775085, 0.23058384656906128, 0.3372752070426941, 0.4439665675163269, 0.5506578683853149, 0.6573492288589478, 0.7640405893325806, 0.8707319498062134, 0.9774233102798462, 1.0841145515441895, 1.1908059120178223, 1.297497272491455, 1.404188632965088, 1.5108799934387207, 1.6175713539123535, 1.7242627143859863, 1.8309540748596191, 1.937645435333252, 2.0443367958068848, 2.1510281562805176, 2.2577195167541504, 2.364410877227783, 2.471102237701416, 2.577793598175049, 2.6844849586486816, 2.7911763191223145, 2.8978676795959473, 3.00455904006958, 3.111250400543213, 3.2179417610168457, 3.3246328830718994]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 10.0, 11.0, 15.0, 21.0, 25.0, 28.0, 52.0, 51.0, 84.0, 123.0, 147.0, 270.0, 450.0, 839.0, 1881.0, 4809.0, 15530.0, 94514.0, 3973517.0, 79618.0, 14015.0, 4456.0, 1707.0, 830.0, 433.0, 276.0, 160.0, 107.0, 78.0, 54.0, 36.0, 27.0, 24.0, 11.0, 15.0, 13.0, 3.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8291015625, -1.7572784423828125, -1.685455322265625, -1.6136322021484375, -1.54180908203125, -1.4699859619140625, -1.398162841796875, -1.3263397216796875, -1.2545166015625, -1.1826934814453125, -1.110870361328125, -1.0390472412109375, -0.96722412109375, -0.8954010009765625, -0.823577880859375, -0.7517547607421875, -0.679931640625, -0.6081085205078125, -0.536285400390625, -0.4644622802734375, -0.39263916015625, -0.3208160400390625, -0.248992919921875, -0.1771697998046875, -0.1053466796875, -0.0335235595703125, 0.038299560546875, 0.1101226806640625, 0.18194580078125, 0.2537689208984375, 0.325592041015625, 0.3974151611328125, 0.46923828125, 0.5410614013671875, 0.612884521484375, 0.6847076416015625, 0.75653076171875, 0.8283538818359375, 0.900177001953125, 0.9720001220703125, 1.0438232421875, 1.1156463623046875, 1.187469482421875, 1.2592926025390625, 1.33111572265625, 1.4029388427734375, 1.474761962890625, 1.5465850830078125, 1.618408203125, 1.6902313232421875, 1.762054443359375, 1.8338775634765625, 1.90570068359375, 1.9775238037109375, 2.049346923828125, 2.1211700439453125, 2.1929931640625, 2.2648162841796875, 2.336639404296875, 2.4084625244140625, 2.48028564453125, 2.5521087646484375, 2.623931884765625, 2.6957550048828125, 2.767578125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 6.0, 7.0, 14.0, 13.0, 24.0, 36.0, 61.0, 66.0, 61.0, 75.0, 108.0, 98.0, 87.0, 76.0, 74.0, 60.0, 41.0, 23.0, 23.0, 13.0, 6.0, 7.0, 3.0, 8.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.279541015625, -0.27059173583984375, -0.2616424560546875, -0.25269317626953125, -0.243743896484375, -0.23479461669921875, -0.2258453369140625, -0.21689605712890625, -0.20794677734375, -0.19899749755859375, -0.1900482177734375, -0.18109893798828125, -0.172149658203125, -0.16320037841796875, -0.1542510986328125, -0.14530181884765625, -0.1363525390625, -0.12740325927734375, -0.1184539794921875, -0.10950469970703125, -0.100555419921875, -0.09160614013671875, -0.0826568603515625, -0.07370758056640625, -0.06475830078125, -0.05580902099609375, -0.0468597412109375, -0.03791046142578125, -0.028961181640625, -0.02001190185546875, -0.0110626220703125, -0.00211334228515625, 0.0068359375, 0.01578521728515625, 0.0247344970703125, 0.03368377685546875, 0.042633056640625, 0.05158233642578125, 0.0605316162109375, 0.06948089599609375, 0.07843017578125, 0.08737945556640625, 0.0963287353515625, 0.10527801513671875, 0.114227294921875, 0.12317657470703125, 0.1321258544921875, 0.14107513427734375, 0.1500244140625, 0.15897369384765625, 0.1679229736328125, 0.17687225341796875, 0.185821533203125, 0.19477081298828125, 0.2037200927734375, 0.21266937255859375, 0.22161865234375, 0.23056793212890625, 0.2395172119140625, 0.24846649169921875, 0.257415771484375, 0.26636505126953125, 0.2753143310546875, 0.28426361083984375, 0.293212890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 6.0, 3.0, 6.0, 2.0, 12.0, 18.0, 8.0, 17.0, 23.0, 23.0, 30.0, 42.0, 56.0, 68.0, 154.0, 502.0, 3551.0, 55337.0, 4087101.0, 42987.0, 3246.0, 559.0, 152.0, 86.0, 79.0, 36.0, 26.0, 28.0, 27.0, 16.0, 14.0, 18.0, 13.0, 14.0, 8.0, 3.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.3828125, -5.24639892578125, -5.1099853515625, -4.97357177734375, -4.837158203125, -4.70074462890625, -4.5643310546875, -4.42791748046875, -4.29150390625, -4.15509033203125, -4.0186767578125, -3.88226318359375, -3.745849609375, -3.60943603515625, -3.4730224609375, -3.33660888671875, -3.2001953125, -3.06378173828125, -2.9273681640625, -2.79095458984375, -2.654541015625, -2.51812744140625, -2.3817138671875, -2.24530029296875, -2.10888671875, -1.97247314453125, -1.8360595703125, -1.69964599609375, -1.563232421875, -1.42681884765625, -1.2904052734375, -1.15399169921875, -1.017578125, -0.88116455078125, -0.7447509765625, -0.60833740234375, -0.471923828125, -0.33551025390625, -0.1990966796875, -0.06268310546875, 0.07373046875, 0.21014404296875, 0.3465576171875, 0.48297119140625, 0.619384765625, 0.75579833984375, 0.8922119140625, 1.02862548828125, 1.1650390625, 1.30145263671875, 1.4378662109375, 1.57427978515625, 1.710693359375, 1.84710693359375, 1.9835205078125, 2.11993408203125, 2.25634765625, 2.39276123046875, 2.5291748046875, 2.66558837890625, 2.802001953125, 2.93841552734375, 3.0748291015625, 3.21124267578125, 3.34765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 6.0, 8.0, 22.0, 29.0, 84.0, 206.0, 2243.0, 1127.0, 190.0, 73.0, 31.0, 26.0, 13.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.30023956298828125, -0.2699127197265625, -0.23958587646484375, -0.209259033203125, -0.17893218994140625, -0.1486053466796875, -0.11827850341796875, -0.08795166015625, -0.05762481689453125, -0.0272979736328125, 0.00302886962890625, 0.033355712890625, 0.06368255615234375, 0.0940093994140625, 0.12433624267578125, 0.1546630859375, 0.18498992919921875, 0.2153167724609375, 0.24564361572265625, 0.275970458984375, 0.30629730224609375, 0.3366241455078125, 0.36695098876953125, 0.39727783203125, 0.42760467529296875, 0.4579315185546875, 0.48825836181640625, 0.518585205078125, 0.5489120483398438, 0.5792388916015625, 0.6095657348632812, 0.639892578125, 0.6702194213867188, 0.7005462646484375, 0.7308731079101562, 0.761199951171875, 0.7915267944335938, 0.8218536376953125, 0.8521804809570312, 0.88250732421875, 0.9128341674804688, 0.9431610107421875, 0.9734878540039062, 1.003814697265625, 1.0341415405273438, 1.0644683837890625, 1.0947952270507812, 1.1251220703125, 1.1554489135742188, 1.1857757568359375, 1.2161026000976562, 1.246429443359375, 1.2767562866210938, 1.3070831298828125, 1.3374099731445312, 1.36773681640625, 1.3980636596679688, 1.4283905029296875, 1.4587173461914062, 1.489044189453125, 1.5193710327148438, 1.5496978759765625, 1.5800247192382812, 1.6103515625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 11.0, 22.0, 71.0, 328.0, 339.0, 149.0, 42.0, 17.0, 10.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.684720993041992, -8.363730430603027, -8.042738914489746, -7.721748352050781, -7.400757789611816, -7.079766750335693, -6.75877571105957, -6.4377851486206055, -6.116794109344482, -5.795803070068359, -5.4748125076293945, -5.1538214683532715, -4.832830429077148, -4.511839866638184, -4.1908488273620605, -3.8698580265045166, -3.5488672256469727, -3.2278764247894287, -2.9068856239318848, -2.5858945846557617, -2.2649037837982178, -1.9439129829406738, -1.6229220628738403, -1.3019311428070068, -0.9809403419494629, -0.6599494814872742, -0.33895862102508545, -0.01796776056289673, 0.303023099899292, 0.6240139007568359, 0.9450048208236694, 1.265995740890503, 1.5869855880737305, 1.9079763889312744, 2.2289671897888184, 2.5499582290649414, 2.8709490299224854, 3.1919398307800293, 3.5129308700561523, 3.8339216709136963, 4.15491247177124, 4.475903511047363, 4.796894073486328, 5.117885112762451, 5.438876152038574, 5.759866714477539, 6.080857753753662, 6.401848793029785, 6.72283935546875, 7.043830394744873, 7.364820957183838, 7.685811996459961, 8.006802558898926, 8.32779312133789, 8.648784637451172, 8.969775199890137, 9.290765762329102, 9.611756324768066, 9.932747840881348, 10.253738403320312, 10.574728965759277, 10.895719528198242, 11.216711044311523, 11.537701606750488, 11.85869312286377]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 11.0, 7.0, 11.0, 15.0, 43.0, 37.0, 52.0, 65.0, 69.0, 84.0, 108.0, 80.0, 71.0, 73.0, 60.0, 69.0, 41.0, 30.0, 23.0, 20.0, 15.0, 6.0, 4.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.737337589263916, -3.6351592540740967, -3.5329811573028564, -3.430802822113037, -3.3286244869232178, -3.2264461517333984, -3.124268054962158, -3.022089719772339, -2.9199113845825195, -2.8177330493927, -2.71555495262146, -2.6133766174316406, -2.5111982822418213, -2.409019947052002, -2.3068418502807617, -2.2046635150909424, -2.102485418319702, -2.000307083129883, -1.898128867149353, -1.7959506511688232, -1.693772315979004, -1.5915940999984741, -1.4894158840179443, -1.387237548828125, -1.2850593328475952, -1.1828811168670654, -1.080702781677246, -0.9785245656967163, -0.8763462901115417, -0.7741680145263672, -0.6719897985458374, -0.5698115229606628, -0.4676334857940674, -0.3654552102088928, -0.26327696442604065, -0.16109871864318848, -0.058920443058013916, 0.043257832527160645, 0.14543604850769043, 0.247614324092865, 0.34979259967803955, 0.4519708752632141, 0.5541491508483887, 0.6563273668289185, 0.758505642414093, 0.8606839179992676, 0.9628621339797974, 1.0650403499603271, 1.1672186851501465, 1.2693969011306763, 1.3715752363204956, 1.4737534523010254, 1.5759317874908447, 1.6781100034713745, 1.7802882194519043, 1.8824665546417236, 1.9846447706222534, 2.086822986602783, 2.1890013217926025, 2.291179656982422, 2.393357753753662, 2.4955360889434814, 2.597714424133301, 2.699892520904541, 2.8020708560943604]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 9.0, 15.0, 21.0, 29.0, 48.0, 51.0, 58.0, 99.0, 171.0, 232.0, 353.0, 579.0, 1068.0, 2067.0, 4396.0, 10738.0, 31640.0, 128881.0, 543421.0, 245692.0, 51229.0, 15640.0, 6056.0, 2722.0, 1338.0, 753.0, 425.0, 260.0, 158.0, 113.0, 91.0, 55.0, 46.0, 28.0, 19.0, 8.0, 12.0, 7.0, 9.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2783203125, -1.236663818359375, -1.19500732421875, -1.153350830078125, -1.1116943359375, -1.070037841796875, -1.02838134765625, -0.986724853515625, -0.945068359375, -0.903411865234375, -0.86175537109375, -0.820098876953125, -0.7784423828125, -0.736785888671875, -0.69512939453125, -0.653472900390625, -0.61181640625, -0.570159912109375, -0.52850341796875, -0.486846923828125, -0.4451904296875, -0.403533935546875, -0.36187744140625, -0.320220947265625, -0.278564453125, -0.236907958984375, -0.19525146484375, -0.153594970703125, -0.1119384765625, -0.070281982421875, -0.02862548828125, 0.013031005859375, 0.0546875, 0.096343994140625, 0.13800048828125, 0.179656982421875, 0.2213134765625, 0.262969970703125, 0.30462646484375, 0.346282958984375, 0.387939453125, 0.429595947265625, 0.47125244140625, 0.512908935546875, 0.5545654296875, 0.596221923828125, 0.63787841796875, 0.679534912109375, 0.72119140625, 0.762847900390625, 0.80450439453125, 0.846160888671875, 0.8878173828125, 0.929473876953125, 0.97113037109375, 1.012786865234375, 1.054443359375, 1.096099853515625, 1.13775634765625, 1.179412841796875, 1.2210693359375, 1.262725830078125, 1.30438232421875, 1.346038818359375, 1.3876953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 10.0, 18.0, 15.0, 22.0, 23.0, 45.0, 55.0, 60.0, 82.0, 89.0, 72.0, 70.0, 76.0, 73.0, 62.0, 49.0, 46.0, 34.0, 22.0, 12.0, 11.0, 13.0, 9.0, 7.0, 5.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29833984375, -0.2893104553222656, -0.28028106689453125, -0.2712516784667969, -0.2622222900390625, -0.2531929016113281, -0.24416351318359375, -0.23513412475585938, -0.226104736328125, -0.21707534790039062, -0.20804595947265625, -0.19901657104492188, -0.1899871826171875, -0.18095779418945312, -0.17192840576171875, -0.16289901733398438, -0.15386962890625, -0.14484024047851562, -0.13581085205078125, -0.12678146362304688, -0.1177520751953125, -0.10872268676757812, -0.09969329833984375, -0.09066390991210938, -0.081634521484375, -0.07260513305664062, -0.06357574462890625, -0.054546356201171875, -0.0455169677734375, -0.036487579345703125, -0.02745819091796875, -0.018428802490234375, -0.0093994140625, -0.000370025634765625, 0.00865936279296875, 0.017688751220703125, 0.0267181396484375, 0.035747528076171875, 0.04477691650390625, 0.053806304931640625, 0.062835693359375, 0.07186508178710938, 0.08089447021484375, 0.08992385864257812, 0.0989532470703125, 0.10798263549804688, 0.11701202392578125, 0.12604141235351562, 0.13507080078125, 0.14410018920898438, 0.15312957763671875, 0.16215896606445312, 0.1711883544921875, 0.18021774291992188, 0.18924713134765625, 0.19827651977539062, 0.207305908203125, 0.21633529663085938, 0.22536468505859375, 0.23439407348632812, 0.2434234619140625, 0.2524528503417969, 0.26148223876953125, 0.2705116271972656, 0.279541015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 12.0, 23.0, 23.0, 21.0, 31.0, 39.0, 84.0, 110.0, 190.0, 291.0, 436.0, 878.0, 1561.0, 3219.0, 6466.0, 14477.0, 35249.0, 99908.0, 324528.0, 371646.0, 117406.0, 40691.0, 16292.0, 7258.0, 3509.0, 1879.0, 990.0, 493.0, 318.0, 173.0, 107.0, 77.0, 53.0, 38.0, 26.0, 16.0, 9.0, 7.0, 1.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.73583984375, -0.712158203125, -0.6884765625, -0.664794921875, -0.64111328125, -0.617431640625, -0.59375, -0.570068359375, -0.54638671875, -0.522705078125, -0.4990234375, -0.475341796875, -0.45166015625, -0.427978515625, -0.404296875, -0.380615234375, -0.35693359375, -0.333251953125, -0.3095703125, -0.285888671875, -0.26220703125, -0.238525390625, -0.21484375, -0.191162109375, -0.16748046875, -0.143798828125, -0.1201171875, -0.096435546875, -0.07275390625, -0.049072265625, -0.025390625, -0.001708984375, 0.02197265625, 0.045654296875, 0.0693359375, 0.093017578125, 0.11669921875, 0.140380859375, 0.1640625, 0.187744140625, 0.21142578125, 0.235107421875, 0.2587890625, 0.282470703125, 0.30615234375, 0.329833984375, 0.353515625, 0.377197265625, 0.40087890625, 0.424560546875, 0.4482421875, 0.471923828125, 0.49560546875, 0.519287109375, 0.54296875, 0.566650390625, 0.59033203125, 0.614013671875, 0.6376953125, 0.661376953125, 0.68505859375, 0.708740234375, 0.732421875, 0.756103515625, 0.77978515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 5.0, 4.0, 5.0, 8.0, 12.0, 8.0, 8.0, 14.0, 15.0, 17.0, 22.0, 20.0, 26.0, 28.0, 41.0, 45.0, 36.0, 42.0, 47.0, 38.0, 39.0, 41.0, 47.0, 40.0, 61.0, 41.0, 32.0, 35.0, 44.0, 29.0, 31.0, 19.0, 19.0, 14.0, 11.0, 17.0, 9.0, 5.0, 9.0, 2.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70703125, -0.6821975708007812, -0.6573638916015625, -0.6325302124023438, -0.607696533203125, -0.5828628540039062, -0.5580291748046875, -0.5331954956054688, -0.50836181640625, -0.48352813720703125, -0.4586944580078125, -0.43386077880859375, -0.409027099609375, -0.38419342041015625, -0.3593597412109375, -0.33452606201171875, -0.3096923828125, -0.28485870361328125, -0.2600250244140625, -0.23519134521484375, -0.210357666015625, -0.18552398681640625, -0.1606903076171875, -0.13585662841796875, -0.11102294921875, -0.08618927001953125, -0.0613555908203125, -0.03652191162109375, -0.011688232421875, 0.01314544677734375, 0.0379791259765625, 0.06281280517578125, 0.087646484375, 0.11248016357421875, 0.1373138427734375, 0.16214752197265625, 0.186981201171875, 0.21181488037109375, 0.2366485595703125, 0.26148223876953125, 0.28631591796875, 0.31114959716796875, 0.3359832763671875, 0.36081695556640625, 0.385650634765625, 0.41048431396484375, 0.4353179931640625, 0.46015167236328125, 0.4849853515625, 0.5098190307617188, 0.5346527099609375, 0.5594863891601562, 0.584320068359375, 0.6091537475585938, 0.6339874267578125, 0.6588211059570312, 0.68365478515625, 0.7084884643554688, 0.7333221435546875, 0.7581558227539062, 0.782989501953125, 0.8078231811523438, 0.8326568603515625, 0.8574905395507812, 0.88232421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 10.0, 11.0, 21.0, 21.0, 34.0, 60.0, 72.0, 139.0, 194.0, 318.0, 617.0, 1369.0, 2914.0, 7404.0, 24592.0, 122049.0, 602637.0, 228915.0, 38926.0, 10801.0, 3850.0, 1685.0, 819.0, 440.0, 232.0, 135.0, 97.0, 50.0, 44.0, 31.0, 17.0, 12.0, 9.0, 11.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.607421875, -0.5903892517089844, -0.5733566284179688, -0.5563240051269531, -0.5392913818359375, -0.5222587585449219, -0.5052261352539062, -0.4881935119628906, -0.471160888671875, -0.4541282653808594, -0.43709564208984375, -0.4200630187988281, -0.4030303955078125, -0.3859977722167969, -0.36896514892578125, -0.3519325256347656, -0.33489990234375, -0.3178672790527344, -0.30083465576171875, -0.2838020324707031, -0.2667694091796875, -0.24973678588867188, -0.23270416259765625, -0.21567153930664062, -0.198638916015625, -0.18160629272460938, -0.16457366943359375, -0.14754104614257812, -0.1305084228515625, -0.11347579956054688, -0.09644317626953125, -0.07941055297851562, -0.0623779296875, -0.045345306396484375, -0.02831268310546875, -0.011280059814453125, 0.0057525634765625, 0.022785186767578125, 0.03981781005859375, 0.056850433349609375, 0.073883056640625, 0.09091567993164062, 0.10794830322265625, 0.12498092651367188, 0.1420135498046875, 0.15904617309570312, 0.17607879638671875, 0.19311141967773438, 0.21014404296875, 0.22717666625976562, 0.24420928955078125, 0.2612419128417969, 0.2782745361328125, 0.2953071594238281, 0.31233978271484375, 0.3293724060058594, 0.346405029296875, 0.3634376525878906, 0.38047027587890625, 0.3975028991699219, 0.4145355224609375, 0.4315681457519531, 0.44860076904296875, 0.4656333923339844, 0.482666015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 6.0, 8.0, 12.0, 20.0, 21.0, 27.0, 61.0, 73.0, 99.0, 117.0, 142.0, 111.0, 102.0, 49.0, 40.0, 29.0, 15.0, 13.0, 15.0, 7.0, 3.0, 2.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012373924255371094, -0.00012001954019069672, -0.0001162998378276825, -0.00011258013546466827, -0.00010886043310165405, -0.00010514073073863983, -0.00010142102837562561, -9.770132601261139e-05, -9.398162364959717e-05, -9.026192128658295e-05, -8.654221892356873e-05, -8.28225165605545e-05, -7.910281419754028e-05, -7.538311183452606e-05, -7.166340947151184e-05, -6.794370710849762e-05, -6.42240047454834e-05, -6.050430238246918e-05, -5.6784600019454956e-05, -5.3064897656440735e-05, -4.9345195293426514e-05, -4.562549293041229e-05, -4.190579056739807e-05, -3.818608820438385e-05, -3.446638584136963e-05, -3.074668347835541e-05, -2.7026981115341187e-05, -2.3307278752326965e-05, -1.9587576389312744e-05, -1.5867874026298523e-05, -1.2148171663284302e-05, -8.42846930027008e-06, -4.708766937255859e-06, -9.890645742416382e-07, 2.730637788772583e-06, 6.450340151786804e-06, 1.0170042514801025e-05, 1.3889744877815247e-05, 1.7609447240829468e-05, 2.132914960384369e-05, 2.504885196685791e-05, 2.876855432987213e-05, 3.248825669288635e-05, 3.6207959055900574e-05, 3.9927661418914795e-05, 4.3647363781929016e-05, 4.736706614494324e-05, 5.108676850795746e-05, 5.480647087097168e-05, 5.85261732339859e-05, 6.224587559700012e-05, 6.596557796001434e-05, 6.968528032302856e-05, 7.340498268604279e-05, 7.712468504905701e-05, 8.084438741207123e-05, 8.456408977508545e-05, 8.828379213809967e-05, 9.200349450111389e-05, 9.572319686412811e-05, 9.944289922714233e-05, 0.00010316260159015656, 0.00010688230395317078, 0.000110602006316185, 0.00011432170867919922]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 8.0, 11.0, 21.0, 17.0, 30.0, 37.0, 57.0, 86.0, 113.0, 176.0, 299.0, 538.0, 864.0, 1514.0, 2984.0, 6654.0, 16576.0, 51159.0, 246474.0, 545048.0, 123198.0, 31469.0, 11220.0, 4742.0, 2288.0, 1198.0, 644.0, 367.0, 251.0, 139.0, 101.0, 79.0, 50.0, 30.0, 27.0, 20.0, 10.0, 19.0, 8.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.55615234375, -0.5383834838867188, -0.5206146240234375, -0.5028457641601562, -0.485076904296875, -0.46730804443359375, -0.4495391845703125, -0.43177032470703125, -0.41400146484375, -0.39623260498046875, -0.3784637451171875, -0.36069488525390625, -0.342926025390625, -0.32515716552734375, -0.3073883056640625, -0.28961944580078125, -0.2718505859375, -0.25408172607421875, -0.2363128662109375, -0.21854400634765625, -0.200775146484375, -0.18300628662109375, -0.1652374267578125, -0.14746856689453125, -0.12969970703125, -0.11193084716796875, -0.0941619873046875, -0.07639312744140625, -0.058624267578125, -0.04085540771484375, -0.0230865478515625, -0.00531768798828125, 0.012451171875, 0.03022003173828125, 0.0479888916015625, 0.06575775146484375, 0.083526611328125, 0.10129547119140625, 0.1190643310546875, 0.13683319091796875, 0.15460205078125, 0.17237091064453125, 0.1901397705078125, 0.20790863037109375, 0.225677490234375, 0.24344635009765625, 0.2612152099609375, 0.27898406982421875, 0.2967529296875, 0.31452178955078125, 0.3322906494140625, 0.35005950927734375, 0.367828369140625, 0.38559722900390625, 0.4033660888671875, 0.42113494873046875, 0.43890380859375, 0.45667266845703125, 0.4744415283203125, 0.49221038818359375, 0.509979248046875, 0.5277481079101562, 0.5455169677734375, 0.5632858276367188, 0.5810546875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 0.0, 5.0, 9.0, 7.0, 4.0, 7.0, 7.0, 9.0, 19.0, 18.0, 31.0, 28.0, 37.0, 57.0, 57.0, 76.0, 100.0, 70.0, 75.0, 74.0, 48.0, 55.0, 42.0, 34.0, 26.0, 21.0, 20.0, 10.0, 11.0, 12.0, 5.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.38720703125, -0.37526702880859375, -0.3633270263671875, -0.35138702392578125, -0.339447021484375, -0.32750701904296875, -0.3155670166015625, -0.30362701416015625, -0.29168701171875, -0.27974700927734375, -0.2678070068359375, -0.25586700439453125, -0.243927001953125, -0.23198699951171875, -0.2200469970703125, -0.20810699462890625, -0.1961669921875, -0.18422698974609375, -0.1722869873046875, -0.16034698486328125, -0.148406982421875, -0.13646697998046875, -0.1245269775390625, -0.11258697509765625, -0.10064697265625, -0.08870697021484375, -0.0767669677734375, -0.06482696533203125, -0.052886962890625, -0.04094696044921875, -0.0290069580078125, -0.01706695556640625, -0.005126953125, 0.00681304931640625, 0.0187530517578125, 0.03069305419921875, 0.042633056640625, 0.05457305908203125, 0.0665130615234375, 0.07845306396484375, 0.09039306640625, 0.10233306884765625, 0.1142730712890625, 0.12621307373046875, 0.138153076171875, 0.15009307861328125, 0.1620330810546875, 0.17397308349609375, 0.1859130859375, 0.19785308837890625, 0.2097930908203125, 0.22173309326171875, 0.233673095703125, 0.24561309814453125, 0.2575531005859375, 0.26949310302734375, 0.28143310546875, 0.29337310791015625, 0.3053131103515625, 0.31725311279296875, 0.329193115234375, 0.34113311767578125, 0.3530731201171875, 0.36501312255859375, 0.376953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 8.0, 13.0, 32.0, 73.0, 131.0, 177.0, 209.0, 149.0, 87.0, 41.0, 30.0, 18.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.909470558166504, -7.619542121887207, -7.32961368560791, -7.039685249328613, -6.749756813049316, -6.4598283767700195, -6.169900417327881, -5.879971981048584, -5.590043544769287, -5.30011510848999, -5.010186672210693, -4.7202582359313965, -4.430330276489258, -4.140401840209961, -3.850473403930664, -3.560544967651367, -3.2706165313720703, -2.9806880950927734, -2.6907596588134766, -2.400831460952759, -2.110903024673462, -1.820974588394165, -1.5310462713241577, -1.2411179542541504, -0.9511895179748535, -0.6612611413002014, -0.3713327646255493, -0.08140438795089722, 0.20852398872375488, 0.49845242500305176, 0.7883807420730591, 1.0783090591430664, 1.3682374954223633, 1.6581659317016602, 1.9480942487716675, 2.238022565841675, 2.5279510021209717, 2.8178794384002686, 3.1078076362609863, 3.397736072540283, 3.68766450881958, 3.977592945098877, 4.267521381378174, 4.557449817657471, 4.847377777099609, 5.137306213378906, 5.427234649658203, 5.7171630859375, 6.007091522216797, 6.297019958496094, 6.586948394775391, 6.8768768310546875, 7.166805267333984, 7.456733703613281, 7.74666166305542, 8.036590576171875, 8.326519012451172, 8.616447448730469, 8.906375885009766, 9.196304321289062, 9.48623275756836, 9.776161193847656, 10.066089630126953, 10.35601806640625, 10.64594554901123]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 7.0, 1.0, 8.0, 9.0, 9.0, 12.0, 14.0, 18.0, 16.0, 30.0, 20.0, 29.0, 38.0, 39.0, 32.0, 44.0, 50.0, 49.0, 54.0, 51.0, 35.0, 44.0, 47.0, 37.0, 43.0, 36.0, 39.0, 30.0, 32.0, 18.0, 22.0, 14.0, 15.0, 17.0, 8.0, 13.0, 7.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.7762956619262695, -4.626414775848389, -4.47653341293335, -4.326652526855469, -4.176771640777588, -4.026890754699707, -3.877009391784668, -3.727128505706787, -3.577247381210327, -3.427366256713867, -3.2774853706359863, -3.1276042461395264, -2.9777231216430664, -2.8278422355651855, -2.6779611110687256, -2.5280799865722656, -2.3781991004943848, -2.228317975997925, -2.078437089920044, -1.928555965423584, -1.7786749601364136, -1.6287939548492432, -1.4789128303527832, -1.3290318250656128, -1.1791508197784424, -1.029269814491272, -0.8793887495994568, -0.7295076847076416, -0.5796266794204712, -0.4297456741333008, -0.2798646092414856, -0.1299835443496704, 0.019897937774658203, 0.169778972864151, 0.3196600079536438, 0.4695410430431366, 0.6194220781326294, 0.7693030834197998, 0.919184148311615, 1.0690652132034302, 1.2189462184906006, 1.368827223777771, 1.5187082290649414, 1.6685893535614014, 1.8184703588485718, 1.9683513641357422, 2.118232488632202, 2.268113613128662, 2.417994499206543, 2.567875623703003, 2.717756509780884, 2.8676376342773438, 3.0175185203552246, 3.1673996448516846, 3.3172807693481445, 3.4671616554260254, 3.6170427799224854, 3.7669239044189453, 3.916804790496826, 4.066685676574707, 4.216567039489746, 4.366447925567627, 4.516328811645508, 4.666210174560547, 4.816091060638428]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 8.0, 8.0, 13.0, 29.0, 31.0, 41.0, 54.0, 87.0, 124.0, 254.0, 501.0, 1154.0, 3387.0, 14885.0, 369971.0, 3773888.0, 22053.0, 4730.0, 1603.0, 686.0, 325.0, 171.0, 100.0, 59.0, 36.0, 27.0, 16.0, 5.0, 10.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.84765625, -3.7410888671875, -3.634521484375, -3.5279541015625, -3.42138671875, -3.3148193359375, -3.208251953125, -3.1016845703125, -2.9951171875, -2.8885498046875, -2.781982421875, -2.6754150390625, -2.56884765625, -2.4622802734375, -2.355712890625, -2.2491455078125, -2.142578125, -2.0360107421875, -1.929443359375, -1.8228759765625, -1.71630859375, -1.6097412109375, -1.503173828125, -1.3966064453125, -1.2900390625, -1.1834716796875, -1.076904296875, -0.9703369140625, -0.86376953125, -0.7572021484375, -0.650634765625, -0.5440673828125, -0.4375, -0.3309326171875, -0.224365234375, -0.1177978515625, -0.01123046875, 0.0953369140625, 0.201904296875, 0.3084716796875, 0.4150390625, 0.5216064453125, 0.628173828125, 0.7347412109375, 0.84130859375, 0.9478759765625, 1.054443359375, 1.1610107421875, 1.267578125, 1.3741455078125, 1.480712890625, 1.5872802734375, 1.69384765625, 1.8004150390625, 1.906982421875, 2.0135498046875, 2.1201171875, 2.2266845703125, 2.333251953125, 2.4398193359375, 2.54638671875, 2.6529541015625, 2.759521484375, 2.8660888671875, 2.97265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 12.0, 12.0, 23.0, 48.0, 52.0, 66.0, 76.0, 106.0, 116.0, 103.0, 91.0, 70.0, 62.0, 64.0, 36.0, 21.0, 16.0, 5.0, 10.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.529296875, -0.5163497924804688, -0.5034027099609375, -0.49045562744140625, -0.477508544921875, -0.46456146240234375, -0.4516143798828125, -0.43866729736328125, -0.42572021484375, -0.41277313232421875, -0.3998260498046875, -0.38687896728515625, -0.373931884765625, -0.36098480224609375, -0.3480377197265625, -0.33509063720703125, -0.3221435546875, -0.30919647216796875, -0.2962493896484375, -0.28330230712890625, -0.270355224609375, -0.25740814208984375, -0.2444610595703125, -0.23151397705078125, -0.21856689453125, -0.20561981201171875, -0.1926727294921875, -0.17972564697265625, -0.166778564453125, -0.15383148193359375, -0.1408843994140625, -0.12793731689453125, -0.114990234375, -0.10204315185546875, -0.0890960693359375, -0.07614898681640625, -0.063201904296875, -0.05025482177734375, -0.0373077392578125, -0.02436065673828125, -0.01141357421875, 0.00153350830078125, 0.0144805908203125, 0.02742767333984375, 0.040374755859375, 0.05332183837890625, 0.0662689208984375, 0.07921600341796875, 0.0921630859375, 0.10511016845703125, 0.1180572509765625, 0.13100433349609375, 0.143951416015625, 0.15689849853515625, 0.1698455810546875, 0.18279266357421875, 0.19573974609375, 0.20868682861328125, 0.2216339111328125, 0.23458099365234375, 0.247528076171875, 0.26047515869140625, 0.2734222412109375, 0.28636932373046875, 0.29931640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 12.0, 8.0, 14.0, 19.0, 27.0, 55.0, 78.0, 115.0, 162.0, 281.0, 498.0, 843.0, 1574.0, 2971.0, 6171.0, 13978.0, 38797.0, 182271.0, 3564695.0, 301398.0, 49155.0, 16896.0, 7132.0, 3258.0, 1669.0, 887.0, 541.0, 265.0, 170.0, 107.0, 65.0, 42.0, 36.0, 30.0, 18.0, 5.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1822967529296875, -1.140960693359375, -1.0996246337890625, -1.05828857421875, -1.0169525146484375, -0.975616455078125, -0.9342803955078125, -0.8929443359375, -0.8516082763671875, -0.810272216796875, -0.7689361572265625, -0.72760009765625, -0.6862640380859375, -0.644927978515625, -0.6035919189453125, -0.562255859375, -0.5209197998046875, -0.479583740234375, -0.4382476806640625, -0.39691162109375, -0.3555755615234375, -0.314239501953125, -0.2729034423828125, -0.2315673828125, -0.1902313232421875, -0.148895263671875, -0.1075592041015625, -0.06622314453125, -0.0248870849609375, 0.016448974609375, 0.0577850341796875, 0.09912109375, 0.1404571533203125, 0.181793212890625, 0.2231292724609375, 0.26446533203125, 0.3058013916015625, 0.347137451171875, 0.3884735107421875, 0.4298095703125, 0.4711456298828125, 0.512481689453125, 0.5538177490234375, 0.59515380859375, 0.6364898681640625, 0.677825927734375, 0.7191619873046875, 0.760498046875, 0.8018341064453125, 0.843170166015625, 0.8845062255859375, 0.92584228515625, 0.9671783447265625, 1.008514404296875, 1.0498504638671875, 1.0911865234375, 1.1325225830078125, 1.173858642578125, 1.2151947021484375, 1.25653076171875, 1.2978668212890625, 1.339202880859375, 1.3805389404296875, 1.421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 7.0, 3.0, 12.0, 12.0, 11.0, 10.0, 25.0, 50.0, 50.0, 75.0, 141.0, 341.0, 1360.0, 1309.0, 280.0, 138.0, 81.0, 42.0, 25.0, 24.0, 19.0, 13.0, 6.0, 6.0, 7.0, 1.0, 7.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.79443359375, -0.7755126953125, -0.756591796875, -0.7376708984375, -0.71875, -0.6998291015625, -0.680908203125, -0.6619873046875, -0.64306640625, -0.6241455078125, -0.605224609375, -0.5863037109375, -0.5673828125, -0.5484619140625, -0.529541015625, -0.5106201171875, -0.49169921875, -0.4727783203125, -0.453857421875, -0.4349365234375, -0.416015625, -0.3970947265625, -0.378173828125, -0.3592529296875, -0.34033203125, -0.3214111328125, -0.302490234375, -0.2835693359375, -0.2646484375, -0.2457275390625, -0.226806640625, -0.2078857421875, -0.18896484375, -0.1700439453125, -0.151123046875, -0.1322021484375, -0.11328125, -0.0943603515625, -0.075439453125, -0.0565185546875, -0.03759765625, -0.0186767578125, 0.000244140625, 0.0191650390625, 0.0380859375, 0.0570068359375, 0.075927734375, 0.0948486328125, 0.11376953125, 0.1326904296875, 0.151611328125, 0.1705322265625, 0.189453125, 0.2083740234375, 0.227294921875, 0.2462158203125, 0.26513671875, 0.2840576171875, 0.302978515625, 0.3218994140625, 0.3408203125, 0.3597412109375, 0.378662109375, 0.3975830078125, 0.41650390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 17.0, 15.0, 32.0, 54.0, 92.0, 129.0, 190.0, 195.0, 129.0, 71.0, 23.0, 18.0, 10.0, 5.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.834409713745117, -6.671724319458008, -6.509038925170898, -6.346353530883789, -6.18366813659668, -6.02098274230957, -5.858297348022461, -5.695611953735352, -5.532926559448242, -5.370241165161133, -5.207555770874023, -5.044870376586914, -4.882184982299805, -4.719499588012695, -4.556814193725586, -4.394128799438477, -4.231443405151367, -4.068758010864258, -3.9060726165771484, -3.743387222290039, -3.5807018280029297, -3.4180164337158203, -3.255331039428711, -3.0926456451416016, -2.9299607276916504, -2.767275333404541, -2.6045899391174316, -2.4419045448303223, -2.279219150543213, -2.1165337562561035, -1.9538484811782837, -1.7911630868911743, -1.6284778118133545, -1.4657924175262451, -1.3031070232391357, -1.1404216289520264, -0.9777362942695618, -0.8150508999824524, -0.6523655652999878, -0.4896801710128784, -0.32699477672576904, -0.16430939733982086, -0.0016240179538726807, 0.1610613465309143, 0.3237467408180237, 0.48643213510513306, 0.6491174697875977, 0.811802864074707, 0.9744882583618164, 1.1371736526489258, 1.2998590469360352, 1.4625444412231445, 1.625229835510254, 1.7879152297973633, 1.950600504875183, 2.113286018371582, 2.2759714126586914, 2.438656806945801, 2.60134220123291, 2.7640275955200195, 2.926712989807129, 3.0893983840942383, 3.2520837783813477, 3.414769172668457, 3.5774543285369873]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 9.0, 11.0, 18.0, 10.0, 19.0, 21.0, 21.0, 20.0, 25.0, 29.0, 35.0, 37.0, 42.0, 41.0, 34.0, 37.0, 35.0, 40.0, 55.0, 34.0, 48.0, 43.0, 38.0, 35.0, 29.0, 32.0, 29.0, 17.0, 21.0, 25.0, 14.0, 12.0, 17.0, 10.0, 6.0, 8.0, 10.0, 6.0, 2.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6138734817504883, -1.5613279342651367, -1.5087823867797852, -1.4562368392944336, -1.403691291809082, -1.3511457443237305, -1.2986003160476685, -1.246054768562317, -1.1935092210769653, -1.1409636735916138, -1.0884181261062622, -1.0358725786209106, -0.9833270907402039, -0.9307815432548523, -0.8782360553741455, -0.825690507888794, -0.7731449604034424, -0.7205994129180908, -0.6680538654327393, -0.6155083775520325, -0.5629628300666809, -0.5104172825813293, -0.45787176489830017, -0.405326247215271, -0.35278069972991943, -0.30023515224456787, -0.2476896345615387, -0.19514410197734833, -0.14259856939315796, -0.0900530219078064, -0.03750750422477722, 0.015038013458251953, 0.06758356094360352, 0.12012909352779388, 0.17267462611198425, 0.22522015869617462, 0.277765691280365, 0.33031123876571655, 0.3828567564487457, 0.4354022741317749, 0.48794782161712646, 0.540493369102478, 0.5930389165878296, 0.6455844044685364, 0.6981299519538879, 0.7506754994392395, 0.8032209873199463, 0.8557665348052979, 0.9083120822906494, 0.960857629776001, 1.0134031772613525, 1.065948724746704, 1.1184942722320557, 1.1710398197174072, 1.2235852479934692, 1.2761307954788208, 1.3286763429641724, 1.381221890449524, 1.4337674379348755, 1.486312985420227, 1.538858413696289, 1.5914039611816406, 1.6439495086669922, 1.6964950561523438, 1.7490406036376953]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 14.0, 13.0, 14.0, 18.0, 24.0, 36.0, 60.0, 70.0, 114.0, 178.0, 303.0, 501.0, 1133.0, 2586.0, 6623.0, 22238.0, 106828.0, 651131.0, 206376.0, 34316.0, 9505.0, 3330.0, 1439.0, 659.0, 412.0, 200.0, 146.0, 74.0, 61.0, 39.0, 27.0, 27.0, 9.0, 8.0, 7.0, 5.0, 1.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3720703125, -1.3224639892578125, -1.272857666015625, -1.2232513427734375, -1.17364501953125, -1.1240386962890625, -1.074432373046875, -1.0248260498046875, -0.9752197265625, -0.9256134033203125, -0.876007080078125, -0.8264007568359375, -0.77679443359375, -0.7271881103515625, -0.677581787109375, -0.6279754638671875, -0.578369140625, -0.5287628173828125, -0.479156494140625, -0.4295501708984375, -0.37994384765625, -0.3303375244140625, -0.280731201171875, -0.2311248779296875, -0.1815185546875, -0.1319122314453125, -0.082305908203125, -0.0326995849609375, 0.01690673828125, 0.0665130615234375, 0.116119384765625, 0.1657257080078125, 0.21533203125, 0.2649383544921875, 0.314544677734375, 0.3641510009765625, 0.41375732421875, 0.4633636474609375, 0.512969970703125, 0.5625762939453125, 0.6121826171875, 0.6617889404296875, 0.711395263671875, 0.7610015869140625, 0.81060791015625, 0.8602142333984375, 0.909820556640625, 0.9594268798828125, 1.009033203125, 1.0586395263671875, 1.108245849609375, 1.1578521728515625, 1.20745849609375, 1.2570648193359375, 1.306671142578125, 1.3562774658203125, 1.4058837890625, 1.4554901123046875, 1.505096435546875, 1.5547027587890625, 1.60430908203125, 1.6539154052734375, 1.703521728515625, 1.7531280517578125, 1.802734375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 13.0, 22.0, 42.0, 36.0, 55.0, 68.0, 80.0, 102.0, 112.0, 102.0, 86.0, 73.0, 60.0, 52.0, 28.0, 16.0, 12.0, 13.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.53173828125, -0.5192337036132812, -0.5067291259765625, -0.49422454833984375, -0.481719970703125, -0.46921539306640625, -0.4567108154296875, -0.44420623779296875, -0.43170166015625, -0.41919708251953125, -0.4066925048828125, -0.39418792724609375, -0.381683349609375, -0.36917877197265625, -0.3566741943359375, -0.34416961669921875, -0.3316650390625, -0.31916046142578125, -0.3066558837890625, -0.29415130615234375, -0.281646728515625, -0.26914215087890625, -0.2566375732421875, -0.24413299560546875, -0.23162841796875, -0.21912384033203125, -0.2066192626953125, -0.19411468505859375, -0.181610107421875, -0.16910552978515625, -0.1566009521484375, -0.14409637451171875, -0.131591796875, -0.11908721923828125, -0.1065826416015625, -0.09407806396484375, -0.081573486328125, -0.06906890869140625, -0.0565643310546875, -0.04405975341796875, -0.03155517578125, -0.01905059814453125, -0.0065460205078125, 0.00595855712890625, 0.018463134765625, 0.03096771240234375, 0.0434722900390625, 0.05597686767578125, 0.0684814453125, 0.08098602294921875, 0.0934906005859375, 0.10599517822265625, 0.118499755859375, 0.13100433349609375, 0.1435089111328125, 0.15601348876953125, 0.16851806640625, 0.18102264404296875, 0.1935272216796875, 0.20603179931640625, 0.218536376953125, 0.23104095458984375, 0.2435455322265625, 0.25605010986328125, 0.2685546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 19.0, 19.0, 26.0, 29.0, 46.0, 85.0, 109.0, 136.0, 275.0, 368.0, 644.0, 997.0, 1795.0, 3251.0, 6266.0, 12715.0, 28106.0, 69883.0, 211245.0, 442868.0, 165246.0, 57067.0, 23793.0, 11017.0, 5579.0, 2887.0, 1569.0, 880.0, 546.0, 382.0, 230.0, 157.0, 91.0, 55.0, 44.0, 30.0, 18.0, 12.0, 14.0, 12.0, 10.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.66845703125, -0.6464691162109375, -0.624481201171875, -0.6024932861328125, -0.58050537109375, -0.5585174560546875, -0.536529541015625, -0.5145416259765625, -0.4925537109375, -0.4705657958984375, -0.448577880859375, -0.4265899658203125, -0.40460205078125, -0.3826141357421875, -0.360626220703125, -0.3386383056640625, -0.316650390625, -0.2946624755859375, -0.272674560546875, -0.2506866455078125, -0.22869873046875, -0.2067108154296875, -0.184722900390625, -0.1627349853515625, -0.1407470703125, -0.1187591552734375, -0.096771240234375, -0.0747833251953125, -0.05279541015625, -0.0308074951171875, -0.008819580078125, 0.0131683349609375, 0.03515625, 0.0571441650390625, 0.079132080078125, 0.1011199951171875, 0.12310791015625, 0.1450958251953125, 0.167083740234375, 0.1890716552734375, 0.2110595703125, 0.2330474853515625, 0.255035400390625, 0.2770233154296875, 0.29901123046875, 0.3209991455078125, 0.342987060546875, 0.3649749755859375, 0.386962890625, 0.4089508056640625, 0.430938720703125, 0.4529266357421875, 0.47491455078125, 0.4969024658203125, 0.518890380859375, 0.5408782958984375, 0.5628662109375, 0.5848541259765625, 0.606842041015625, 0.6288299560546875, 0.65081787109375, 0.6728057861328125, 0.694793701171875, 0.7167816162109375, 0.73876953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 11.0, 10.0, 11.0, 15.0, 10.0, 15.0, 14.0, 17.0, 22.0, 30.0, 43.0, 32.0, 41.0, 34.0, 53.0, 40.0, 52.0, 50.0, 52.0, 58.0, 50.0, 27.0, 43.0, 46.0, 30.0, 24.0, 28.0, 23.0, 21.0, 15.0, 17.0, 12.0, 13.0, 11.0, 11.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.896484375, -0.8692474365234375, -0.842010498046875, -0.8147735595703125, -0.78753662109375, -0.7602996826171875, -0.733062744140625, -0.7058258056640625, -0.6785888671875, -0.6513519287109375, -0.624114990234375, -0.5968780517578125, -0.56964111328125, -0.5424041748046875, -0.515167236328125, -0.4879302978515625, -0.460693359375, -0.4334564208984375, -0.406219482421875, -0.3789825439453125, -0.35174560546875, -0.3245086669921875, -0.297271728515625, -0.2700347900390625, -0.2427978515625, -0.2155609130859375, -0.188323974609375, -0.1610870361328125, -0.13385009765625, -0.1066131591796875, -0.079376220703125, -0.0521392822265625, -0.02490234375, 0.0023345947265625, 0.029571533203125, 0.0568084716796875, 0.08404541015625, 0.1112823486328125, 0.138519287109375, 0.1657562255859375, 0.1929931640625, 0.2202301025390625, 0.247467041015625, 0.2747039794921875, 0.30194091796875, 0.3291778564453125, 0.356414794921875, 0.3836517333984375, 0.410888671875, 0.4381256103515625, 0.465362548828125, 0.4925994873046875, 0.51983642578125, 0.5470733642578125, 0.574310302734375, 0.6015472412109375, 0.6287841796875, 0.6560211181640625, 0.683258056640625, 0.7104949951171875, 0.73773193359375, 0.7649688720703125, 0.792205810546875, 0.8194427490234375, 0.8466796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 10.0, 4.0, 3.0, 12.0, 14.0, 13.0, 13.0, 35.0, 35.0, 51.0, 102.0, 159.0, 276.0, 477.0, 1011.0, 2523.0, 8073.0, 36434.0, 373012.0, 562584.0, 48168.0, 10150.0, 2967.0, 1113.0, 511.0, 303.0, 133.0, 92.0, 74.0, 56.0, 35.0, 27.0, 18.0, 15.0, 11.0, 7.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0], "bins": [-0.669921875, -0.6523284912109375, -0.634735107421875, -0.6171417236328125, -0.59954833984375, -0.5819549560546875, -0.564361572265625, -0.5467681884765625, -0.5291748046875, -0.5115814208984375, -0.493988037109375, -0.4763946533203125, -0.45880126953125, -0.4412078857421875, -0.423614501953125, -0.4060211181640625, -0.388427734375, -0.3708343505859375, -0.353240966796875, -0.3356475830078125, -0.31805419921875, -0.3004608154296875, -0.282867431640625, -0.2652740478515625, -0.2476806640625, -0.2300872802734375, -0.212493896484375, -0.1949005126953125, -0.17730712890625, -0.1597137451171875, -0.142120361328125, -0.1245269775390625, -0.10693359375, -0.0893402099609375, -0.071746826171875, -0.0541534423828125, -0.03656005859375, -0.0189666748046875, -0.001373291015625, 0.0162200927734375, 0.0338134765625, 0.0514068603515625, 0.069000244140625, 0.0865936279296875, 0.10418701171875, 0.1217803955078125, 0.139373779296875, 0.1569671630859375, 0.174560546875, 0.1921539306640625, 0.209747314453125, 0.2273406982421875, 0.24493408203125, 0.2625274658203125, 0.280120849609375, 0.2977142333984375, 0.3153076171875, 0.3329010009765625, 0.350494384765625, 0.3680877685546875, 0.38568115234375, 0.4032745361328125, 0.420867919921875, 0.4384613037109375, 0.4560546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 6.0, 4.0, 9.0, 7.0, 12.0, 10.0, 11.0, 22.0, 37.0, 49.0, 48.0, 56.0, 71.0, 130.0, 115.0, 103.0, 81.0, 51.0, 49.0, 32.0, 15.0, 15.0, 14.0, 9.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.867813110351562e-05, -7.638614624738693e-05, -7.409416139125824e-05, -7.180217653512955e-05, -6.951019167900085e-05, -6.721820682287216e-05, -6.492622196674347e-05, -6.263423711061478e-05, -6.0342252254486084e-05, -5.805026739835739e-05, -5.57582825422287e-05, -5.3466297686100006e-05, -5.1174312829971313e-05, -4.888232797384262e-05, -4.659034311771393e-05, -4.4298358261585236e-05, -4.200637340545654e-05, -3.971438854932785e-05, -3.742240369319916e-05, -3.5130418837070465e-05, -3.283843398094177e-05, -3.054644912481308e-05, -2.8254464268684387e-05, -2.5962479412555695e-05, -2.3670494556427002e-05, -2.137850970029831e-05, -1.9086524844169617e-05, -1.6794539988040924e-05, -1.4502555131912231e-05, -1.2210570275783539e-05, -9.918585419654846e-06, -7.6266005635261536e-06, -5.334615707397461e-06, -3.0426308512687683e-06, -7.506459951400757e-07, 1.541338860988617e-06, 3.8333237171173096e-06, 6.125308573246002e-06, 8.417293429374695e-06, 1.0709278285503387e-05, 1.300126314163208e-05, 1.5293247997760773e-05, 1.7585232853889465e-05, 1.9877217710018158e-05, 2.216920256614685e-05, 2.4461187422275543e-05, 2.6753172278404236e-05, 2.904515713453293e-05, 3.133714199066162e-05, 3.3629126846790314e-05, 3.5921111702919006e-05, 3.82130965590477e-05, 4.050508141517639e-05, 4.2797066271305084e-05, 4.508905112743378e-05, 4.738103598356247e-05, 4.967302083969116e-05, 5.1965005695819855e-05, 5.425699055194855e-05, 5.654897540807724e-05, 5.884096026420593e-05, 6.113294512033463e-05, 6.342492997646332e-05, 6.571691483259201e-05, 6.80088996887207e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 4.0, 8.0, 5.0, 8.0, 20.0, 15.0, 40.0, 44.0, 67.0, 106.0, 162.0, 253.0, 488.0, 1086.0, 2538.0, 8058.0, 40304.0, 741258.0, 223736.0, 21644.0, 5184.0, 1764.0, 803.0, 374.0, 183.0, 116.0, 79.0, 64.0, 41.0, 26.0, 24.0, 8.0, 10.0, 9.0, 4.0, 8.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8203125, -0.7918548583984375, -0.763397216796875, -0.7349395751953125, -0.70648193359375, -0.6780242919921875, -0.649566650390625, -0.6211090087890625, -0.5926513671875, -0.5641937255859375, -0.535736083984375, -0.5072784423828125, -0.47882080078125, -0.4503631591796875, -0.421905517578125, -0.3934478759765625, -0.364990234375, -0.3365325927734375, -0.308074951171875, -0.2796173095703125, -0.25115966796875, -0.2227020263671875, -0.194244384765625, -0.1657867431640625, -0.1373291015625, -0.1088714599609375, -0.080413818359375, -0.0519561767578125, -0.02349853515625, 0.0049591064453125, 0.033416748046875, 0.0618743896484375, 0.09033203125, 0.1187896728515625, 0.147247314453125, 0.1757049560546875, 0.20416259765625, 0.2326202392578125, 0.261077880859375, 0.2895355224609375, 0.3179931640625, 0.3464508056640625, 0.374908447265625, 0.4033660888671875, 0.43182373046875, 0.4602813720703125, 0.488739013671875, 0.5171966552734375, 0.545654296875, 0.5741119384765625, 0.602569580078125, 0.6310272216796875, 0.65948486328125, 0.6879425048828125, 0.716400146484375, 0.7448577880859375, 0.7733154296875, 0.8017730712890625, 0.830230712890625, 0.8586883544921875, 0.88714599609375, 0.9156036376953125, 0.944061279296875, 0.9725189208984375, 1.0009765625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 3.0, 5.0, 5.0, 3.0, 8.0, 6.0, 8.0, 10.0, 21.0, 21.0, 41.0, 67.0, 95.0, 178.0, 192.0, 123.0, 54.0, 53.0, 29.0, 21.0, 11.0, 7.0, 7.0, 8.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5537109375, -0.5383453369140625, -0.522979736328125, -0.5076141357421875, -0.49224853515625, -0.4768829345703125, -0.461517333984375, -0.4461517333984375, -0.4307861328125, -0.4154205322265625, -0.400054931640625, -0.3846893310546875, -0.36932373046875, -0.3539581298828125, -0.338592529296875, -0.3232269287109375, -0.307861328125, -0.2924957275390625, -0.277130126953125, -0.2617645263671875, -0.24639892578125, -0.2310333251953125, -0.215667724609375, -0.2003021240234375, -0.1849365234375, -0.1695709228515625, -0.154205322265625, -0.1388397216796875, -0.12347412109375, -0.1081085205078125, -0.092742919921875, -0.0773773193359375, -0.06201171875, -0.0466461181640625, -0.031280517578125, -0.0159149169921875, -0.00054931640625, 0.0148162841796875, 0.030181884765625, 0.0455474853515625, 0.0609130859375, 0.0762786865234375, 0.091644287109375, 0.1070098876953125, 0.12237548828125, 0.1377410888671875, 0.153106689453125, 0.1684722900390625, 0.183837890625, 0.1992034912109375, 0.214569091796875, 0.2299346923828125, 0.24530029296875, 0.2606658935546875, 0.276031494140625, 0.2913970947265625, 0.3067626953125, 0.3221282958984375, 0.337493896484375, 0.3528594970703125, 0.36822509765625, 0.3835906982421875, 0.398956298828125, 0.4143218994140625, 0.4296875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 8.0, 9.0, 17.0, 23.0, 53.0, 97.0, 127.0, 172.0, 189.0, 110.0, 84.0, 37.0, 25.0, 14.0, 8.0, 17.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.693691730499268, -6.434723854064941, -6.175756454467773, -5.9167890548706055, -5.657821178436279, -5.398853302001953, -5.139885902404785, -4.880918502807617, -4.621950626373291, -4.362982749938965, -4.104015350341797, -3.84504771232605, -3.5860800743103027, -3.3271124362945557, -3.0681447982788086, -2.8091771602630615, -2.5502095222473145, -2.2912418842315674, -2.0322742462158203, -1.7733066082000732, -1.5143389701843262, -1.255371332168579, -0.996403694152832, -0.737436056137085, -0.4784684181213379, -0.21950078010559082, 0.03946685791015625, 0.2984344959259033, 0.5574021339416504, 0.8163697719573975, 1.0753374099731445, 1.3343050479888916, 1.5932722091674805, 1.8522398471832275, 2.1112074851989746, 2.3701751232147217, 2.6291427612304688, 2.888110399246216, 3.147078037261963, 3.40604567527771, 3.665013313293457, 3.923980951309204, 4.182948589324951, 4.441916465759277, 4.700883865356445, 4.959851264953613, 5.2188191413879395, 5.477787017822266, 5.736754417419434, 5.995721817016602, 6.254689693450928, 6.513657569885254, 6.772624969482422, 7.03159236907959, 7.290560245513916, 7.549528121948242, 7.80849552154541, 8.067462921142578, 8.326431274414062, 8.58539867401123, 8.844366073608398, 9.103333473205566, 9.362300872802734, 9.621269226074219, 9.880236625671387]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 10.0, 8.0, 9.0, 15.0, 15.0, 19.0, 29.0, 28.0, 34.0, 33.0, 46.0, 46.0, 33.0, 55.0, 64.0, 42.0, 53.0, 47.0, 51.0, 41.0, 54.0, 40.0, 31.0, 30.0, 38.0, 37.0, 26.0, 13.0, 11.0, 9.0, 12.0, 10.0, 8.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.510470390319824, -5.339556694030762, -5.168642520904541, -4.9977288246154785, -4.826814651489258, -4.655900955200195, -4.484987258911133, -4.314073085784912, -4.143158912658691, -3.97224497795105, -3.801331043243408, -3.6304173469543457, -3.459503173828125, -3.2885894775390625, -3.117675542831421, -2.9467616081237793, -2.775847911834717, -2.604933977127075, -2.4340200424194336, -2.263106346130371, -2.0921921730041504, -1.9212783575057983, -1.7503645420074463, -1.5794506072998047, -1.408536672592163, -1.2376227378845215, -1.0667088031768799, -0.8957949876785278, -0.7248810529708862, -0.5539671182632446, -0.3830533027648926, -0.21213936805725098, -0.041225433349609375, 0.12968847155570984, 0.30060237646102905, 0.4715162515640259, 0.6424301862716675, 0.8133441209793091, 0.9842579364776611, 1.1551718711853027, 1.3260858058929443, 1.496999740600586, 1.6679136753082275, 1.8388274908065796, 2.0097413063049316, 2.1806554794311523, 2.351569175720215, 2.5224831104278564, 2.693397045135498, 2.8643109798431396, 3.0352249145507812, 3.2061386108398438, 3.3770527839660645, 3.547966480255127, 3.7188804149627686, 3.88979434967041, 4.060708045959473, 4.231621742248535, 4.402535915374756, 4.573449611663818, 4.744363784790039, 4.915277481079102, 5.086191177368164, 5.257105350494385, 5.4280195236206055]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 6.0, 9.0, 20.0, 37.0, 61.0, 101.0, 176.0, 320.0, 952.0, 4085.0, 48647.0, 4115014.0, 20403.0, 2920.0, 837.0, 333.0, 177.0, 75.0, 41.0, 18.0, 13.0, 10.0, 14.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5390625, -5.38677978515625, -5.2344970703125, -5.08221435546875, -4.929931640625, -4.77764892578125, -4.6253662109375, -4.47308349609375, -4.32080078125, -4.16851806640625, -4.0162353515625, -3.86395263671875, -3.711669921875, -3.55938720703125, -3.4071044921875, -3.25482177734375, -3.1025390625, -2.95025634765625, -2.7979736328125, -2.64569091796875, -2.493408203125, -2.34112548828125, -2.1888427734375, -2.03656005859375, -1.88427734375, -1.73199462890625, -1.5797119140625, -1.42742919921875, -1.275146484375, -1.12286376953125, -0.9705810546875, -0.81829833984375, -0.666015625, -0.51373291015625, -0.3614501953125, -0.20916748046875, -0.056884765625, 0.09539794921875, 0.2476806640625, 0.39996337890625, 0.55224609375, 0.70452880859375, 0.8568115234375, 1.00909423828125, 1.161376953125, 1.31365966796875, 1.4659423828125, 1.61822509765625, 1.7705078125, 1.92279052734375, 2.0750732421875, 2.22735595703125, 2.379638671875, 2.53192138671875, 2.6842041015625, 2.83648681640625, 2.98876953125, 3.14105224609375, 3.2933349609375, 3.44561767578125, 3.597900390625, 3.75018310546875, 3.9024658203125, 4.05474853515625, 4.20703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 3.0, 18.0, 30.0, 40.0, 53.0, 80.0, 79.0, 93.0, 115.0, 90.0, 92.0, 90.0, 64.0, 52.0, 29.0, 27.0, 17.0, 7.0, 4.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5859375, -0.57159423828125, -0.5572509765625, -0.54290771484375, -0.528564453125, -0.51422119140625, -0.4998779296875, -0.48553466796875, -0.47119140625, -0.45684814453125, -0.4425048828125, -0.42816162109375, -0.413818359375, -0.39947509765625, -0.3851318359375, -0.37078857421875, -0.3564453125, -0.34210205078125, -0.3277587890625, -0.31341552734375, -0.299072265625, -0.28472900390625, -0.2703857421875, -0.25604248046875, -0.24169921875, -0.22735595703125, -0.2130126953125, -0.19866943359375, -0.184326171875, -0.16998291015625, -0.1556396484375, -0.14129638671875, -0.126953125, -0.11260986328125, -0.0982666015625, -0.08392333984375, -0.069580078125, -0.05523681640625, -0.0408935546875, -0.02655029296875, -0.01220703125, 0.00213623046875, 0.0164794921875, 0.03082275390625, 0.045166015625, 0.05950927734375, 0.0738525390625, 0.08819580078125, 0.1025390625, 0.11688232421875, 0.1312255859375, 0.14556884765625, 0.159912109375, 0.17425537109375, 0.1885986328125, 0.20294189453125, 0.21728515625, 0.23162841796875, 0.2459716796875, 0.26031494140625, 0.274658203125, 0.28900146484375, 0.3033447265625, 0.31768798828125, 0.33203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 6.0, 17.0, 18.0, 28.0, 22.0, 32.0, 61.0, 71.0, 118.0, 153.0, 214.0, 290.0, 483.0, 803.0, 1417.0, 2873.0, 6160.0, 15468.0, 53217.0, 988679.0, 3030337.0, 62750.0, 17376.0, 6577.0, 2990.0, 1600.0, 830.0, 552.0, 348.0, 216.0, 134.0, 122.0, 65.0, 77.0, 38.0, 40.0, 18.0, 16.0, 10.0, 13.0, 7.0, 8.0, 6.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.794921875, -1.73712158203125, -1.6793212890625, -1.62152099609375, -1.563720703125, -1.50592041015625, -1.4481201171875, -1.39031982421875, -1.33251953125, -1.27471923828125, -1.2169189453125, -1.15911865234375, -1.101318359375, -1.04351806640625, -0.9857177734375, -0.92791748046875, -0.8701171875, -0.81231689453125, -0.7545166015625, -0.69671630859375, -0.638916015625, -0.58111572265625, -0.5233154296875, -0.46551513671875, -0.40771484375, -0.34991455078125, -0.2921142578125, -0.23431396484375, -0.176513671875, -0.11871337890625, -0.0609130859375, -0.00311279296875, 0.0546875, 0.11248779296875, 0.1702880859375, 0.22808837890625, 0.285888671875, 0.34368896484375, 0.4014892578125, 0.45928955078125, 0.51708984375, 0.57489013671875, 0.6326904296875, 0.69049072265625, 0.748291015625, 0.80609130859375, 0.8638916015625, 0.92169189453125, 0.9794921875, 1.03729248046875, 1.0950927734375, 1.15289306640625, 1.210693359375, 1.26849365234375, 1.3262939453125, 1.38409423828125, 1.44189453125, 1.49969482421875, 1.5574951171875, 1.61529541015625, 1.673095703125, 1.73089599609375, 1.7886962890625, 1.84649658203125, 1.904296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 6.0, 14.0, 12.0, 23.0, 18.0, 47.0, 49.0, 70.0, 214.0, 776.0, 2219.0, 287.0, 118.0, 63.0, 48.0, 16.0, 13.0, 14.0, 15.0, 11.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7021484375, -0.680999755859375, -0.65985107421875, -0.638702392578125, -0.6175537109375, -0.596405029296875, -0.57525634765625, -0.554107666015625, -0.532958984375, -0.511810302734375, -0.49066162109375, -0.469512939453125, -0.4483642578125, -0.427215576171875, -0.40606689453125, -0.384918212890625, -0.36376953125, -0.342620849609375, -0.32147216796875, -0.300323486328125, -0.2791748046875, -0.258026123046875, -0.23687744140625, -0.215728759765625, -0.194580078125, -0.173431396484375, -0.15228271484375, -0.131134033203125, -0.1099853515625, -0.088836669921875, -0.06768798828125, -0.046539306640625, -0.025390625, -0.004241943359375, 0.01690673828125, 0.038055419921875, 0.0592041015625, 0.080352783203125, 0.10150146484375, 0.122650146484375, 0.143798828125, 0.164947509765625, 0.18609619140625, 0.207244873046875, 0.2283935546875, 0.249542236328125, 0.27069091796875, 0.291839599609375, 0.31298828125, 0.334136962890625, 0.35528564453125, 0.376434326171875, 0.3975830078125, 0.418731689453125, 0.43988037109375, 0.461029052734375, 0.482177734375, 0.503326416015625, 0.52447509765625, 0.545623779296875, 0.5667724609375, 0.587921142578125, 0.60906982421875, 0.630218505859375, 0.6513671875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 9.0, 12.0, 25.0, 27.0, 67.0, 98.0, 191.0, 233.0, 158.0, 93.0, 43.0, 15.0, 13.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1549787521362305, -4.990641117095947, -4.826303958892822, -4.661966323852539, -4.497629165649414, -4.333291530609131, -4.168954372406006, -4.004616737365723, -3.8402793407440186, -3.6759419441223145, -3.5116045475006104, -3.3472671508789062, -3.182929515838623, -3.018592357635498, -2.854254722595215, -2.6899173259735107, -2.5255799293518066, -2.3612425327301025, -2.1969051361083984, -2.0325677394866943, -1.8682302236557007, -1.7038928270339966, -1.539555311203003, -1.3752179145812988, -1.2108805179595947, -1.0465431213378906, -0.8822056651115417, -0.7178682088851929, -0.5535308122634888, -0.38919341564178467, -0.2248559594154358, -0.060518503189086914, 0.10381937026977539, 0.2681567966938019, 0.43249422311782837, 0.5968316793441772, 0.7611690759658813, 0.9255064725875854, 1.089843988418579, 1.2541813850402832, 1.4185187816619873, 1.5828561782836914, 1.7471935749053955, 1.9115310907363892, 2.075868606567383, 2.240205764770508, 2.404543399810791, 2.568880796432495, 2.733218193054199, 2.8975555896759033, 3.0618929862976074, 3.2262303829193115, 3.3905677795410156, 3.554905414581299, 3.719242811203003, 3.883580207824707, 4.047917366027832, 4.212255001068115, 4.37659215927124, 4.540929794311523, 4.705266952514648, 4.869604587554932, 5.033941745758057, 5.19827938079834, 5.362617015838623]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 8.0, 9.0, 13.0, 17.0, 12.0, 17.0, 25.0, 25.0, 30.0, 30.0, 52.0, 39.0, 46.0, 49.0, 50.0, 45.0, 44.0, 54.0, 52.0, 33.0, 46.0, 45.0, 34.0, 39.0, 25.0, 34.0, 25.0, 23.0, 16.0, 17.0, 10.0, 2.0, 5.0, 10.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9063098430633545, -1.847139835357666, -1.787969946861267, -1.7287999391555786, -1.6696300506591797, -1.6104600429534912, -1.5512900352478027, -1.4921201467514038, -1.4329502582550049, -1.3737802505493164, -1.3146103620529175, -1.255440354347229, -1.19627046585083, -1.1371004581451416, -1.0779304504394531, -1.0187605619430542, -0.9595905542373657, -0.900420606136322, -0.8412506580352783, -0.7820806503295898, -0.7229107618331909, -0.6637407541275024, -0.6045708060264587, -0.545400857925415, -0.48623090982437134, -0.42706096172332764, -0.36789101362228394, -0.30872103571891785, -0.24955108761787415, -0.19038113951683044, -0.13121116161346436, -0.07204121351242065, -0.012871146202087402, 0.046298809349536896, 0.1054687649011612, 0.1646387279033661, 0.2238086760044098, 0.2829786241054535, 0.3421486020088196, 0.4013185501098633, 0.460488498210907, 0.5196584463119507, 0.5788283944129944, 0.6379983425140381, 0.6971683502197266, 0.7563382387161255, 0.815508246421814, 0.8746781945228577, 0.9338481426239014, 0.9930180907249451, 1.0521880388259888, 1.1113580465316772, 1.1705279350280762, 1.2296979427337646, 1.2888679504394531, 1.348037838935852, 1.407207727432251, 1.4663777351379395, 1.5255476236343384, 1.5847176313400269, 1.6438875198364258, 1.7030575275421143, 1.7622275352478027, 1.8213974237442017, 1.8805674314498901]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 5.0, 4.0, 5.0, 23.0, 20.0, 30.0, 47.0, 62.0, 80.0, 165.0, 262.0, 510.0, 1160.0, 3052.0, 10588.0, 50576.0, 430287.0, 479140.0, 55321.0, 11515.0, 3259.0, 1198.0, 521.0, 261.0, 159.0, 89.0, 50.0, 51.0, 35.0, 17.0, 10.0, 12.0, 6.0, 7.0, 1.0, 7.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6793365478515625, -1.619415283203125, -1.5594940185546875, -1.49957275390625, -1.4396514892578125, -1.379730224609375, -1.3198089599609375, -1.2598876953125, -1.1999664306640625, -1.140045166015625, -1.0801239013671875, -1.02020263671875, -0.9602813720703125, -0.900360107421875, -0.8404388427734375, -0.780517578125, -0.7205963134765625, -0.660675048828125, -0.6007537841796875, -0.54083251953125, -0.4809112548828125, -0.420989990234375, -0.3610687255859375, -0.3011474609375, -0.2412261962890625, -0.181304931640625, -0.1213836669921875, -0.06146240234375, -0.0015411376953125, 0.058380126953125, 0.1183013916015625, 0.17822265625, 0.2381439208984375, 0.298065185546875, 0.3579864501953125, 0.41790771484375, 0.4778289794921875, 0.537750244140625, 0.5976715087890625, 0.6575927734375, 0.7175140380859375, 0.777435302734375, 0.8373565673828125, 0.89727783203125, 0.9571990966796875, 1.017120361328125, 1.0770416259765625, 1.136962890625, 1.1968841552734375, 1.256805419921875, 1.3167266845703125, 1.37664794921875, 1.4365692138671875, 1.496490478515625, 1.5564117431640625, 1.6163330078125, 1.6762542724609375, 1.736175537109375, 1.7960968017578125, 1.85601806640625, 1.9159393310546875, 1.975860595703125, 2.0357818603515625, 2.095703125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 10.0, 26.0, 33.0, 60.0, 83.0, 83.0, 91.0, 113.0, 82.0, 91.0, 97.0, 57.0, 54.0, 43.0, 23.0, 17.0, 5.0, 9.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5694465637207031, -0.5544204711914062, -0.5393943786621094, -0.5243682861328125, -0.5093421936035156, -0.49431610107421875, -0.4792900085449219, -0.464263916015625, -0.4492378234863281, -0.43421173095703125, -0.4191856384277344, -0.4041595458984375, -0.3891334533691406, -0.37410736083984375, -0.3590812683105469, -0.34405517578125, -0.3290290832519531, -0.31400299072265625, -0.2989768981933594, -0.2839508056640625, -0.2689247131347656, -0.25389862060546875, -0.23887252807617188, -0.223846435546875, -0.20882034301757812, -0.19379425048828125, -0.17876815795898438, -0.1637420654296875, -0.14871597290039062, -0.13368988037109375, -0.11866378784179688, -0.1036376953125, -0.08861160278320312, -0.07358551025390625, -0.058559417724609375, -0.0435333251953125, -0.028507232666015625, -0.01348114013671875, 0.001544952392578125, 0.016571044921875, 0.031597137451171875, 0.04662322998046875, 0.061649322509765625, 0.0766754150390625, 0.09170150756835938, 0.10672760009765625, 0.12175369262695312, 0.13677978515625, 0.15180587768554688, 0.16683197021484375, 0.18185806274414062, 0.1968841552734375, 0.21191024780273438, 0.22693634033203125, 0.24196243286132812, 0.256988525390625, 0.2720146179199219, 0.28704071044921875, 0.3020668029785156, 0.3170928955078125, 0.3321189880371094, 0.34714508056640625, 0.3621711730957031, 0.377197265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 14.0, 19.0, 21.0, 36.0, 46.0, 91.0, 126.0, 190.0, 327.0, 523.0, 924.0, 1626.0, 2755.0, 5214.0, 9937.0, 19983.0, 44134.0, 107523.0, 305378.0, 337143.0, 119485.0, 47860.0, 21973.0, 10875.0, 5366.0, 2923.0, 1612.0, 982.0, 527.0, 325.0, 188.0, 156.0, 85.0, 53.0, 38.0, 39.0, 17.0, 9.0, 9.0, 5.0, 4.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63525390625, -0.6133880615234375, -0.591522216796875, -0.5696563720703125, -0.54779052734375, -0.5259246826171875, -0.504058837890625, -0.4821929931640625, -0.4603271484375, -0.4384613037109375, -0.416595458984375, -0.3947296142578125, -0.37286376953125, -0.3509979248046875, -0.329132080078125, -0.3072662353515625, -0.285400390625, -0.2635345458984375, -0.241668701171875, -0.2198028564453125, -0.19793701171875, -0.1760711669921875, -0.154205322265625, -0.1323394775390625, -0.1104736328125, -0.0886077880859375, -0.066741943359375, -0.0448760986328125, -0.02301025390625, -0.0011444091796875, 0.020721435546875, 0.0425872802734375, 0.064453125, 0.0863189697265625, 0.108184814453125, 0.1300506591796875, 0.15191650390625, 0.1737823486328125, 0.195648193359375, 0.2175140380859375, 0.2393798828125, 0.2612457275390625, 0.283111572265625, 0.3049774169921875, 0.32684326171875, 0.3487091064453125, 0.370574951171875, 0.3924407958984375, 0.414306640625, 0.4361724853515625, 0.458038330078125, 0.4799041748046875, 0.50177001953125, 0.5236358642578125, 0.545501708984375, 0.5673675537109375, 0.5892333984375, 0.6110992431640625, 0.632965087890625, 0.6548309326171875, 0.67669677734375, 0.6985626220703125, 0.720428466796875, 0.7422943115234375, 0.76416015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 3.0, 2.0, 4.0, 7.0, 17.0, 13.0, 10.0, 14.0, 23.0, 22.0, 28.0, 25.0, 38.0, 50.0, 34.0, 43.0, 46.0, 37.0, 37.0, 39.0, 47.0, 43.0, 68.0, 36.0, 38.0, 34.0, 42.0, 25.0, 22.0, 23.0, 22.0, 15.0, 21.0, 14.0, 14.0, 11.0, 8.0, 4.0, 5.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1103515625, -1.07989501953125, -1.0494384765625, -1.01898193359375, -0.988525390625, -0.95806884765625, -0.9276123046875, -0.89715576171875, -0.86669921875, -0.83624267578125, -0.8057861328125, -0.77532958984375, -0.744873046875, -0.71441650390625, -0.6839599609375, -0.65350341796875, -0.623046875, -0.59259033203125, -0.5621337890625, -0.53167724609375, -0.501220703125, -0.47076416015625, -0.4403076171875, -0.40985107421875, -0.37939453125, -0.34893798828125, -0.3184814453125, -0.28802490234375, -0.257568359375, -0.22711181640625, -0.1966552734375, -0.16619873046875, -0.1357421875, -0.10528564453125, -0.0748291015625, -0.04437255859375, -0.013916015625, 0.01654052734375, 0.0469970703125, 0.07745361328125, 0.10791015625, 0.13836669921875, 0.1688232421875, 0.19927978515625, 0.229736328125, 0.26019287109375, 0.2906494140625, 0.32110595703125, 0.3515625, 0.38201904296875, 0.4124755859375, 0.44293212890625, 0.473388671875, 0.50384521484375, 0.5343017578125, 0.56475830078125, 0.59521484375, 0.62567138671875, 0.6561279296875, 0.68658447265625, 0.717041015625, 0.74749755859375, 0.7779541015625, 0.80841064453125, 0.8388671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 2.0, 8.0, 10.0, 11.0, 37.0, 45.0, 96.0, 203.0, 428.0, 943.0, 2475.0, 8432.0, 58783.0, 850072.0, 109781.0, 11968.0, 3119.0, 1113.0, 512.0, 237.0, 122.0, 61.0, 35.0, 20.0, 8.0, 4.0, 10.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86181640625, -0.837615966796875, -0.81341552734375, -0.789215087890625, -0.7650146484375, -0.740814208984375, -0.71661376953125, -0.692413330078125, -0.668212890625, -0.644012451171875, -0.61981201171875, -0.595611572265625, -0.5714111328125, -0.547210693359375, -0.52301025390625, -0.498809814453125, -0.474609375, -0.450408935546875, -0.42620849609375, -0.402008056640625, -0.3778076171875, -0.353607177734375, -0.32940673828125, -0.305206298828125, -0.281005859375, -0.256805419921875, -0.23260498046875, -0.208404541015625, -0.1842041015625, -0.160003662109375, -0.13580322265625, -0.111602783203125, -0.08740234375, -0.063201904296875, -0.03900146484375, -0.014801025390625, 0.0093994140625, 0.033599853515625, 0.05780029296875, 0.082000732421875, 0.106201171875, 0.130401611328125, 0.15460205078125, 0.178802490234375, 0.2030029296875, 0.227203369140625, 0.25140380859375, 0.275604248046875, 0.2998046875, 0.324005126953125, 0.34820556640625, 0.372406005859375, 0.3966064453125, 0.420806884765625, 0.44500732421875, 0.469207763671875, 0.493408203125, 0.517608642578125, 0.54180908203125, 0.566009521484375, 0.5902099609375, 0.614410400390625, 0.63861083984375, 0.662811279296875, 0.68701171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 8.0, 12.0, 7.0, 12.0, 24.0, 19.0, 45.0, 41.0, 77.0, 105.0, 138.0, 130.0, 115.0, 67.0, 53.0, 45.0, 18.0, 21.0, 11.0, 4.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.614229202270508e-05, -9.313132613897324e-05, -9.01203602552414e-05, -8.710939437150955e-05, -8.409842848777771e-05, -8.108746260404587e-05, -7.807649672031403e-05, -7.506553083658218e-05, -7.205456495285034e-05, -6.90435990691185e-05, -6.603263318538666e-05, -6.302166730165482e-05, -6.0010701417922974e-05, -5.699973553419113e-05, -5.398876965045929e-05, -5.097780376672745e-05, -4.7966837882995605e-05, -4.4955871999263763e-05, -4.194490611553192e-05, -3.893394023180008e-05, -3.592297434806824e-05, -3.2912008464336395e-05, -2.9901042580604553e-05, -2.689007669687271e-05, -2.387911081314087e-05, -2.0868144929409027e-05, -1.7857179045677185e-05, -1.4846213161945343e-05, -1.1835247278213501e-05, -8.824281394481659e-06, -5.813315510749817e-06, -2.802349627017975e-06, 2.086162567138672e-07, 3.2195821404457092e-06, 6.230548024177551e-06, 9.241513907909393e-06, 1.2252479791641235e-05, 1.5263445675373077e-05, 1.827441155910492e-05, 2.128537744283676e-05, 2.4296343326568604e-05, 2.7307309210300446e-05, 3.0318275094032288e-05, 3.332924097776413e-05, 3.634020686149597e-05, 3.9351172745227814e-05, 4.2362138628959656e-05, 4.53731045126915e-05, 4.838407039642334e-05, 5.139503628015518e-05, 5.4406002163887024e-05, 5.7416968047618866e-05, 6.042793393135071e-05, 6.343889981508255e-05, 6.644986569881439e-05, 6.946083158254623e-05, 7.247179746627808e-05, 7.548276335000992e-05, 7.849372923374176e-05, 8.15046951174736e-05, 8.451566100120544e-05, 8.752662688493729e-05, 9.053759276866913e-05, 9.354855865240097e-05, 9.655952453613281e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 4.0, 9.0, 10.0, 23.0, 25.0, 46.0, 66.0, 83.0, 152.0, 262.0, 488.0, 943.0, 2408.0, 7985.0, 43881.0, 889968.0, 85280.0, 11299.0, 3111.0, 1175.0, 563.0, 249.0, 181.0, 123.0, 65.0, 50.0, 25.0, 29.0, 12.0, 12.0, 11.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.193359375, -1.1598587036132812, -1.1263580322265625, -1.0928573608398438, -1.059356689453125, -1.0258560180664062, -0.9923553466796875, -0.9588546752929688, -0.92535400390625, -0.8918533325195312, -0.8583526611328125, -0.8248519897460938, -0.791351318359375, -0.7578506469726562, -0.7243499755859375, -0.6908493041992188, -0.6573486328125, -0.6238479614257812, -0.5903472900390625, -0.5568466186523438, -0.523345947265625, -0.48984527587890625, -0.4563446044921875, -0.42284393310546875, -0.38934326171875, -0.35584259033203125, -0.3223419189453125, -0.28884124755859375, -0.255340576171875, -0.22183990478515625, -0.1883392333984375, -0.15483856201171875, -0.121337890625, -0.08783721923828125, -0.0543365478515625, -0.02083587646484375, 0.012664794921875, 0.04616546630859375, 0.0796661376953125, 0.11316680908203125, 0.14666748046875, 0.18016815185546875, 0.2136688232421875, 0.24716949462890625, 0.280670166015625, 0.31417083740234375, 0.3476715087890625, 0.38117218017578125, 0.4146728515625, 0.44817352294921875, 0.4816741943359375, 0.5151748657226562, 0.548675537109375, 0.5821762084960938, 0.6156768798828125, 0.6491775512695312, 0.68267822265625, 0.7161788940429688, 0.7496795654296875, 0.7831802368164062, 0.816680908203125, 0.8501815795898438, 0.8836822509765625, 0.9171829223632812, 0.95068359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 6.0, 17.0, 22.0, 31.0, 97.0, 257.0, 302.0, 115.0, 55.0, 15.0, 23.0, 16.0, 13.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62353515625, -0.5976333618164062, -0.5717315673828125, -0.5458297729492188, -0.519927978515625, -0.49402618408203125, -0.4681243896484375, -0.44222259521484375, -0.41632080078125, -0.39041900634765625, -0.3645172119140625, -0.33861541748046875, -0.312713623046875, -0.28681182861328125, -0.2609100341796875, -0.23500823974609375, -0.2091064453125, -0.18320465087890625, -0.1573028564453125, -0.13140106201171875, -0.105499267578125, -0.07959747314453125, -0.0536956787109375, -0.02779388427734375, -0.00189208984375, 0.02400970458984375, 0.0499114990234375, 0.07581329345703125, 0.101715087890625, 0.12761688232421875, 0.1535186767578125, 0.17942047119140625, 0.205322265625, 0.23122406005859375, 0.2571258544921875, 0.28302764892578125, 0.308929443359375, 0.33483123779296875, 0.3607330322265625, 0.38663482666015625, 0.41253662109375, 0.43843841552734375, 0.4643402099609375, 0.49024200439453125, 0.516143798828125, 0.5420455932617188, 0.5679473876953125, 0.5938491821289062, 0.6197509765625, 0.6456527709960938, 0.6715545654296875, 0.6974563598632812, 0.723358154296875, 0.7492599487304688, 0.7751617431640625, 0.8010635375976562, 0.82696533203125, 0.8528671264648438, 0.8787689208984375, 0.9046707153320312, 0.930572509765625, 0.9564743041992188, 0.9823760986328125, 1.0082778930664062, 1.0341796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 2.0, 0.0, 2.0, 23.0, 29.0, 78.0, 131.0, 253.0, 240.0, 141.0, 64.0, 23.0, 13.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.285696983337402, -6.86043643951416, -6.435175895690918, -6.009915351867676, -5.584654808044434, -5.159394264221191, -4.734133720397949, -4.308873176574707, -3.883612632751465, -3.4583520889282227, -3.0330915451049805, -2.6078310012817383, -2.182570457458496, -1.757309913635254, -1.3320493698120117, -0.9067888259887695, -0.48152828216552734, -0.056267738342285156, 0.36899280548095703, 0.7942533493041992, 1.2195138931274414, 1.6447744369506836, 2.070034980773926, 2.495295524597168, 2.92055606842041, 3.3458166122436523, 3.7710771560668945, 4.196337699890137, 4.621598243713379, 5.046858787536621, 5.472119331359863, 5.8973798751831055, 6.322641372680664, 6.747901916503906, 7.173162460327148, 7.598423004150391, 8.023683547973633, 8.448944091796875, 8.874204635620117, 9.29946517944336, 9.724725723266602, 10.149986267089844, 10.575246810913086, 11.000507354736328, 11.42576789855957, 11.851028442382812, 12.276288986206055, 12.701549530029297, 13.126810073852539, 13.552070617675781, 13.977331161499023, 14.402591705322266, 14.827852249145508, 15.25311279296875, 15.678373336791992, 16.103633880615234, 16.528894424438477, 16.95415496826172, 17.37941551208496, 17.804676055908203, 18.229936599731445, 18.655197143554688, 19.08045768737793, 19.505718231201172, 19.930978775024414]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 8.0, 4.0, 11.0, 6.0, 2.0, 5.0, 9.0, 16.0, 11.0, 16.0, 22.0, 23.0, 27.0, 27.0, 24.0, 25.0, 27.0, 26.0, 37.0, 40.0, 35.0, 39.0, 48.0, 41.0, 24.0, 43.0, 35.0, 37.0, 35.0, 36.0, 33.0, 33.0, 29.0, 28.0, 20.0, 11.0, 15.0, 18.0, 21.0, 13.0, 12.0, 3.0, 9.0, 8.0, 6.0, 2.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.478695869445801, -4.344449520111084, -4.210202693939209, -4.075956344604492, -3.9417099952697754, -3.8074634075164795, -3.6732168197631836, -3.538970470428467, -3.404723882675171, -3.270477294921875, -3.136230945587158, -3.0019843578338623, -2.8677377700805664, -2.7334914207458496, -2.5992448329925537, -2.464998245239258, -2.330751895904541, -2.196505308151245, -2.0622589588165283, -1.9280123710632324, -1.793765902519226, -1.6595194339752197, -1.5252728462219238, -1.3910263776779175, -1.2567799091339111, -1.1225334405899048, -0.9882869124412537, -0.8540403842926025, -0.7197939157485962, -0.5855474472045898, -0.4513009190559387, -0.3170543909072876, -0.18280792236328125, -0.048561424016952515, 0.08568507432937622, 0.21993157267570496, 0.3541780710220337, 0.48842453956604004, 0.6226710677146912, 0.7569175958633423, 0.8911640644073486, 1.025410532951355, 1.1596570014953613, 1.2939035892486572, 1.4281500577926636, 1.56239652633667, 1.6966431140899658, 1.8308895826339722, 1.9651360511779785, 2.0993826389312744, 2.233628988265991, 2.367875576019287, 2.502121925354004, 2.6363685131073, 2.7706151008605957, 2.9048614501953125, 3.0391080379486084, 3.1733546257019043, 3.307600975036621, 3.441847562789917, 3.576094150543213, 3.7103404998779297, 3.8445870876312256, 3.9788336753845215, 4.113080024719238]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 7.0, 18.0, 24.0, 39.0, 59.0, 84.0, 136.0, 163.0, 321.0, 533.0, 956.0, 2252.0, 8089.0, 68394.0, 4073571.0, 30102.0, 5648.0, 1858.0, 844.0, 456.0, 242.0, 173.0, 105.0, 55.0, 38.0, 28.0, 13.0, 16.0, 8.0, 12.0, 8.0, 4.0, 2.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.8099365234375, -3.670654296875, -3.5313720703125, -3.39208984375, -3.2528076171875, -3.113525390625, -2.9742431640625, -2.8349609375, -2.6956787109375, -2.556396484375, -2.4171142578125, -2.27783203125, -2.1385498046875, -1.999267578125, -1.8599853515625, -1.720703125, -1.5814208984375, -1.442138671875, -1.3028564453125, -1.16357421875, -1.0242919921875, -0.885009765625, -0.7457275390625, -0.6064453125, -0.4671630859375, -0.327880859375, -0.1885986328125, -0.04931640625, 0.0899658203125, 0.229248046875, 0.3685302734375, 0.5078125, 0.6470947265625, 0.786376953125, 0.9256591796875, 1.06494140625, 1.2042236328125, 1.343505859375, 1.4827880859375, 1.6220703125, 1.7613525390625, 1.900634765625, 2.0399169921875, 2.17919921875, 2.3184814453125, 2.457763671875, 2.5970458984375, 2.736328125, 2.8756103515625, 3.014892578125, 3.1541748046875, 3.29345703125, 3.4327392578125, 3.572021484375, 3.7113037109375, 3.8505859375, 3.9898681640625, 4.129150390625, 4.2684326171875, 4.40771484375, 4.5469970703125, 4.686279296875, 4.8255615234375, 4.96484375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 12.0, 5.0, 16.0, 15.0, 29.0, 37.0, 33.0, 39.0, 56.0, 67.0, 60.0, 61.0, 71.0, 66.0, 66.0, 64.0, 54.0, 54.0, 46.0, 40.0, 32.0, 18.0, 10.0, 13.0, 8.0, 2.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.2931251525878906, -0.28253936767578125, -0.2719535827636719, -0.2613677978515625, -0.2507820129394531, -0.24019622802734375, -0.22961044311523438, -0.219024658203125, -0.20843887329101562, -0.19785308837890625, -0.18726730346679688, -0.1766815185546875, -0.16609573364257812, -0.15550994873046875, -0.14492416381835938, -0.13433837890625, -0.12375259399414062, -0.11316680908203125, -0.10258102416992188, -0.0919952392578125, -0.08140945434570312, -0.07082366943359375, -0.060237884521484375, -0.049652099609375, -0.039066314697265625, -0.02848052978515625, -0.017894744873046875, -0.0073089599609375, 0.003276824951171875, 0.01386260986328125, 0.024448394775390625, 0.0350341796875, 0.045619964599609375, 0.05620574951171875, 0.06679153442382812, 0.0773773193359375, 0.08796310424804688, 0.09854888916015625, 0.10913467407226562, 0.119720458984375, 0.13030624389648438, 0.14089202880859375, 0.15147781372070312, 0.1620635986328125, 0.17264938354492188, 0.18323516845703125, 0.19382095336914062, 0.20440673828125, 0.21499252319335938, 0.22557830810546875, 0.23616409301757812, 0.2467498779296875, 0.2573356628417969, 0.26792144775390625, 0.2785072326660156, 0.289093017578125, 0.2996788024902344, 0.31026458740234375, 0.3208503723144531, 0.3314361572265625, 0.3420219421386719, 0.35260772705078125, 0.3631935119628906, 0.373779296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 10.0, 9.0, 15.0, 16.0, 29.0, 25.0, 49.0, 51.0, 79.0, 126.0, 146.0, 248.0, 378.0, 685.0, 1241.0, 2722.0, 6769.0, 20779.0, 149677.0, 3916333.0, 70078.0, 14545.0, 5256.0, 2287.0, 1093.0, 610.0, 299.0, 219.0, 143.0, 103.0, 65.0, 61.0, 40.0, 26.0, 18.0, 11.0, 14.0, 8.0, 5.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.01171875, -2.926544189453125, -2.84136962890625, -2.756195068359375, -2.6710205078125, -2.585845947265625, -2.50067138671875, -2.415496826171875, -2.330322265625, -2.245147705078125, -2.15997314453125, -2.074798583984375, -1.9896240234375, -1.904449462890625, -1.81927490234375, -1.734100341796875, -1.64892578125, -1.563751220703125, -1.47857666015625, -1.393402099609375, -1.3082275390625, -1.223052978515625, -1.13787841796875, -1.052703857421875, -0.967529296875, -0.882354736328125, -0.79718017578125, -0.712005615234375, -0.6268310546875, -0.541656494140625, -0.45648193359375, -0.371307373046875, -0.2861328125, -0.200958251953125, -0.11578369140625, -0.030609130859375, 0.0545654296875, 0.139739990234375, 0.22491455078125, 0.310089111328125, 0.395263671875, 0.480438232421875, 0.56561279296875, 0.650787353515625, 0.7359619140625, 0.821136474609375, 0.90631103515625, 0.991485595703125, 1.07666015625, 1.161834716796875, 1.24700927734375, 1.332183837890625, 1.4173583984375, 1.502532958984375, 1.58770751953125, 1.672882080078125, 1.758056640625, 1.843231201171875, 1.92840576171875, 2.013580322265625, 2.0987548828125, 2.183929443359375, 2.26910400390625, 2.354278564453125, 2.439453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 5.0, 9.0, 9.0, 23.0, 28.0, 47.0, 130.0, 334.0, 2936.0, 321.0, 101.0, 35.0, 20.0, 16.0, 11.0, 6.0, 4.0, 10.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96142578125, -0.93182373046875, -0.9022216796875, -0.87261962890625, -0.843017578125, -0.81341552734375, -0.7838134765625, -0.75421142578125, -0.724609375, -0.69500732421875, -0.6654052734375, -0.63580322265625, -0.606201171875, -0.57659912109375, -0.5469970703125, -0.51739501953125, -0.48779296875, -0.45819091796875, -0.4285888671875, -0.39898681640625, -0.369384765625, -0.33978271484375, -0.3101806640625, -0.28057861328125, -0.2509765625, -0.22137451171875, -0.1917724609375, -0.16217041015625, -0.132568359375, -0.10296630859375, -0.0733642578125, -0.04376220703125, -0.01416015625, 0.01544189453125, 0.0450439453125, 0.07464599609375, 0.104248046875, 0.13385009765625, 0.1634521484375, 0.19305419921875, 0.22265625, 0.25225830078125, 0.2818603515625, 0.31146240234375, 0.341064453125, 0.37066650390625, 0.4002685546875, 0.42987060546875, 0.45947265625, 0.48907470703125, 0.5186767578125, 0.54827880859375, 0.577880859375, 0.60748291015625, 0.6370849609375, 0.66668701171875, 0.6962890625, 0.72589111328125, 0.7554931640625, 0.78509521484375, 0.814697265625, 0.84429931640625, 0.8739013671875, 0.90350341796875, 0.93310546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 19.0, 109.0, 405.0, 322.0, 87.0, 33.0, 11.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.819730758666992, -16.460721969604492, -16.101713180541992, -15.742704391479492, -15.383695602416992, -15.024686813354492, -14.665678024291992, -14.306669235229492, -13.947660446166992, -13.588651657104492, -13.229642868041992, -12.870634078979492, -12.511625289916992, -12.152616500854492, -11.793607711791992, -11.434598922729492, -11.075591087341309, -10.716582298278809, -10.357573509216309, -9.998564720153809, -9.639555931091309, -9.280547142028809, -8.921539306640625, -8.562530517578125, -8.203521728515625, -7.844512939453125, -7.485504150390625, -7.126495361328125, -6.767486572265625, -6.408477783203125, -6.049469470977783, -5.690460681915283, -5.331451892852783, -4.972443103790283, -4.613434314727783, -4.254426002502441, -3.8954169750213623, -3.5364081859588623, -3.1773996353149414, -2.8183908462524414, -2.4593820571899414, -2.1003732681274414, -1.741364598274231, -1.3823559284210205, -1.0233471393585205, -0.6643383502960205, -0.3053297996520996, 0.05367898941040039, 0.4126877784729004, 0.7716965079307556, 1.1307052373886108, 1.4897139072418213, 1.8487226963043213, 2.2077314853668213, 2.566740036010742, 2.925748825073242, 3.284757614135742, 3.643766403198242, 4.002775192260742, 4.361783981323242, 4.720792770385742, 5.079801559448242, 5.438809871673584, 5.797818660736084, 6.156827449798584]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 9.0, 17.0, 20.0, 18.0, 32.0, 43.0, 50.0, 48.0, 66.0, 62.0, 83.0, 64.0, 69.0, 61.0, 71.0, 60.0, 43.0, 37.0, 44.0, 34.0, 23.0, 16.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265709638595581, -2.1792290210723877, -2.0927481651306152, -2.006267547607422, -1.919786810874939, -1.833306074142456, -1.7468254566192627, -1.6603447198867798, -1.5738639831542969, -1.487383246421814, -1.400902509689331, -1.3144218921661377, -1.2279411554336548, -1.1414604187011719, -1.0549798011779785, -0.9684990644454956, -0.8820183277130127, -0.7955375909805298, -0.7090569138526917, -0.6225762367248535, -0.5360954999923706, -0.4496147930622101, -0.36313408613204956, -0.2766534090042114, -0.19017267227172852, -0.103691965341568, -0.01721125841140747, 0.06926944851875305, 0.15575015544891357, 0.2422308623790741, 0.3287115693092346, 0.41519224643707275, 0.5016727447509766, 0.5881534814834595, 0.6746341586112976, 0.7611148357391357, 0.8475955724716187, 0.9340763092041016, 1.020556926727295, 1.1070376634597778, 1.1935184001922607, 1.2799991369247437, 1.3664798736572266, 1.45296049118042, 1.5394412279129028, 1.6259219646453857, 1.712402582168579, 1.798883318901062, 1.885364055633545, 1.9718447923660278, 2.0583255290985107, 2.144806146621704, 2.2312870025634766, 2.31776762008667, 2.4042482376098633, 2.4907288551330566, 2.577209711074829, 2.6636903285980225, 2.750171184539795, 2.8366518020629883, 2.9231324195861816, 3.009613275527954, 3.0960938930511475, 3.18257474899292, 3.2690553665161133]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 12.0, 12.0, 21.0, 32.0, 50.0, 73.0, 163.0, 310.0, 696.0, 1731.0, 6126.0, 32135.0, 406504.0, 548706.0, 41136.0, 7301.0, 2025.0, 783.0, 327.0, 164.0, 68.0, 48.0, 42.0, 20.0, 10.0, 12.0, 11.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.67578125, -2.589630126953125, -2.50347900390625, -2.417327880859375, -2.3311767578125, -2.245025634765625, -2.15887451171875, -2.072723388671875, -1.986572265625, -1.900421142578125, -1.81427001953125, -1.728118896484375, -1.6419677734375, -1.555816650390625, -1.46966552734375, -1.383514404296875, -1.29736328125, -1.211212158203125, -1.12506103515625, -1.038909912109375, -0.9527587890625, -0.866607666015625, -0.78045654296875, -0.694305419921875, -0.608154296875, -0.522003173828125, -0.43585205078125, -0.349700927734375, -0.2635498046875, -0.177398681640625, -0.09124755859375, -0.005096435546875, 0.0810546875, 0.167205810546875, 0.25335693359375, 0.339508056640625, 0.4256591796875, 0.511810302734375, 0.59796142578125, 0.684112548828125, 0.770263671875, 0.856414794921875, 0.94256591796875, 1.028717041015625, 1.1148681640625, 1.201019287109375, 1.28717041015625, 1.373321533203125, 1.45947265625, 1.545623779296875, 1.63177490234375, 1.717926025390625, 1.8040771484375, 1.890228271484375, 1.97637939453125, 2.062530517578125, 2.148681640625, 2.234832763671875, 2.32098388671875, 2.407135009765625, 2.4932861328125, 2.579437255859375, 2.66558837890625, 2.751739501953125, 2.837890625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 15.0, 17.0, 24.0, 37.0, 51.0, 73.0, 79.0, 89.0, 91.0, 105.0, 100.0, 76.0, 88.0, 45.0, 46.0, 21.0, 19.0, 14.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.82275390625, -0.8056755065917969, -0.7885971069335938, -0.7715187072753906, -0.7544403076171875, -0.7373619079589844, -0.7202835083007812, -0.7032051086425781, -0.686126708984375, -0.6690483093261719, -0.6519699096679688, -0.6348915100097656, -0.6178131103515625, -0.6007347106933594, -0.5836563110351562, -0.5665779113769531, -0.54949951171875, -0.5324211120605469, -0.5153427124023438, -0.4982643127441406, -0.4811859130859375, -0.4641075134277344, -0.44702911376953125, -0.4299507141113281, -0.412872314453125, -0.3957939147949219, -0.37871551513671875, -0.3616371154785156, -0.3445587158203125, -0.3274803161621094, -0.31040191650390625, -0.2933235168457031, -0.2762451171875, -0.2591667175292969, -0.24208831787109375, -0.22500991821289062, -0.2079315185546875, -0.19085311889648438, -0.17377471923828125, -0.15669631958007812, -0.139617919921875, -0.12253952026367188, -0.10546112060546875, -0.08838272094726562, -0.0713043212890625, -0.054225921630859375, -0.03714752197265625, -0.020069122314453125, -0.00299072265625, 0.014087677001953125, 0.03116607666015625, 0.048244476318359375, 0.0653228759765625, 0.08240127563476562, 0.09947967529296875, 0.11655807495117188, 0.133636474609375, 0.15071487426757812, 0.16779327392578125, 0.18487167358398438, 0.2019500732421875, 0.21902847290039062, 0.23610687255859375, 0.2531852722167969, 0.270263671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 9.0, 3.0, 8.0, 11.0, 14.0, 16.0, 27.0, 36.0, 55.0, 56.0, 103.0, 155.0, 255.0, 376.0, 741.0, 1231.0, 2439.0, 5183.0, 11766.0, 29646.0, 83236.0, 260651.0, 412154.0, 153994.0, 51547.0, 18989.0, 7972.0, 3561.0, 1840.0, 994.0, 562.0, 281.0, 221.0, 128.0, 84.0, 59.0, 31.0, 36.0, 24.0, 16.0, 13.0, 14.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.91943359375, -0.892608642578125, -0.86578369140625, -0.838958740234375, -0.8121337890625, -0.785308837890625, -0.75848388671875, -0.731658935546875, -0.704833984375, -0.678009033203125, -0.65118408203125, -0.624359130859375, -0.5975341796875, -0.570709228515625, -0.54388427734375, -0.517059326171875, -0.490234375, -0.463409423828125, -0.43658447265625, -0.409759521484375, -0.3829345703125, -0.356109619140625, -0.32928466796875, -0.302459716796875, -0.275634765625, -0.248809814453125, -0.22198486328125, -0.195159912109375, -0.1683349609375, -0.141510009765625, -0.11468505859375, -0.087860107421875, -0.06103515625, -0.034210205078125, -0.00738525390625, 0.019439697265625, 0.0462646484375, 0.073089599609375, 0.09991455078125, 0.126739501953125, 0.153564453125, 0.180389404296875, 0.20721435546875, 0.234039306640625, 0.2608642578125, 0.287689208984375, 0.31451416015625, 0.341339111328125, 0.3681640625, 0.394989013671875, 0.42181396484375, 0.448638916015625, 0.4754638671875, 0.502288818359375, 0.52911376953125, 0.555938720703125, 0.582763671875, 0.609588623046875, 0.63641357421875, 0.663238525390625, 0.6900634765625, 0.716888427734375, 0.74371337890625, 0.770538330078125, 0.79736328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 8.0, 5.0, 10.0, 7.0, 17.0, 15.0, 20.0, 24.0, 22.0, 29.0, 36.0, 32.0, 45.0, 33.0, 50.0, 47.0, 42.0, 47.0, 41.0, 54.0, 42.0, 38.0, 41.0, 40.0, 36.0, 28.0, 41.0, 24.0, 20.0, 20.0, 19.0, 21.0, 9.0, 8.0, 7.0, 7.0, 2.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3212890625, -1.2852249145507812, -1.2491607666015625, -1.2130966186523438, -1.177032470703125, -1.1409683227539062, -1.1049041748046875, -1.0688400268554688, -1.03277587890625, -0.9967117309570312, -0.9606475830078125, -0.9245834350585938, -0.888519287109375, -0.8524551391601562, -0.8163909912109375, -0.7803268432617188, -0.7442626953125, -0.7081985473632812, -0.6721343994140625, -0.6360702514648438, -0.600006103515625, -0.5639419555664062, -0.5278778076171875, -0.49181365966796875, -0.45574951171875, -0.41968536376953125, -0.3836212158203125, -0.34755706787109375, -0.311492919921875, -0.27542877197265625, -0.2393646240234375, -0.20330047607421875, -0.167236328125, -0.13117218017578125, -0.0951080322265625, -0.05904388427734375, -0.022979736328125, 0.01308441162109375, 0.0491485595703125, 0.08521270751953125, 0.12127685546875, 0.15734100341796875, 0.1934051513671875, 0.22946929931640625, 0.265533447265625, 0.30159759521484375, 0.3376617431640625, 0.37372589111328125, 0.4097900390625, 0.44585418701171875, 0.4819183349609375, 0.5179824829101562, 0.554046630859375, 0.5901107788085938, 0.6261749267578125, 0.6622390747070312, 0.69830322265625, 0.7343673706054688, 0.7704315185546875, 0.8064956665039062, 0.842559814453125, 0.8786239624023438, 0.9146881103515625, 0.9507522583007812, 0.98681640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 10.0, 13.0, 31.0, 55.0, 135.0, 333.0, 993.0, 3575.0, 21748.0, 423834.0, 566554.0, 25601.0, 4067.0, 1005.0, 334.0, 139.0, 64.0, 32.0, 13.0, 8.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1084136962890625, -1.067413330078125, -1.0264129638671875, -0.98541259765625, -0.9444122314453125, -0.903411865234375, -0.8624114990234375, -0.8214111328125, -0.7804107666015625, -0.739410400390625, -0.6984100341796875, -0.65740966796875, -0.6164093017578125, -0.575408935546875, -0.5344085693359375, -0.493408203125, -0.4524078369140625, -0.411407470703125, -0.3704071044921875, -0.32940673828125, -0.2884063720703125, -0.247406005859375, -0.2064056396484375, -0.1654052734375, -0.1244049072265625, -0.083404541015625, -0.0424041748046875, -0.00140380859375, 0.0395965576171875, 0.080596923828125, 0.1215972900390625, 0.16259765625, 0.2035980224609375, 0.244598388671875, 0.2855987548828125, 0.32659912109375, 0.3675994873046875, 0.408599853515625, 0.4496002197265625, 0.4906005859375, 0.5316009521484375, 0.572601318359375, 0.6136016845703125, 0.65460205078125, 0.6956024169921875, 0.736602783203125, 0.7776031494140625, 0.818603515625, 0.8596038818359375, 0.900604248046875, 0.9416046142578125, 0.98260498046875, 1.0236053466796875, 1.064605712890625, 1.1056060791015625, 1.1466064453125, 1.1876068115234375, 1.228607177734375, 1.2696075439453125, 1.31060791015625, 1.3516082763671875, 1.392608642578125, 1.4336090087890625, 1.474609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 16.0, 17.0, 29.0, 38.0, 68.0, 95.0, 213.0, 185.0, 97.0, 69.0, 46.0, 33.0, 21.0, 10.0, 10.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0002237558364868164, -0.0002175401896238327, -0.000211324542760849, -0.0002051088958978653, -0.0001988932490348816, -0.0001926776021718979, -0.00018646195530891418, -0.00018024630844593048, -0.00017403066158294678, -0.00016781501471996307, -0.00016159936785697937, -0.00015538372099399567, -0.00014916807413101196, -0.00014295242726802826, -0.00013673678040504456, -0.00013052113354206085, -0.00012430548667907715, -0.00011808983981609344, -0.00011187419295310974, -0.00010565854609012604, -9.944289922714233e-05, -9.322725236415863e-05, -8.701160550117493e-05, -8.079595863819122e-05, -7.458031177520752e-05, -6.836466491222382e-05, -6.214901804924011e-05, -5.593337118625641e-05, -4.9717724323272705e-05, -4.3502077460289e-05, -3.72864305973053e-05, -3.1070783734321594e-05, -2.485513687133789e-05, -1.8639490008354187e-05, -1.2423843145370483e-05, -6.20819628238678e-06, 7.450580596923828e-09, 6.2230974435806274e-06, 1.2438744306564331e-05, 1.8654391169548035e-05, 2.4870038032531738e-05, 3.108568489551544e-05, 3.7301331758499146e-05, 4.351697862148285e-05, 4.973262548446655e-05, 5.5948272347450256e-05, 6.216391921043396e-05, 6.837956607341766e-05, 7.459521293640137e-05, 8.081085979938507e-05, 8.702650666236877e-05, 9.324215352535248e-05, 9.945780038833618e-05, 0.00010567344725131989, 0.00011188909411430359, 0.00011810474097728729, 0.000124320387840271, 0.0001305360347032547, 0.0001367516815662384, 0.0001429673284292221, 0.0001491829752922058, 0.00015539862215518951, 0.00016161426901817322, 0.00016782991588115692, 0.00017404556274414062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 6.0, 9.0, 2.0, 6.0, 10.0, 20.0, 49.0, 65.0, 112.0, 163.0, 294.0, 491.0, 1061.0, 2417.0, 6516.0, 23285.0, 123556.0, 706337.0, 145752.0, 26242.0, 7223.0, 2589.0, 1081.0, 539.0, 270.0, 185.0, 85.0, 64.0, 32.0, 25.0, 16.0, 11.0, 13.0, 9.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.82373046875, -0.7958450317382812, -0.7679595947265625, -0.7400741577148438, -0.712188720703125, -0.6843032836914062, -0.6564178466796875, -0.6285324096679688, -0.60064697265625, -0.5727615356445312, -0.5448760986328125, -0.5169906616210938, -0.489105224609375, -0.46121978759765625, -0.4333343505859375, -0.40544891357421875, -0.3775634765625, -0.34967803955078125, -0.3217926025390625, -0.29390716552734375, -0.266021728515625, -0.23813629150390625, -0.2102508544921875, -0.18236541748046875, -0.15447998046875, -0.12659454345703125, -0.0987091064453125, -0.07082366943359375, -0.042938232421875, -0.01505279541015625, 0.0128326416015625, 0.04071807861328125, 0.068603515625, 0.09648895263671875, 0.1243743896484375, 0.15225982666015625, 0.180145263671875, 0.20803070068359375, 0.2359161376953125, 0.26380157470703125, 0.29168701171875, 0.31957244873046875, 0.3474578857421875, 0.37534332275390625, 0.403228759765625, 0.43111419677734375, 0.4589996337890625, 0.48688507080078125, 0.5147705078125, 0.5426559448242188, 0.5705413818359375, 0.5984268188476562, 0.626312255859375, 0.6541976928710938, 0.6820831298828125, 0.7099685668945312, 0.73785400390625, 0.7657394409179688, 0.7936248779296875, 0.8215103149414062, 0.849395751953125, 0.8772811889648438, 0.9051666259765625, 0.9330520629882812, 0.9609375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 4.0, 9.0, 8.0, 11.0, 17.0, 29.0, 39.0, 34.0, 87.0, 116.0, 168.0, 143.0, 101.0, 73.0, 34.0, 25.0, 32.0, 20.0, 13.0, 8.0, 6.0, 6.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.5762786865234375, -0.550994873046875, -0.5257110595703125, -0.50042724609375, -0.4751434326171875, -0.449859619140625, -0.4245758056640625, -0.3992919921875, -0.3740081787109375, -0.348724365234375, -0.3234405517578125, -0.29815673828125, -0.2728729248046875, -0.247589111328125, -0.2223052978515625, -0.197021484375, -0.1717376708984375, -0.146453857421875, -0.1211700439453125, -0.09588623046875, -0.0706024169921875, -0.045318603515625, -0.0200347900390625, 0.0052490234375, 0.0305328369140625, 0.055816650390625, 0.0811004638671875, 0.10638427734375, 0.1316680908203125, 0.156951904296875, 0.1822357177734375, 0.20751953125, 0.2328033447265625, 0.258087158203125, 0.2833709716796875, 0.30865478515625, 0.3339385986328125, 0.359222412109375, 0.3845062255859375, 0.4097900390625, 0.4350738525390625, 0.460357666015625, 0.4856414794921875, 0.51092529296875, 0.5362091064453125, 0.561492919921875, 0.5867767333984375, 0.612060546875, 0.6373443603515625, 0.662628173828125, 0.6879119873046875, 0.71319580078125, 0.7384796142578125, 0.763763427734375, 0.7890472412109375, 0.8143310546875, 0.8396148681640625, 0.864898681640625, 0.8901824951171875, 0.91546630859375, 0.9407501220703125, 0.966033935546875, 0.9913177490234375, 1.0166015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 16.0, 45.0, 139.0, 303.0, 301.0, 134.0, 46.0, 17.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.357422828674316, -9.661396980285645, -8.965370178222656, -8.269344329833984, -7.5733184814453125, -6.877292633056641, -6.1812663078308105, -5.4852399826049805, -4.789214134216309, -4.093188285827637, -3.3971619606018066, -2.7011358737945557, -2.0051097869873047, -1.3090837001800537, -0.6130576133728027, 0.08296871185302734, 0.7789945602416992, 1.4750206470489502, 2.171046733856201, 2.867072820663452, 3.563098907470703, 4.259124755859375, 4.955151081085205, 5.651177406311035, 6.347203254699707, 7.043229103088379, 7.739255428314209, 8.435281753540039, 9.131307601928711, 9.827333450317383, 10.523359298706055, 11.219386100769043, 11.915412902832031, 12.611438751220703, 13.307464599609375, 14.003491401672363, 14.699517250061035, 15.395543098449707, 16.091569900512695, 16.787595748901367, 17.48362159729004, 18.17964744567871, 18.875673294067383, 19.571699142456055, 20.26772689819336, 20.96375274658203, 21.659778594970703, 22.355804443359375, 23.051830291748047, 23.74785614013672, 24.44388198852539, 25.139907836914062, 25.835933685302734, 26.53196144104004, 27.22798728942871, 27.924013137817383, 28.620038986206055, 29.316064834594727, 30.0120906829834, 30.70811653137207, 31.404144287109375, 32.10017013549805, 32.79619598388672, 33.49222183227539, 34.18824768066406]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 4.0, 8.0, 8.0, 9.0, 9.0, 14.0, 11.0, 17.0, 13.0, 25.0, 26.0, 29.0, 30.0, 23.0, 25.0, 27.0, 30.0, 33.0, 26.0, 28.0, 41.0, 32.0, 33.0, 33.0, 43.0, 41.0, 38.0, 37.0, 32.0, 21.0, 26.0, 27.0, 33.0, 19.0, 17.0, 24.0, 7.0, 13.0, 11.0, 8.0, 13.0, 6.0, 9.0, 9.0, 4.0, 4.0, 6.0, 0.0, 1.0, 5.0, 2.0, 2.0], "bins": [-4.9556121826171875, -4.808562755584717, -4.661513328552246, -4.514464378356934, -4.367414951324463, -4.220365524291992, -4.0733160972595215, -3.926266670227051, -3.779217481613159, -3.6321680545806885, -3.485118865966797, -3.338069438934326, -3.1910200119018555, -3.043970823287964, -2.896921396255493, -2.7498722076416016, -2.602822780609131, -2.45577335357666, -2.3087241649627686, -2.161674737930298, -2.0146255493164062, -1.8675761222839355, -1.7205266952514648, -1.5734773874282837, -1.4264280796051025, -1.2793787717819214, -1.1323294639587402, -0.9852800369262695, -0.8382307291030884, -0.6911814212799072, -0.5441320538520813, -0.39708268642425537, -0.2500333786010742, -0.10298404097557068, 0.04406529664993286, 0.1911146342754364, 0.33816397190093994, 0.4852132797241211, 0.632262647151947, 0.779312014579773, 0.9263613224029541, 1.0734106302261353, 1.2204599380493164, 1.367509365081787, 1.5145586729049683, 1.6616079807281494, 1.8086574077606201, 1.9557067155838013, 2.1027560234069824, 2.249805450439453, 2.3968546390533447, 2.5439040660858154, 2.690953254699707, 2.8380026817321777, 2.9850521087646484, 3.132101535797119, 3.2791507244110107, 3.4262001514434814, 3.573249340057373, 3.7202987670898438, 3.8673481941223145, 4.014397621154785, 4.161446571350098, 4.308495998382568, 4.455545425415039]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 4.0, 11.0, 20.0, 27.0, 30.0, 51.0, 64.0, 119.0, 169.0, 244.0, 486.0, 877.0, 2113.0, 6469.0, 33016.0, 3890135.0, 237338.0, 15803.0, 4101.0, 1547.0, 692.0, 363.0, 191.0, 129.0, 80.0, 58.0, 40.0, 25.0, 16.0, 8.0, 7.0, 6.0, 8.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.537109375, -3.425872802734375, -3.31463623046875, -3.203399658203125, -3.0921630859375, -2.980926513671875, -2.86968994140625, -2.758453369140625, -2.647216796875, -2.535980224609375, -2.42474365234375, -2.313507080078125, -2.2022705078125, -2.091033935546875, -1.97979736328125, -1.868560791015625, -1.75732421875, -1.646087646484375, -1.53485107421875, -1.423614501953125, -1.3123779296875, -1.201141357421875, -1.08990478515625, -0.978668212890625, -0.867431640625, -0.756195068359375, -0.64495849609375, -0.533721923828125, -0.4224853515625, -0.311248779296875, -0.20001220703125, -0.088775634765625, 0.0224609375, 0.133697509765625, 0.24493408203125, 0.356170654296875, 0.4674072265625, 0.578643798828125, 0.68988037109375, 0.801116943359375, 0.912353515625, 1.023590087890625, 1.13482666015625, 1.246063232421875, 1.3572998046875, 1.468536376953125, 1.57977294921875, 1.691009521484375, 1.80224609375, 1.913482666015625, 2.02471923828125, 2.135955810546875, 2.2471923828125, 2.358428955078125, 2.46966552734375, 2.580902099609375, 2.692138671875, 2.803375244140625, 2.91461181640625, 3.025848388671875, 3.1370849609375, 3.248321533203125, 3.35955810546875, 3.470794677734375, 3.58203125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 11.0, 13.0, 17.0, 27.0, 32.0, 38.0, 47.0, 67.0, 61.0, 59.0, 70.0, 60.0, 70.0, 64.0, 71.0, 69.0, 50.0, 35.0, 40.0, 27.0, 18.0, 13.0, 15.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.398193359375, -0.38513946533203125, -0.3720855712890625, -0.35903167724609375, -0.345977783203125, -0.33292388916015625, -0.3198699951171875, -0.30681610107421875, -0.29376220703125, -0.28070831298828125, -0.2676544189453125, -0.25460052490234375, -0.241546630859375, -0.22849273681640625, -0.2154388427734375, -0.20238494873046875, -0.1893310546875, -0.17627716064453125, -0.1632232666015625, -0.15016937255859375, -0.137115478515625, -0.12406158447265625, -0.1110076904296875, -0.09795379638671875, -0.08489990234375, -0.07184600830078125, -0.0587921142578125, -0.04573822021484375, -0.032684326171875, -0.01963043212890625, -0.0065765380859375, 0.00647735595703125, 0.01953125, 0.03258514404296875, 0.0456390380859375, 0.05869293212890625, 0.071746826171875, 0.08480072021484375, 0.0978546142578125, 0.11090850830078125, 0.12396240234375, 0.13701629638671875, 0.1500701904296875, 0.16312408447265625, 0.176177978515625, 0.18923187255859375, 0.2022857666015625, 0.21533966064453125, 0.2283935546875, 0.24144744873046875, 0.2545013427734375, 0.26755523681640625, 0.280609130859375, 0.29366302490234375, 0.3067169189453125, 0.31977081298828125, 0.33282470703125, 0.34587860107421875, 0.3589324951171875, 0.37198638916015625, 0.385040283203125, 0.39809417724609375, 0.4111480712890625, 0.42420196533203125, 0.437255859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 8.0, 4.0, 9.0, 13.0, 17.0, 17.0, 16.0, 32.0, 33.0, 57.0, 46.0, 76.0, 140.0, 198.0, 366.0, 646.0, 1260.0, 2844.0, 7486.0, 24250.0, 146692.0, 3809241.0, 161855.0, 25177.0, 7615.0, 3045.0, 1389.0, 703.0, 379.0, 192.0, 135.0, 88.0, 52.0, 49.0, 37.0, 24.0, 17.0, 16.0, 16.0, 7.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.159271240234375, -2.08612060546875, -2.012969970703125, -1.9398193359375, -1.866668701171875, -1.79351806640625, -1.720367431640625, -1.647216796875, -1.574066162109375, -1.50091552734375, -1.427764892578125, -1.3546142578125, -1.281463623046875, -1.20831298828125, -1.135162353515625, -1.06201171875, -0.988861083984375, -0.91571044921875, -0.842559814453125, -0.7694091796875, -0.696258544921875, -0.62310791015625, -0.549957275390625, -0.476806640625, -0.403656005859375, -0.33050537109375, -0.257354736328125, -0.1842041015625, -0.111053466796875, -0.03790283203125, 0.035247802734375, 0.1083984375, 0.181549072265625, 0.25469970703125, 0.327850341796875, 0.4010009765625, 0.474151611328125, 0.54730224609375, 0.620452880859375, 0.693603515625, 0.766754150390625, 0.83990478515625, 0.913055419921875, 0.9862060546875, 1.059356689453125, 1.13250732421875, 1.205657958984375, 1.27880859375, 1.351959228515625, 1.42510986328125, 1.498260498046875, 1.5714111328125, 1.644561767578125, 1.71771240234375, 1.790863037109375, 1.864013671875, 1.937164306640625, 2.01031494140625, 2.083465576171875, 2.1566162109375, 2.229766845703125, 2.30291748046875, 2.376068115234375, 2.44921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 11.0, 8.0, 17.0, 23.0, 37.0, 68.0, 171.0, 802.0, 2355.0, 337.0, 112.0, 54.0, 28.0, 19.0, 13.0, 3.0, 5.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4609222412109375, -1.416961669921875, -1.3730010986328125, -1.32904052734375, -1.2850799560546875, -1.241119384765625, -1.1971588134765625, -1.1531982421875, -1.1092376708984375, -1.065277099609375, -1.0213165283203125, -0.97735595703125, -0.9333953857421875, -0.889434814453125, -0.8454742431640625, -0.801513671875, -0.7575531005859375, -0.713592529296875, -0.6696319580078125, -0.62567138671875, -0.5817108154296875, -0.537750244140625, -0.4937896728515625, -0.4498291015625, -0.4058685302734375, -0.361907958984375, -0.3179473876953125, -0.27398681640625, -0.2300262451171875, -0.186065673828125, -0.1421051025390625, -0.09814453125, -0.0541839599609375, -0.010223388671875, 0.0337371826171875, 0.07769775390625, 0.1216583251953125, 0.165618896484375, 0.2095794677734375, 0.2535400390625, 0.2975006103515625, 0.341461181640625, 0.3854217529296875, 0.42938232421875, 0.4733428955078125, 0.517303466796875, 0.5612640380859375, 0.605224609375, 0.6491851806640625, 0.693145751953125, 0.7371063232421875, 0.78106689453125, 0.8250274658203125, 0.868988037109375, 0.9129486083984375, 0.9569091796875, 1.0008697509765625, 1.044830322265625, 1.0887908935546875, 1.13275146484375, 1.1767120361328125, 1.220672607421875, 1.2646331787109375, 1.30859375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 8.0, 23.0, 59.0, 110.0, 225.0, 260.0, 163.0, 85.0, 34.0, 17.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.926462173461914, -13.630342483520508, -13.334223747253418, -13.038104057312012, -12.741984367370605, -12.4458646774292, -12.14974594116211, -11.853626251220703, -11.557506561279297, -11.26138687133789, -10.9652681350708, -10.669148445129395, -10.373028755187988, -10.076909065246582, -9.780790328979492, -9.484670639038086, -9.18855094909668, -8.892431259155273, -8.596312522888184, -8.300192832946777, -8.004073143005371, -7.707953929901123, -7.411834716796875, -7.115715026855469, -6.819596290588379, -6.523477077484131, -6.227357387542725, -5.931238174438477, -5.63511848449707, -5.338999271392822, -5.042880058288574, -4.746760368347168, -4.4506402015686035, -4.1545209884643555, -3.858401298522949, -3.562282085418701, -3.266162395477295, -2.970043182373047, -2.6739237308502197, -2.3778042793273926, -2.0816848278045654, -1.7855653762817383, -1.4894459247589111, -1.1933265924453735, -0.8972071409225464, -0.6010876893997192, -0.30496835708618164, -0.008848905563354492, 0.28727054595947266, 0.5833899974822998, 0.8795093894004822, 1.1756287813186646, 1.4717482328414917, 1.7678676843643188, 2.0639870166778564, 2.3601064682006836, 2.6562259197235107, 2.952345371246338, 3.248464822769165, 3.544584274291992, 3.8407034873962402, 4.1368231773376465, 4.4329423904418945, 4.729062080383301, 5.025181293487549]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 12.0, 21.0, 21.0, 20.0, 28.0, 30.0, 29.0, 43.0, 54.0, 56.0, 51.0, 58.0, 60.0, 64.0, 46.0, 59.0, 58.0, 51.0, 38.0, 45.0, 35.0, 32.0, 20.0, 16.0, 13.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5452940464019775, -3.439828395843506, -3.334362745285034, -3.2288970947265625, -3.1234312057495117, -3.017965793609619, -2.9124999046325684, -2.8070342540740967, -2.701568603515625, -2.5961029529571533, -2.4906373023986816, -2.38517165184021, -2.2797060012817383, -2.1742401123046875, -2.068774461746216, -1.9633088111877441, -1.8578431606292725, -1.7523775100708008, -1.646911859512329, -1.5414460897445679, -1.4359804391860962, -1.3305147886276245, -1.2250490188598633, -1.1195833683013916, -1.01411771774292, -0.9086520671844482, -0.8031863570213318, -0.6977206468582153, -0.5922549962997437, -0.486789345741272, -0.3813236355781555, -0.27585792541503906, -0.17039251327514648, -0.06492683291435242, 0.04053884744644165, 0.14600452780723572, 0.2514702081680298, 0.35693585872650146, 0.4624015688896179, 0.5678672790527344, 0.673332929611206, 0.7787985801696777, 0.8842642903327942, 0.9897300004959106, 1.0951956510543823, 1.200661301612854, 1.3061270713806152, 1.411592721939087, 1.5170583724975586, 1.6225240230560303, 1.727989673614502, 1.8334554433822632, 1.9389210939407349, 2.044386863708496, 2.1498525142669678, 2.2553181648254395, 2.360783815383911, 2.466249465942383, 2.5717151165008545, 2.677180767059326, 2.782646656036377, 2.8881120681762695, 2.9935779571533203, 3.099043607711792, 3.2045092582702637]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 5.0, 13.0, 11.0, 13.0, 27.0, 58.0, 91.0, 147.0, 243.0, 542.0, 1243.0, 3367.0, 12917.0, 83437.0, 646667.0, 260109.0, 29885.0, 6250.0, 1891.0, 765.0, 380.0, 190.0, 106.0, 63.0, 38.0, 32.0, 14.0, 14.0, 8.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.751953125, -2.662445068359375, -2.57293701171875, -2.483428955078125, -2.3939208984375, -2.304412841796875, -2.21490478515625, -2.125396728515625, -2.035888671875, -1.946380615234375, -1.85687255859375, -1.767364501953125, -1.6778564453125, -1.588348388671875, -1.49884033203125, -1.409332275390625, -1.31982421875, -1.230316162109375, -1.14080810546875, -1.051300048828125, -0.9617919921875, -0.872283935546875, -0.78277587890625, -0.693267822265625, -0.603759765625, -0.514251708984375, -0.42474365234375, -0.335235595703125, -0.2457275390625, -0.156219482421875, -0.06671142578125, 0.022796630859375, 0.1123046875, 0.201812744140625, 0.29132080078125, 0.380828857421875, 0.4703369140625, 0.559844970703125, 0.64935302734375, 0.738861083984375, 0.828369140625, 0.917877197265625, 1.00738525390625, 1.096893310546875, 1.1864013671875, 1.275909423828125, 1.36541748046875, 1.454925537109375, 1.54443359375, 1.633941650390625, 1.72344970703125, 1.812957763671875, 1.9024658203125, 1.991973876953125, 2.08148193359375, 2.170989990234375, 2.260498046875, 2.350006103515625, 2.43951416015625, 2.529022216796875, 2.6185302734375, 2.708038330078125, 2.79754638671875, 2.887054443359375, 2.9765625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 27.0, 25.0, 42.0, 62.0, 53.0, 90.0, 80.0, 88.0, 92.0, 91.0, 78.0, 69.0, 47.0, 33.0, 24.0, 23.0, 17.0, 13.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63818359375, -0.6199264526367188, -0.6016693115234375, -0.5834121704101562, -0.565155029296875, -0.5468978881835938, -0.5286407470703125, -0.5103836059570312, -0.49212646484375, -0.47386932373046875, -0.4556121826171875, -0.43735504150390625, -0.419097900390625, -0.40084075927734375, -0.3825836181640625, -0.36432647705078125, -0.3460693359375, -0.32781219482421875, -0.3095550537109375, -0.29129791259765625, -0.273040771484375, -0.25478363037109375, -0.2365264892578125, -0.21826934814453125, -0.20001220703125, -0.18175506591796875, -0.1634979248046875, -0.14524078369140625, -0.126983642578125, -0.10872650146484375, -0.0904693603515625, -0.07221221923828125, -0.053955078125, -0.03569793701171875, -0.0174407958984375, 0.00081634521484375, 0.019073486328125, 0.03733062744140625, 0.0555877685546875, 0.07384490966796875, 0.09210205078125, 0.11035919189453125, 0.1286163330078125, 0.14687347412109375, 0.165130615234375, 0.18338775634765625, 0.2016448974609375, 0.21990203857421875, 0.2381591796875, 0.25641632080078125, 0.2746734619140625, 0.29293060302734375, 0.311187744140625, 0.32944488525390625, 0.3477020263671875, 0.36595916748046875, 0.38421630859375, 0.40247344970703125, 0.4207305908203125, 0.43898773193359375, 0.457244873046875, 0.47550201416015625, 0.4937591552734375, 0.5120162963867188, 0.5302734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 9.0, 12.0, 14.0, 10.0, 31.0, 29.0, 52.0, 89.0, 123.0, 184.0, 263.0, 482.0, 867.0, 1751.0, 3553.0, 8215.0, 20729.0, 57746.0, 192856.0, 467853.0, 197738.0, 59014.0, 21018.0, 8409.0, 3639.0, 1698.0, 850.0, 467.0, 293.0, 166.0, 108.0, 79.0, 63.0, 42.0, 22.0, 16.0, 17.0, 14.0, 5.0, 9.0, 6.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0947265625, -1.054931640625, -1.01513671875, -0.975341796875, -0.935546875, -0.895751953125, -0.85595703125, -0.816162109375, -0.7763671875, -0.736572265625, -0.69677734375, -0.656982421875, -0.6171875, -0.577392578125, -0.53759765625, -0.497802734375, -0.4580078125, -0.418212890625, -0.37841796875, -0.338623046875, -0.298828125, -0.259033203125, -0.21923828125, -0.179443359375, -0.1396484375, -0.099853515625, -0.06005859375, -0.020263671875, 0.01953125, 0.059326171875, 0.09912109375, 0.138916015625, 0.1787109375, 0.218505859375, 0.25830078125, 0.298095703125, 0.337890625, 0.377685546875, 0.41748046875, 0.457275390625, 0.4970703125, 0.536865234375, 0.57666015625, 0.616455078125, 0.65625, 0.696044921875, 0.73583984375, 0.775634765625, 0.8154296875, 0.855224609375, 0.89501953125, 0.934814453125, 0.974609375, 1.014404296875, 1.05419921875, 1.093994140625, 1.1337890625, 1.173583984375, 1.21337890625, 1.253173828125, 1.29296875, 1.332763671875, 1.37255859375, 1.412353515625, 1.4521484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 1.0, 4.0, 4.0, 3.0, 6.0, 7.0, 15.0, 12.0, 16.0, 24.0, 24.0, 23.0, 35.0, 28.0, 30.0, 34.0, 33.0, 41.0, 38.0, 45.0, 37.0, 39.0, 48.0, 48.0, 51.0, 45.0, 35.0, 33.0, 28.0, 24.0, 34.0, 28.0, 23.0, 25.0, 11.0, 16.0, 11.0, 12.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.49609375, -1.448974609375, -1.40185546875, -1.354736328125, -1.3076171875, -1.260498046875, -1.21337890625, -1.166259765625, -1.119140625, -1.072021484375, -1.02490234375, -0.977783203125, -0.9306640625, -0.883544921875, -0.83642578125, -0.789306640625, -0.7421875, -0.695068359375, -0.64794921875, -0.600830078125, -0.5537109375, -0.506591796875, -0.45947265625, -0.412353515625, -0.365234375, -0.318115234375, -0.27099609375, -0.223876953125, -0.1767578125, -0.129638671875, -0.08251953125, -0.035400390625, 0.01171875, 0.058837890625, 0.10595703125, 0.153076171875, 0.2001953125, 0.247314453125, 0.29443359375, 0.341552734375, 0.388671875, 0.435791015625, 0.48291015625, 0.530029296875, 0.5771484375, 0.624267578125, 0.67138671875, 0.718505859375, 0.765625, 0.812744140625, 0.85986328125, 0.906982421875, 0.9541015625, 1.001220703125, 1.04833984375, 1.095458984375, 1.142578125, 1.189697265625, 1.23681640625, 1.283935546875, 1.3310546875, 1.378173828125, 1.42529296875, 1.472412109375, 1.51953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 9.0, 11.0, 12.0, 27.0, 41.0, 64.0, 92.0, 165.0, 323.0, 633.0, 1395.0, 3405.0, 9954.0, 39735.0, 241191.0, 580491.0, 134770.0, 24670.0, 6790.0, 2635.0, 1064.0, 480.0, 264.0, 141.0, 79.0, 33.0, 22.0, 17.0, 15.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56982421875, -0.5481948852539062, -0.5265655517578125, -0.5049362182617188, -0.483306884765625, -0.46167755126953125, -0.4400482177734375, -0.41841888427734375, -0.39678955078125, -0.37516021728515625, -0.3535308837890625, -0.33190155029296875, -0.310272216796875, -0.28864288330078125, -0.2670135498046875, -0.24538421630859375, -0.2237548828125, -0.20212554931640625, -0.1804962158203125, -0.15886688232421875, -0.137237548828125, -0.11560821533203125, -0.0939788818359375, -0.07234954833984375, -0.05072021484375, -0.02909088134765625, -0.0074615478515625, 0.01416778564453125, 0.035797119140625, 0.05742645263671875, 0.0790557861328125, 0.10068511962890625, 0.122314453125, 0.14394378662109375, 0.1655731201171875, 0.18720245361328125, 0.208831787109375, 0.23046112060546875, 0.2520904541015625, 0.27371978759765625, 0.29534912109375, 0.31697845458984375, 0.3386077880859375, 0.36023712158203125, 0.381866455078125, 0.40349578857421875, 0.4251251220703125, 0.44675445556640625, 0.4683837890625, 0.49001312255859375, 0.5116424560546875, 0.5332717895507812, 0.554901123046875, 0.5765304565429688, 0.5981597900390625, 0.6197891235351562, 0.64141845703125, 0.6630477905273438, 0.6846771240234375, 0.7063064575195312, 0.727935791015625, 0.7495651245117188, 0.7711944580078125, 0.7928237915039062, 0.814453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 7.0, 5.0, 9.0, 14.0, 23.0, 20.0, 23.0, 20.0, 50.0, 67.0, 62.0, 72.0, 74.0, 106.0, 75.0, 76.0, 59.0, 45.0, 29.0, 39.0, 26.0, 15.0, 17.0, 17.0, 9.0, 3.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011795759201049805, -0.00011461973190307617, -0.0001112818717956543, -0.00010794401168823242, -0.00010460615158081055, -0.00010126829147338867, -9.79304313659668e-05, -9.459257125854492e-05, -9.125471115112305e-05, -8.791685104370117e-05, -8.45789909362793e-05, -8.124113082885742e-05, -7.790327072143555e-05, -7.456541061401367e-05, -7.12275505065918e-05, -6.788969039916992e-05, -6.455183029174805e-05, -6.121397018432617e-05, -5.78761100769043e-05, -5.453824996948242e-05, -5.120038986206055e-05, -4.786252975463867e-05, -4.45246696472168e-05, -4.118680953979492e-05, -3.784894943237305e-05, -3.451108932495117e-05, -3.11732292175293e-05, -2.7835369110107422e-05, -2.4497509002685547e-05, -2.1159648895263672e-05, -1.7821788787841797e-05, -1.4483928680419922e-05, -1.1146068572998047e-05, -7.808208465576172e-06, -4.470348358154297e-06, -1.1324882507324219e-06, 2.205371856689453e-06, 5.543231964111328e-06, 8.881092071533203e-06, 1.2218952178955078e-05, 1.5556812286376953e-05, 1.8894672393798828e-05, 2.2232532501220703e-05, 2.5570392608642578e-05, 2.8908252716064453e-05, 3.224611282348633e-05, 3.55839729309082e-05, 3.892183303833008e-05, 4.225969314575195e-05, 4.559755325317383e-05, 4.89354133605957e-05, 5.227327346801758e-05, 5.561113357543945e-05, 5.894899368286133e-05, 6.22868537902832e-05, 6.562471389770508e-05, 6.896257400512695e-05, 7.230043411254883e-05, 7.56382942199707e-05, 7.897615432739258e-05, 8.231401443481445e-05, 8.565187454223633e-05, 8.89897346496582e-05, 9.232759475708008e-05, 9.566545486450195e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 3.0, 5.0, 11.0, 12.0, 11.0, 13.0, 32.0, 40.0, 41.0, 67.0, 114.0, 159.0, 263.0, 460.0, 764.0, 1517.0, 2899.0, 6152.0, 15138.0, 43561.0, 147426.0, 407335.0, 290175.0, 86116.0, 26992.0, 9966.0, 4358.0, 2140.0, 1140.0, 604.0, 351.0, 215.0, 159.0, 87.0, 68.0, 45.0, 32.0, 28.0, 18.0, 11.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.55810546875, -0.5420608520507812, -0.5260162353515625, -0.5099716186523438, -0.493927001953125, -0.47788238525390625, -0.4618377685546875, -0.44579315185546875, -0.42974853515625, -0.41370391845703125, -0.3976593017578125, -0.38161468505859375, -0.365570068359375, -0.34952545166015625, -0.3334808349609375, -0.31743621826171875, -0.3013916015625, -0.28534698486328125, -0.2693023681640625, -0.25325775146484375, -0.237213134765625, -0.22116851806640625, -0.2051239013671875, -0.18907928466796875, -0.17303466796875, -0.15699005126953125, -0.1409454345703125, -0.12490081787109375, -0.108856201171875, -0.09281158447265625, -0.0767669677734375, -0.06072235107421875, -0.044677734375, -0.02863311767578125, -0.0125885009765625, 0.00345611572265625, 0.019500732421875, 0.03554534912109375, 0.0515899658203125, 0.06763458251953125, 0.08367919921875, 0.09972381591796875, 0.1157684326171875, 0.13181304931640625, 0.147857666015625, 0.16390228271484375, 0.1799468994140625, 0.19599151611328125, 0.2120361328125, 0.22808074951171875, 0.2441253662109375, 0.26016998291015625, 0.276214599609375, 0.29225921630859375, 0.3083038330078125, 0.32434844970703125, 0.34039306640625, 0.35643768310546875, 0.3724822998046875, 0.38852691650390625, 0.404571533203125, 0.42061614990234375, 0.4366607666015625, 0.45270538330078125, 0.46875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 7.0, 6.0, 9.0, 10.0, 12.0, 12.0, 19.0, 22.0, 29.0, 30.0, 28.0, 36.0, 48.0, 58.0, 52.0, 62.0, 67.0, 68.0, 64.0, 55.0, 48.0, 50.0, 33.0, 39.0, 35.0, 19.0, 19.0, 11.0, 8.0, 10.0, 10.0, 7.0, 4.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4384765625, -0.42322540283203125, -0.4079742431640625, -0.39272308349609375, -0.377471923828125, -0.36222076416015625, -0.3469696044921875, -0.33171844482421875, -0.31646728515625, -0.30121612548828125, -0.2859649658203125, -0.27071380615234375, -0.255462646484375, -0.24021148681640625, -0.2249603271484375, -0.20970916748046875, -0.1944580078125, -0.17920684814453125, -0.1639556884765625, -0.14870452880859375, -0.133453369140625, -0.11820220947265625, -0.1029510498046875, -0.08769989013671875, -0.07244873046875, -0.05719757080078125, -0.0419464111328125, -0.02669525146484375, -0.011444091796875, 0.00380706787109375, 0.0190582275390625, 0.03430938720703125, 0.049560546875, 0.06481170654296875, 0.0800628662109375, 0.09531402587890625, 0.110565185546875, 0.12581634521484375, 0.1410675048828125, 0.15631866455078125, 0.17156982421875, 0.18682098388671875, 0.2020721435546875, 0.21732330322265625, 0.232574462890625, 0.24782562255859375, 0.2630767822265625, 0.27832794189453125, 0.2935791015625, 0.30883026123046875, 0.3240814208984375, 0.33933258056640625, 0.354583740234375, 0.36983489990234375, 0.3850860595703125, 0.40033721923828125, 0.41558837890625, 0.43083953857421875, 0.4460906982421875, 0.46134185791015625, 0.476593017578125, 0.49184417724609375, 0.5070953369140625, 0.5223464965820312, 0.53759765625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 13.0, 37.0, 57.0, 124.0, 173.0, 216.0, 170.0, 91.0, 45.0, 28.0, 15.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.201919555664062, -17.713300704956055, -17.224681854248047, -16.73606300354004, -16.24744415283203, -15.75882625579834, -15.270207405090332, -14.781588554382324, -14.292969703674316, -13.804350852966309, -13.3157320022583, -12.82711410522461, -12.338495254516602, -11.849876403808594, -11.361257553100586, -10.872638702392578, -10.38401985168457, -9.895401000976562, -9.406782150268555, -8.918163299560547, -8.429545402526855, -7.940926551818848, -7.45230770111084, -6.963688850402832, -6.475070953369141, -5.986452102661133, -5.497833728790283, -5.009214878082275, -4.520596027374268, -4.031977653503418, -3.54335880279541, -3.0547399520874023, -2.5661211013793945, -2.077502489089966, -1.588883638381958, -1.1002650260925293, -0.611646294593811, -0.12302756309509277, 0.36559104919433594, 0.8542098999023438, 1.3428285121917725, 1.8314472436904907, 2.320065975189209, 2.8086845874786377, 3.2973031997680664, 3.785922050476074, 4.274540901184082, 4.76315975189209, 5.2517781257629395, 5.740396976470947, 6.229015350341797, 6.717634201049805, 7.2062530517578125, 7.69487190246582, 8.183490753173828, 8.672109603881836, 9.160727500915527, 9.649346351623535, 10.137965202331543, 10.626583099365234, 11.115201950073242, 11.60382080078125, 12.092439651489258, 12.581058502197266, 13.069677352905273]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 1.0, 3.0, 8.0, 5.0, 7.0, 8.0, 6.0, 12.0, 11.0, 22.0, 18.0, 21.0, 19.0, 35.0, 33.0, 28.0, 29.0, 32.0, 29.0, 34.0, 37.0, 44.0, 45.0, 37.0, 39.0, 47.0, 47.0, 41.0, 41.0, 37.0, 24.0, 23.0, 31.0, 22.0, 11.0, 23.0, 10.0, 14.0, 13.0, 16.0, 10.0, 4.0, 6.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 1.0], "bins": [-7.130097389221191, -6.913196086883545, -6.696294784545898, -6.479393482208252, -6.2624921798706055, -6.045590400695801, -5.828689098358154, -5.611787796020508, -5.394886493682861, -5.177985191345215, -4.961083889007568, -4.744182586669922, -4.527280807495117, -4.310379981994629, -4.093478202819824, -3.8765769004821777, -3.6596755981445312, -3.4427742958068848, -3.2258729934692383, -3.0089714527130127, -2.792070150375366, -2.5751688480377197, -2.358267307281494, -2.1413660049438477, -1.9244647026062012, -1.7075634002685547, -1.4906619787216187, -1.2737605571746826, -1.0568592548370361, -0.8399579524993896, -0.6230565309524536, -0.4061551094055176, -0.1892533302307129, 0.02764803171157837, 0.24454939365386963, 0.4614507555961609, 0.6783521175384521, 0.8952534198760986, 1.1121548414230347, 1.3290562629699707, 1.5459575653076172, 1.7628588676452637, 1.9797602891921997, 2.1966617107391357, 2.4135630130767822, 2.6304643154144287, 2.8473658561706543, 3.064267158508301, 3.2811684608459473, 3.4980697631835938, 3.7149710655212402, 3.931872606277466, 4.148774147033691, 4.36567497253418, 4.582576751708984, 4.799478054046631, 5.016379356384277, 5.233280658721924, 5.45018196105957, 5.667083263397217, 5.883984565734863, 6.100886344909668, 6.3177876472473145, 6.534688949584961, 6.751590251922607]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 8.0, 6.0, 16.0, 26.0, 27.0, 52.0, 67.0, 140.0, 241.0, 586.0, 1647.0, 8318.0, 4104591.0, 72613.0, 3931.0, 1074.0, 391.0, 208.0, 131.0, 75.0, 37.0, 24.0, 19.0, 15.0, 5.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.390625, -4.271331787109375, -4.15203857421875, -4.032745361328125, -3.9134521484375, -3.794158935546875, -3.67486572265625, -3.555572509765625, -3.436279296875, -3.316986083984375, -3.19769287109375, -3.078399658203125, -2.9591064453125, -2.839813232421875, -2.72052001953125, -2.601226806640625, -2.48193359375, -2.362640380859375, -2.24334716796875, -2.124053955078125, -2.0047607421875, -1.885467529296875, -1.76617431640625, -1.646881103515625, -1.527587890625, -1.408294677734375, -1.28900146484375, -1.169708251953125, -1.0504150390625, -0.931121826171875, -0.81182861328125, -0.692535400390625, -0.5732421875, -0.453948974609375, -0.33465576171875, -0.215362548828125, -0.0960693359375, 0.023223876953125, 0.14251708984375, 0.261810302734375, 0.381103515625, 0.500396728515625, 0.61968994140625, 0.738983154296875, 0.8582763671875, 0.977569580078125, 1.09686279296875, 1.216156005859375, 1.33544921875, 1.454742431640625, 1.57403564453125, 1.693328857421875, 1.8126220703125, 1.931915283203125, 2.05120849609375, 2.170501708984375, 2.289794921875, 2.409088134765625, 2.52838134765625, 2.647674560546875, 2.7669677734375, 2.886260986328125, 3.00555419921875, 3.124847412109375, 3.244140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 8.0, 10.0, 11.0, 12.0, 17.0, 7.0, 30.0, 24.0, 40.0, 36.0, 54.0, 53.0, 66.0, 68.0, 67.0, 72.0, 55.0, 69.0, 58.0, 41.0, 32.0, 27.0, 24.0, 29.0, 27.0, 21.0, 8.0, 7.0, 8.0, 1.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5102920532226562, -0.4956817626953125, -0.48107147216796875, -0.466461181640625, -0.45185089111328125, -0.4372406005859375, -0.42263031005859375, -0.40802001953125, -0.39340972900390625, -0.3787994384765625, -0.36418914794921875, -0.349578857421875, -0.33496856689453125, -0.3203582763671875, -0.30574798583984375, -0.2911376953125, -0.27652740478515625, -0.2619171142578125, -0.24730682373046875, -0.232696533203125, -0.21808624267578125, -0.2034759521484375, -0.18886566162109375, -0.17425537109375, -0.15964508056640625, -0.1450347900390625, -0.13042449951171875, -0.115814208984375, -0.10120391845703125, -0.0865936279296875, -0.07198333740234375, -0.057373046875, -0.04276275634765625, -0.0281524658203125, -0.01354217529296875, 0.001068115234375, 0.01567840576171875, 0.0302886962890625, 0.04489898681640625, 0.05950927734375, 0.07411956787109375, 0.0887298583984375, 0.10334014892578125, 0.117950439453125, 0.13256072998046875, 0.1471710205078125, 0.16178131103515625, 0.1763916015625, 0.19100189208984375, 0.2056121826171875, 0.22022247314453125, 0.234832763671875, 0.24944305419921875, 0.2640533447265625, 0.27866363525390625, 0.29327392578125, 0.30788421630859375, 0.3224945068359375, 0.33710479736328125, 0.351715087890625, 0.36632537841796875, 0.3809356689453125, 0.39554595947265625, 0.41015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 7.0, 16.0, 15.0, 13.0, 26.0, 24.0, 41.0, 41.0, 57.0, 68.0, 105.0, 105.0, 169.0, 262.0, 544.0, 1206.0, 3263.0, 12439.0, 135899.0, 3989635.0, 39826.0, 6603.0, 1938.0, 815.0, 351.0, 225.0, 128.0, 95.0, 76.0, 57.0, 52.0, 38.0, 34.0, 22.0, 20.0, 13.0, 13.0, 5.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.041015625, -1.977813720703125, -1.91461181640625, -1.851409912109375, -1.7882080078125, -1.725006103515625, -1.66180419921875, -1.598602294921875, -1.535400390625, -1.472198486328125, -1.40899658203125, -1.345794677734375, -1.2825927734375, -1.219390869140625, -1.15618896484375, -1.092987060546875, -1.02978515625, -0.966583251953125, -0.90338134765625, -0.840179443359375, -0.7769775390625, -0.713775634765625, -0.65057373046875, -0.587371826171875, -0.524169921875, -0.460968017578125, -0.39776611328125, -0.334564208984375, -0.2713623046875, -0.208160400390625, -0.14495849609375, -0.081756591796875, -0.0185546875, 0.044647216796875, 0.10784912109375, 0.171051025390625, 0.2342529296875, 0.297454833984375, 0.36065673828125, 0.423858642578125, 0.487060546875, 0.550262451171875, 0.61346435546875, 0.676666259765625, 0.7398681640625, 0.803070068359375, 0.86627197265625, 0.929473876953125, 0.99267578125, 1.055877685546875, 1.11907958984375, 1.182281494140625, 1.2454833984375, 1.308685302734375, 1.37188720703125, 1.435089111328125, 1.498291015625, 1.561492919921875, 1.62469482421875, 1.687896728515625, 1.7510986328125, 1.814300537109375, 1.87750244140625, 1.940704345703125, 2.00390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 2.0, 7.0, 10.0, 18.0, 32.0, 71.0, 233.0, 3275.0, 270.0, 77.0, 33.0, 18.0, 9.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30712890625, -0.2946014404296875, -0.282073974609375, -0.2695465087890625, -0.25701904296875, -0.2444915771484375, -0.231964111328125, -0.2194366455078125, -0.2069091796875, -0.1943817138671875, -0.181854248046875, -0.1693267822265625, -0.15679931640625, -0.1442718505859375, -0.131744384765625, -0.1192169189453125, -0.106689453125, -0.0941619873046875, -0.081634521484375, -0.0691070556640625, -0.05657958984375, -0.0440521240234375, -0.031524658203125, -0.0189971923828125, -0.0064697265625, 0.0060577392578125, 0.018585205078125, 0.0311126708984375, 0.04364013671875, 0.0561676025390625, 0.068695068359375, 0.0812225341796875, 0.09375, 0.1062774658203125, 0.118804931640625, 0.1313323974609375, 0.14385986328125, 0.1563873291015625, 0.168914794921875, 0.1814422607421875, 0.1939697265625, 0.2064971923828125, 0.219024658203125, 0.2315521240234375, 0.24407958984375, 0.2566070556640625, 0.269134521484375, 0.2816619873046875, 0.294189453125, 0.3067169189453125, 0.319244384765625, 0.3317718505859375, 0.34429931640625, 0.3568267822265625, 0.369354248046875, 0.3818817138671875, 0.3944091796875, 0.4069366455078125, 0.419464111328125, 0.4319915771484375, 0.44451904296875, 0.4570465087890625, 0.469573974609375, 0.4821014404296875, 0.49462890625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 9.0, 8.0, 19.0, 23.0, 27.0, 41.0, 49.0, 76.0, 88.0, 107.0, 80.0, 102.0, 82.0, 79.0, 51.0, 54.0, 26.0, 23.0, 14.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.655744194984436, -0.6270523071289062, -0.5983604788780212, -0.5696685910224915, -0.5409767627716064, -0.5122848749160767, -0.48359301686286926, -0.45490115880966187, -0.4262092709541321, -0.3975174129009247, -0.3688255548477173, -0.3401336669921875, -0.3114418089389801, -0.2827499508857727, -0.2540580928325653, -0.22536621987819672, -0.1966743767261505, -0.16798251867294312, -0.13929064571857452, -0.11059878766536713, -0.08190692216157913, -0.05321505665779114, -0.02452319860458374, 0.004168674349784851, 0.03286053240299225, 0.06155239790678024, 0.09024426341056824, 0.11893612146377563, 0.14762797951698303, 0.17631985247135162, 0.20501171052455902, 0.2337035834789276, 0.262395441532135, 0.2910872995853424, 0.3197791576385498, 0.3484710454940796, 0.377162903547287, 0.4058547616004944, 0.4345466196537018, 0.4632384777069092, 0.49193036556243896, 0.5206222534179688, 0.5493140816688538, 0.5780059695243835, 0.6066977977752686, 0.6353896856307983, 0.6640815734863281, 0.6927734017372131, 0.7214652299880981, 0.7501571178436279, 0.7788489460945129, 0.8075408339500427, 0.8362326622009277, 0.8649245500564575, 0.8936164379119873, 0.9223082661628723, 0.9510001540184021, 0.9796920418739319, 1.008383870124817, 1.0370757579803467, 1.0657676458358765, 1.0944595336914062, 1.1231513023376465, 1.1518431901931763, 1.180535078048706]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 7.0, 4.0, 5.0, 8.0, 5.0, 14.0, 15.0, 20.0, 17.0, 22.0, 16.0, 24.0, 29.0, 19.0, 33.0, 37.0, 48.0, 31.0, 30.0, 43.0, 39.0, 33.0, 37.0, 54.0, 48.0, 41.0, 25.0, 43.0, 42.0, 36.0, 25.0, 27.0, 24.0, 13.0, 11.0, 10.0, 10.0, 13.0, 8.0, 9.0, 8.0, 5.0, 9.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.539333701133728, -0.5228256583213806, -0.506317675113678, -0.48980966210365295, -0.47330164909362793, -0.4567936360836029, -0.4402856230735779, -0.42377758026123047, -0.40726959705352783, -0.3907615840435028, -0.3742535710334778, -0.35774555802345276, -0.34123754501342773, -0.3247295320034027, -0.3082215189933777, -0.2917134761810303, -0.27520546317100525, -0.2586974501609802, -0.2421894371509552, -0.22568142414093018, -0.20917341113090515, -0.19266539812088013, -0.1761573702096939, -0.15964935719966888, -0.14314134418964386, -0.12663333117961884, -0.11012531816959381, -0.09361729770898819, -0.07710928469896317, -0.06060127168893814, -0.04409325122833252, -0.027585238218307495, -0.01107722520828247, 0.005430789664387703, 0.021938804537057877, 0.0384468212723732, 0.054954834282398224, 0.07146284729242325, 0.08797086775302887, 0.1044788807630539, 0.12098689377307892, 0.13749490678310394, 0.15400291979312897, 0.17051094770431519, 0.1870189607143402, 0.20352697372436523, 0.22003498673439026, 0.23654299974441528, 0.2530510127544403, 0.26955902576446533, 0.28606703877449036, 0.3025750517845154, 0.3190830647945404, 0.33559107780456543, 0.35209912061691284, 0.3686071038246155, 0.3851151466369629, 0.4016231596469879, 0.41813117265701294, 0.43463918566703796, 0.451147198677063, 0.467655211687088, 0.48416322469711304, 0.5006712675094604, 0.5171792507171631]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 7.0, 10.0, 22.0, 21.0, 31.0, 44.0, 98.0, 168.0, 279.0, 562.0, 1235.0, 3231.0, 10478.0, 49377.0, 413206.0, 491427.0, 60219.0, 11823.0, 3518.0, 1387.0, 634.0, 305.0, 172.0, 103.0, 55.0, 39.0, 19.0, 25.0, 12.0, 12.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.279296875, -2.195037841796875, -2.11077880859375, -2.026519775390625, -1.9422607421875, -1.858001708984375, -1.77374267578125, -1.689483642578125, -1.605224609375, -1.520965576171875, -1.43670654296875, -1.352447509765625, -1.2681884765625, -1.183929443359375, -1.09967041015625, -1.015411376953125, -0.93115234375, -0.846893310546875, -0.76263427734375, -0.678375244140625, -0.5941162109375, -0.509857177734375, -0.42559814453125, -0.341339111328125, -0.257080078125, -0.172821044921875, -0.08856201171875, -0.004302978515625, 0.0799560546875, 0.164215087890625, 0.24847412109375, 0.332733154296875, 0.4169921875, 0.501251220703125, 0.58551025390625, 0.669769287109375, 0.7540283203125, 0.838287353515625, 0.92254638671875, 1.006805419921875, 1.091064453125, 1.175323486328125, 1.25958251953125, 1.343841552734375, 1.4281005859375, 1.512359619140625, 1.59661865234375, 1.680877685546875, 1.76513671875, 1.849395751953125, 1.93365478515625, 2.017913818359375, 2.1021728515625, 2.186431884765625, 2.27069091796875, 2.354949951171875, 2.439208984375, 2.523468017578125, 2.60772705078125, 2.691986083984375, 2.7762451171875, 2.860504150390625, 2.94476318359375, 3.029022216796875, 3.11328125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 9.0, 19.0, 22.0, 29.0, 37.0, 24.0, 38.0, 48.0, 52.0, 75.0, 56.0, 67.0, 75.0, 83.0, 82.0, 51.0, 37.0, 29.0, 42.0, 22.0, 22.0, 21.0, 12.0, 13.0, 5.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6474609375, -0.6308135986328125, -0.614166259765625, -0.5975189208984375, -0.58087158203125, -0.5642242431640625, -0.547576904296875, -0.5309295654296875, -0.5142822265625, -0.4976348876953125, -0.480987548828125, -0.4643402099609375, -0.44769287109375, -0.4310455322265625, -0.414398193359375, -0.3977508544921875, -0.381103515625, -0.3644561767578125, -0.347808837890625, -0.3311614990234375, -0.31451416015625, -0.2978668212890625, -0.281219482421875, -0.2645721435546875, -0.2479248046875, -0.2312774658203125, -0.214630126953125, -0.1979827880859375, -0.18133544921875, -0.1646881103515625, -0.148040771484375, -0.1313934326171875, -0.11474609375, -0.0980987548828125, -0.081451416015625, -0.0648040771484375, -0.04815673828125, -0.0315093994140625, -0.014862060546875, 0.0017852783203125, 0.0184326171875, 0.0350799560546875, 0.051727294921875, 0.0683746337890625, 0.08502197265625, 0.1016693115234375, 0.118316650390625, 0.1349639892578125, 0.151611328125, 0.1682586669921875, 0.184906005859375, 0.2015533447265625, 0.21820068359375, 0.2348480224609375, 0.251495361328125, 0.2681427001953125, 0.2847900390625, 0.3014373779296875, 0.318084716796875, 0.3347320556640625, 0.35137939453125, 0.3680267333984375, 0.384674072265625, 0.4013214111328125, 0.41796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 1.0, 2.0, 2.0, 6.0, 8.0, 10.0, 7.0, 19.0, 29.0, 27.0, 39.0, 44.0, 71.0, 95.0, 123.0, 175.0, 289.0, 425.0, 673.0, 1241.0, 2294.0, 4903.0, 10946.0, 27380.0, 77284.0, 249294.0, 433104.0, 155179.0, 50113.0, 18675.0, 7830.0, 3638.0, 1872.0, 979.0, 544.0, 335.0, 247.0, 156.0, 118.0, 87.0, 63.0, 50.0, 45.0, 28.0, 26.0, 18.0, 17.0, 15.0, 12.0, 7.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.9013671875, -0.87060546875, -0.83984375, -0.80908203125, -0.7783203125, -0.74755859375, -0.716796875, -0.68603515625, -0.6552734375, -0.62451171875, -0.59375, -0.56298828125, -0.5322265625, -0.50146484375, -0.470703125, -0.43994140625, -0.4091796875, -0.37841796875, -0.34765625, -0.31689453125, -0.2861328125, -0.25537109375, -0.224609375, -0.19384765625, -0.1630859375, -0.13232421875, -0.1015625, -0.07080078125, -0.0400390625, -0.00927734375, 0.021484375, 0.05224609375, 0.0830078125, 0.11376953125, 0.14453125, 0.17529296875, 0.2060546875, 0.23681640625, 0.267578125, 0.29833984375, 0.3291015625, 0.35986328125, 0.390625, 0.42138671875, 0.4521484375, 0.48291015625, 0.513671875, 0.54443359375, 0.5751953125, 0.60595703125, 0.63671875, 0.66748046875, 0.6982421875, 0.72900390625, 0.759765625, 0.79052734375, 0.8212890625, 0.85205078125, 0.8828125, 0.91357421875, 0.9443359375, 0.97509765625, 1.005859375, 1.03662109375, 1.0673828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 11.0, 11.0, 18.0, 21.0, 21.0, 19.0, 30.0, 21.0, 19.0, 27.0, 35.0, 40.0, 35.0, 56.0, 43.0, 36.0, 35.0, 44.0, 45.0, 52.0, 35.0, 29.0, 33.0, 36.0, 39.0, 16.0, 25.0, 30.0, 22.0, 13.0, 17.0, 17.0, 8.0, 14.0, 11.0, 4.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.865234375, -1.813995361328125, -1.76275634765625, -1.711517333984375, -1.6602783203125, -1.609039306640625, -1.55780029296875, -1.506561279296875, -1.455322265625, -1.404083251953125, -1.35284423828125, -1.301605224609375, -1.2503662109375, -1.199127197265625, -1.14788818359375, -1.096649169921875, -1.04541015625, -0.994171142578125, -0.94293212890625, -0.891693115234375, -0.8404541015625, -0.789215087890625, -0.73797607421875, -0.686737060546875, -0.635498046875, -0.584259033203125, -0.53302001953125, -0.481781005859375, -0.4305419921875, -0.379302978515625, -0.32806396484375, -0.276824951171875, -0.2255859375, -0.174346923828125, -0.12310791015625, -0.071868896484375, -0.0206298828125, 0.030609130859375, 0.08184814453125, 0.133087158203125, 0.184326171875, 0.235565185546875, 0.28680419921875, 0.338043212890625, 0.3892822265625, 0.440521240234375, 0.49176025390625, 0.542999267578125, 0.59423828125, 0.645477294921875, 0.69671630859375, 0.747955322265625, 0.7991943359375, 0.850433349609375, 0.90167236328125, 0.952911376953125, 1.004150390625, 1.055389404296875, 1.10662841796875, 1.157867431640625, 1.2091064453125, 1.260345458984375, 1.31158447265625, 1.362823486328125, 1.4140625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 8.0, 8.0, 13.0, 10.0, 19.0, 23.0, 41.0, 77.0, 93.0, 176.0, 227.0, 524.0, 1079.0, 3111.0, 12088.0, 106646.0, 836521.0, 73166.0, 9938.0, 2670.0, 1001.0, 456.0, 238.0, 154.0, 69.0, 59.0, 36.0, 35.0, 21.0, 11.0, 8.0, 5.0, 7.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2889556884765625, -1.241973876953125, -1.1949920654296875, -1.14801025390625, -1.1010284423828125, -1.054046630859375, -1.0070648193359375, -0.9600830078125, -0.9131011962890625, -0.866119384765625, -0.8191375732421875, -0.77215576171875, -0.7251739501953125, -0.678192138671875, -0.6312103271484375, -0.584228515625, -0.5372467041015625, -0.490264892578125, -0.4432830810546875, -0.39630126953125, -0.3493194580078125, -0.302337646484375, -0.2553558349609375, -0.2083740234375, -0.1613922119140625, -0.114410400390625, -0.0674285888671875, -0.02044677734375, 0.0265350341796875, 0.073516845703125, 0.1204986572265625, 0.16748046875, 0.2144622802734375, 0.261444091796875, 0.3084259033203125, 0.35540771484375, 0.4023895263671875, 0.449371337890625, 0.4963531494140625, 0.5433349609375, 0.5903167724609375, 0.637298583984375, 0.6842803955078125, 0.73126220703125, 0.7782440185546875, 0.825225830078125, 0.8722076416015625, 0.919189453125, 0.9661712646484375, 1.013153076171875, 1.0601348876953125, 1.10711669921875, 1.1540985107421875, 1.201080322265625, 1.2480621337890625, 1.2950439453125, 1.3420257568359375, 1.389007568359375, 1.4359893798828125, 1.48297119140625, 1.5299530029296875, 1.576934814453125, 1.6239166259765625, 1.6708984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 9.0, 13.0, 18.0, 19.0, 36.0, 46.0, 77.0, 99.0, 120.0, 135.0, 118.0, 77.0, 64.0, 39.0, 25.0, 29.0, 22.0, 11.0, 5.0, 1.0, 7.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002149343490600586, -0.00020903907716274261, -0.00020314380526542664, -0.00019724853336811066, -0.00019135326147079468, -0.0001854579895734787, -0.00017956271767616272, -0.00017366744577884674, -0.00016777217388153076, -0.00016187690198421478, -0.0001559816300868988, -0.00015008635818958282, -0.00014419108629226685, -0.00013829581439495087, -0.0001324005424976349, -0.0001265052706003189, -0.00012060999870300293, -0.00011471472680568695, -0.00010881945490837097, -0.00010292418301105499, -9.702891111373901e-05, -9.113363921642303e-05, -8.523836731910706e-05, -7.934309542179108e-05, -7.34478235244751e-05, -6.755255162715912e-05, -6.165727972984314e-05, -5.576200783252716e-05, -4.986673593521118e-05, -4.39714640378952e-05, -3.8076192140579224e-05, -3.2180920243263245e-05, -2.6285648345947266e-05, -2.0390376448631287e-05, -1.4495104551315308e-05, -8.599832653999329e-06, -2.7045607566833496e-06, 3.1907111406326294e-06, 9.085983037948608e-06, 1.4981254935264587e-05, 2.0876526832580566e-05, 2.6771798729896545e-05, 3.2667070627212524e-05, 3.8562342524528503e-05, 4.445761442184448e-05, 5.035288631916046e-05, 5.624815821647644e-05, 6.214343011379242e-05, 6.80387020111084e-05, 7.393397390842438e-05, 7.982924580574036e-05, 8.572451770305634e-05, 9.161978960037231e-05, 9.75150614976883e-05, 0.00010341033339500427, 0.00010930560529232025, 0.00011520087718963623, 0.00012109614908695221, 0.0001269914209842682, 0.00013288669288158417, 0.00013878196477890015, 0.00014467723667621613, 0.0001505725085735321, 0.00015646778047084808, 0.00016236305236816406]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 15.0, 14.0, 19.0, 29.0, 43.0, 64.0, 85.0, 130.0, 216.0, 330.0, 624.0, 1202.0, 2558.0, 6033.0, 19218.0, 97896.0, 676768.0, 198562.0, 29611.0, 8409.0, 3259.0, 1514.0, 769.0, 454.0, 234.0, 147.0, 104.0, 54.0, 40.0, 29.0, 18.0, 17.0, 20.0, 12.0, 8.0, 8.0, 6.0, 3.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1650390625, -1.1314239501953125, -1.097808837890625, -1.0641937255859375, -1.03057861328125, -0.9969635009765625, -0.963348388671875, -0.9297332763671875, -0.8961181640625, -0.8625030517578125, -0.828887939453125, -0.7952728271484375, -0.76165771484375, -0.7280426025390625, -0.694427490234375, -0.6608123779296875, -0.627197265625, -0.5935821533203125, -0.559967041015625, -0.5263519287109375, -0.49273681640625, -0.4591217041015625, -0.425506591796875, -0.3918914794921875, -0.3582763671875, -0.3246612548828125, -0.291046142578125, -0.2574310302734375, -0.22381591796875, -0.1902008056640625, -0.156585693359375, -0.1229705810546875, -0.08935546875, -0.0557403564453125, -0.022125244140625, 0.0114898681640625, 0.04510498046875, 0.0787200927734375, 0.112335205078125, 0.1459503173828125, 0.1795654296875, 0.2131805419921875, 0.246795654296875, 0.2804107666015625, 0.31402587890625, 0.3476409912109375, 0.381256103515625, 0.4148712158203125, 0.448486328125, 0.4821014404296875, 0.515716552734375, 0.5493316650390625, 0.58294677734375, 0.6165618896484375, 0.650177001953125, 0.6837921142578125, 0.7174072265625, 0.7510223388671875, 0.784637451171875, 0.8182525634765625, 0.85186767578125, 0.8854827880859375, 0.919097900390625, 0.9527130126953125, 0.986328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 9.0, 8.0, 12.0, 7.0, 14.0, 13.0, 38.0, 40.0, 61.0, 60.0, 78.0, 94.0, 101.0, 87.0, 78.0, 67.0, 44.0, 37.0, 25.0, 28.0, 17.0, 14.0, 14.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.95361328125, -0.92413330078125, -0.8946533203125, -0.86517333984375, -0.835693359375, -0.80621337890625, -0.7767333984375, -0.74725341796875, -0.7177734375, -0.68829345703125, -0.6588134765625, -0.62933349609375, -0.599853515625, -0.57037353515625, -0.5408935546875, -0.51141357421875, -0.48193359375, -0.45245361328125, -0.4229736328125, -0.39349365234375, -0.364013671875, -0.33453369140625, -0.3050537109375, -0.27557373046875, -0.24609375, -0.21661376953125, -0.1871337890625, -0.15765380859375, -0.128173828125, -0.09869384765625, -0.0692138671875, -0.03973388671875, -0.01025390625, 0.01922607421875, 0.0487060546875, 0.07818603515625, 0.107666015625, 0.13714599609375, 0.1666259765625, 0.19610595703125, 0.2255859375, 0.25506591796875, 0.2845458984375, 0.31402587890625, 0.343505859375, 0.37298583984375, 0.4024658203125, 0.43194580078125, 0.46142578125, 0.49090576171875, 0.5203857421875, 0.54986572265625, 0.579345703125, 0.60882568359375, 0.6383056640625, 0.66778564453125, 0.697265625, 0.72674560546875, 0.7562255859375, 0.78570556640625, 0.815185546875, 0.84466552734375, 0.8741455078125, 0.90362548828125, 0.93310546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 9.0, 16.0, 32.0, 27.0, 51.0, 79.0, 100.0, 103.0, 122.0, 123.0, 98.0, 76.0, 69.0, 41.0, 22.0, 10.0, 5.0, 6.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.934856414794922, -10.563733100891113, -10.192610740661621, -9.821487426757812, -9.450364112854004, -9.079240798950195, -8.708118438720703, -8.336995124816895, -7.965871810913086, -7.5947489738464355, -7.223625659942627, -6.852502822875977, -6.481379508972168, -6.110256671905518, -5.739133834838867, -5.368010520935059, -4.996887683868408, -4.625764846801758, -4.254641532897949, -3.883518695831299, -3.5123953819274902, -3.14127254486084, -2.7701494693756104, -2.399026393890381, -2.0279033184051514, -1.6567802429199219, -1.2856571674346924, -0.9145342111587524, -0.543411135673523, -0.17228806018829346, 0.19883489608764648, 0.569957971572876, 0.9410810470581055, 1.312204122543335, 1.6833271980285645, 2.054450035095215, 2.4255733489990234, 2.796696186065674, 3.1678192615509033, 3.538942337036133, 3.9100654125213623, 4.281188488006592, 4.652311325073242, 5.023434638977051, 5.394557476043701, 5.76568078994751, 6.13680362701416, 6.507926940917969, 6.879049777984619, 7.2501726150512695, 7.621295928955078, 7.9924187660217285, 8.363541603088379, 8.734664916992188, 9.105788230895996, 9.476911544799805, 9.848033905029297, 10.219157218933105, 10.590279579162598, 10.961402893066406, 11.332526206970215, 11.703649520874023, 12.074771881103516, 12.445895195007324, 12.817018508911133]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 8.0, 11.0, 9.0, 12.0, 15.0, 19.0, 19.0, 25.0, 35.0, 34.0, 43.0, 29.0, 46.0, 53.0, 53.0, 34.0, 44.0, 56.0, 51.0, 56.0, 44.0, 39.0, 42.0, 30.0, 36.0, 16.0, 28.0, 22.0, 15.0, 16.0, 8.0, 17.0, 6.0, 7.0, 2.0, 7.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.743335723876953, -9.455294609069824, -9.167252540588379, -8.87921142578125, -8.591169357299805, -8.303128242492676, -8.01508617401123, -7.727045059204102, -7.4390034675598145, -7.150961875915527, -6.86292028427124, -6.574878692626953, -6.286837577819824, -5.998795509338379, -5.71075439453125, -5.422712802886963, -5.134671211242676, -4.846629619598389, -4.558588027954102, -4.2705464363098145, -3.9825050830841064, -3.6944634914398193, -3.4064221382141113, -3.118380546569824, -2.830338954925537, -2.54229736328125, -2.254255771636963, -1.9662144184112549, -1.6781728267669678, -1.3901312351226807, -1.102089762687683, -0.8140482902526855, -0.5260066986083984, -0.2379651665687561, 0.05007636547088623, 0.33811789751052856, 0.6261594295501709, 0.914201021194458, 1.2022424936294556, 1.4902839660644531, 1.7783255577087402, 2.0663671493530273, 2.3544087409973145, 2.6424500942230225, 2.9304916858673096, 3.2185332775115967, 3.5065746307373047, 3.794616222381592, 4.082657814025879, 4.370699405670166, 4.658740997314453, 4.94678258895874, 5.234824180603027, 5.522865295410156, 5.810906887054443, 6.0989484786987305, 6.386990070343018, 6.675031661987305, 6.963073253631592, 7.251114845275879, 7.539155960083008, 7.827198028564453, 8.115239143371582, 8.403280258178711, 8.691322326660156]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 14.0, 27.0, 41.0, 74.0, 104.0, 170.0, 327.0, 663.0, 1457.0, 4272.0, 22699.0, 4056233.0, 95594.0, 8132.0, 2345.0, 999.0, 482.0, 259.0, 147.0, 71.0, 63.0, 31.0, 10.0, 18.0, 12.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.330078125, -3.231353759765625, -3.13262939453125, -3.033905029296875, -2.9351806640625, -2.836456298828125, -2.73773193359375, -2.639007568359375, -2.540283203125, -2.441558837890625, -2.34283447265625, -2.244110107421875, -2.1453857421875, -2.046661376953125, -1.94793701171875, -1.849212646484375, -1.75048828125, -1.651763916015625, -1.55303955078125, -1.454315185546875, -1.3555908203125, -1.256866455078125, -1.15814208984375, -1.059417724609375, -0.960693359375, -0.861968994140625, -0.76324462890625, -0.664520263671875, -0.5657958984375, -0.467071533203125, -0.36834716796875, -0.269622802734375, -0.1708984375, -0.072174072265625, 0.02655029296875, 0.125274658203125, 0.2239990234375, 0.322723388671875, 0.42144775390625, 0.520172119140625, 0.618896484375, 0.717620849609375, 0.81634521484375, 0.915069580078125, 1.0137939453125, 1.112518310546875, 1.21124267578125, 1.309967041015625, 1.40869140625, 1.507415771484375, 1.60614013671875, 1.704864501953125, 1.8035888671875, 1.902313232421875, 2.00103759765625, 2.099761962890625, 2.198486328125, 2.297210693359375, 2.39593505859375, 2.494659423828125, 2.5933837890625, 2.692108154296875, 2.79083251953125, 2.889556884765625, 2.98828125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 12.0, 10.0, 15.0, 10.0, 19.0, 20.0, 32.0, 35.0, 30.0, 42.0, 57.0, 59.0, 69.0, 65.0, 67.0, 47.0, 62.0, 57.0, 54.0, 41.0, 52.0, 18.0, 19.0, 22.0, 19.0, 23.0, 6.0, 8.0, 6.0, 1.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.529296875, -0.5138778686523438, -0.4984588623046875, -0.48303985595703125, -0.467620849609375, -0.45220184326171875, -0.4367828369140625, -0.42136383056640625, -0.40594482421875, -0.39052581787109375, -0.3751068115234375, -0.35968780517578125, -0.344268798828125, -0.32884979248046875, -0.3134307861328125, -0.29801177978515625, -0.2825927734375, -0.26717376708984375, -0.2517547607421875, -0.23633575439453125, -0.220916748046875, -0.20549774169921875, -0.1900787353515625, -0.17465972900390625, -0.15924072265625, -0.14382171630859375, -0.1284027099609375, -0.11298370361328125, -0.097564697265625, -0.08214569091796875, -0.0667266845703125, -0.05130767822265625, -0.035888671875, -0.02046966552734375, -0.0050506591796875, 0.01036834716796875, 0.025787353515625, 0.04120635986328125, 0.0566253662109375, 0.07204437255859375, 0.08746337890625, 0.10288238525390625, 0.1183013916015625, 0.13372039794921875, 0.149139404296875, 0.16455841064453125, 0.1799774169921875, 0.19539642333984375, 0.2108154296875, 0.22623443603515625, 0.2416534423828125, 0.25707244873046875, 0.272491455078125, 0.28791046142578125, 0.3033294677734375, 0.31874847412109375, 0.33416748046875, 0.34958648681640625, 0.3650054931640625, 0.38042449951171875, 0.395843505859375, 0.41126251220703125, 0.4266815185546875, 0.44210052490234375, 0.45751953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 9.0, 6.0, 10.0, 10.0, 12.0, 24.0, 40.0, 44.0, 62.0, 75.0, 123.0, 169.0, 279.0, 345.0, 518.0, 810.0, 1289.0, 2243.0, 5131.0, 18946.0, 369307.0, 3750127.0, 30601.0, 6843.0, 2876.0, 1478.0, 924.0, 624.0, 399.0, 273.0, 210.0, 135.0, 82.0, 75.0, 47.0, 30.0, 32.0, 15.0, 23.0, 9.0, 7.0, 4.0, 3.0, 5.0, 0.0, 0.0, 2.0], "bins": [-4.0390625, -3.933135986328125, -3.82720947265625, -3.721282958984375, -3.6153564453125, -3.509429931640625, -3.40350341796875, -3.297576904296875, -3.191650390625, -3.085723876953125, -2.97979736328125, -2.873870849609375, -2.7679443359375, -2.662017822265625, -2.55609130859375, -2.450164794921875, -2.34423828125, -2.238311767578125, -2.13238525390625, -2.026458740234375, -1.9205322265625, -1.814605712890625, -1.70867919921875, -1.602752685546875, -1.496826171875, -1.390899658203125, -1.28497314453125, -1.179046630859375, -1.0731201171875, -0.967193603515625, -0.86126708984375, -0.755340576171875, -0.6494140625, -0.543487548828125, -0.43756103515625, -0.331634521484375, -0.2257080078125, -0.119781494140625, -0.01385498046875, 0.092071533203125, 0.197998046875, 0.303924560546875, 0.40985107421875, 0.515777587890625, 0.6217041015625, 0.727630615234375, 0.83355712890625, 0.939483642578125, 1.04541015625, 1.151336669921875, 1.25726318359375, 1.363189697265625, 1.4691162109375, 1.575042724609375, 1.68096923828125, 1.786895751953125, 1.892822265625, 1.998748779296875, 2.10467529296875, 2.210601806640625, 2.3165283203125, 2.422454833984375, 2.52838134765625, 2.634307861328125, 2.740234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 6.0, 12.0, 19.0, 31.0, 55.0, 144.0, 737.0, 2718.0, 199.0, 60.0, 27.0, 11.0, 15.0, 9.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54052734375, -0.5161514282226562, -0.4917755126953125, -0.46739959716796875, -0.443023681640625, -0.41864776611328125, -0.3942718505859375, -0.36989593505859375, -0.34552001953125, -0.32114410400390625, -0.2967681884765625, -0.27239227294921875, -0.248016357421875, -0.22364044189453125, -0.1992645263671875, -0.17488861083984375, -0.1505126953125, -0.12613677978515625, -0.1017608642578125, -0.07738494873046875, -0.053009033203125, -0.02863311767578125, -0.0042572021484375, 0.02011871337890625, 0.04449462890625, 0.06887054443359375, 0.0932464599609375, 0.11762237548828125, 0.141998291015625, 0.16637420654296875, 0.1907501220703125, 0.21512603759765625, 0.239501953125, 0.26387786865234375, 0.2882537841796875, 0.31262969970703125, 0.337005615234375, 0.36138153076171875, 0.3857574462890625, 0.41013336181640625, 0.43450927734375, 0.45888519287109375, 0.4832611083984375, 0.5076370239257812, 0.532012939453125, 0.5563888549804688, 0.5807647705078125, 0.6051406860351562, 0.6295166015625, 0.6538925170898438, 0.6782684326171875, 0.7026443481445312, 0.727020263671875, 0.7513961791992188, 0.7757720947265625, 0.8001480102539062, 0.82452392578125, 0.8488998413085938, 0.8732757568359375, 0.8976516723632812, 0.922027587890625, 0.9464035034179688, 0.9707794189453125, 0.9951553344726562, 1.01953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 11.0, 12.0, 23.0, 31.0, 53.0, 100.0, 159.0, 184.0, 130.0, 104.0, 57.0, 42.0, 24.0, 19.0, 16.0, 5.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.534883499145508, -4.373327255249023, -4.211770534515381, -4.0502142906188965, -3.888657808303833, -3.7271013259887695, -3.565545082092285, -3.4039885997772217, -3.242432117462158, -3.0808756351470947, -2.9193191528320312, -2.757762908935547, -2.5962064266204834, -2.43464994430542, -2.2730937004089355, -2.111537218093872, -1.9499807357788086, -1.7884242534637451, -1.6268678903579712, -1.4653115272521973, -1.3037550449371338, -1.1421985626220703, -0.9806421995162964, -0.8190858364105225, -0.657529354095459, -0.4959729313850403, -0.3344165086746216, -0.17286008596420288, -0.01130366325378418, 0.15025275945663452, 0.3118091821670532, 0.47336554527282715, 0.6349220275878906, 0.7964784502983093, 0.958034873008728, 1.119591236114502, 1.2811477184295654, 1.442704200744629, 1.6042605638504028, 1.7658169269561768, 1.9273734092712402, 2.0889298915863037, 2.250486373901367, 2.4120426177978516, 2.573599100112915, 2.7351555824279785, 2.896711826324463, 3.0582683086395264, 3.21982479095459, 3.3813812732696533, 3.542937755584717, 3.704493999481201, 3.8660504817962646, 4.027606964111328, 4.1891632080078125, 4.350719451904297, 4.5122761726379395, 4.673832416534424, 4.835389137268066, 4.996945381164551, 5.158501625061035, 5.320058345794678, 5.481614589691162, 5.643171310424805, 5.804727554321289]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 9.0, 14.0, 17.0, 10.0, 15.0, 20.0, 19.0, 16.0, 27.0, 30.0, 27.0, 33.0, 33.0, 41.0, 37.0, 30.0, 32.0, 47.0, 36.0, 44.0, 39.0, 37.0, 32.0, 31.0, 36.0, 35.0, 36.0, 35.0, 21.0, 18.0, 23.0, 12.0, 16.0, 12.0, 14.0, 13.0, 7.0, 9.0, 4.0, 6.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.083937406539917, -2.0216033458709717, -1.959269404411316, -1.8969354629516602, -1.8346015214920044, -1.7722675800323486, -1.7099335193634033, -1.6475995779037476, -1.5852656364440918, -1.522931694984436, -1.4605976343154907, -1.398263692855835, -1.3359297513961792, -1.2735958099365234, -1.2112617492675781, -1.1489278078079224, -1.0865938663482666, -1.0242599248886108, -0.9619259238243103, -0.8995919227600098, -0.837257981300354, -0.7749239802360535, -0.7125899791717529, -0.6502560377120972, -0.5879219770431519, -0.5255879759788513, -0.46325403451919556, -0.400920033454895, -0.33858609199523926, -0.2762520909309387, -0.21391811966896057, -0.15158414840698242, -0.08925020694732666, -0.026916231960058212, 0.035417743027210236, 0.09775172173976898, 0.16008569300174713, 0.22241967916488647, 0.2847536504268646, 0.3470876216888428, 0.4094215929508209, 0.4717555642127991, 0.5340895652770996, 0.5964235067367554, 0.6587575078010559, 0.7210915088653564, 0.7834254503250122, 0.845759391784668, 0.9080933928489685, 0.970427393913269, 1.0327613353729248, 1.0950952768325806, 1.1574293375015259, 1.2197632789611816, 1.2820972204208374, 1.3444311618804932, 1.4067652225494385, 1.4690991640090942, 1.5314332246780396, 1.5937671661376953, 1.656101107597351, 1.7184350490570068, 1.7807691097259521, 1.843103051185608, 1.9054369926452637]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 5.0, 16.0, 15.0, 34.0, 39.0, 56.0, 98.0, 169.0, 379.0, 980.0, 2652.0, 10109.0, 51604.0, 380506.0, 508559.0, 74695.0, 13139.0, 3363.0, 1187.0, 451.0, 207.0, 106.0, 74.0, 34.0, 21.0, 22.0, 9.0, 10.0, 8.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.212890625, -2.146026611328125, -2.07916259765625, -2.012298583984375, -1.9454345703125, -1.878570556640625, -1.81170654296875, -1.744842529296875, -1.677978515625, -1.611114501953125, -1.54425048828125, -1.477386474609375, -1.4105224609375, -1.343658447265625, -1.27679443359375, -1.209930419921875, -1.14306640625, -1.076202392578125, -1.00933837890625, -0.942474365234375, -0.8756103515625, -0.808746337890625, -0.74188232421875, -0.675018310546875, -0.608154296875, -0.541290283203125, -0.47442626953125, -0.407562255859375, -0.3406982421875, -0.273834228515625, -0.20697021484375, -0.140106201171875, -0.0732421875, -0.006378173828125, 0.06048583984375, 0.127349853515625, 0.1942138671875, 0.261077880859375, 0.32794189453125, 0.394805908203125, 0.461669921875, 0.528533935546875, 0.59539794921875, 0.662261962890625, 0.7291259765625, 0.795989990234375, 0.86285400390625, 0.929718017578125, 0.99658203125, 1.063446044921875, 1.13031005859375, 1.197174072265625, 1.2640380859375, 1.330902099609375, 1.39776611328125, 1.464630126953125, 1.531494140625, 1.598358154296875, 1.66522216796875, 1.732086181640625, 1.7989501953125, 1.865814208984375, 1.93267822265625, 1.999542236328125, 2.06640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 10.0, 17.0, 13.0, 18.0, 18.0, 32.0, 35.0, 40.0, 30.0, 57.0, 50.0, 57.0, 60.0, 54.0, 64.0, 55.0, 43.0, 52.0, 36.0, 41.0, 37.0, 22.0, 38.0, 21.0, 22.0, 11.0, 20.0, 8.0, 8.0, 9.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.56884765625, -0.5492706298828125, -0.529693603515625, -0.5101165771484375, -0.49053955078125, -0.4709625244140625, -0.451385498046875, -0.4318084716796875, -0.4122314453125, -0.3926544189453125, -0.373077392578125, -0.3535003662109375, -0.33392333984375, -0.3143463134765625, -0.294769287109375, -0.2751922607421875, -0.255615234375, -0.2360382080078125, -0.216461181640625, -0.1968841552734375, -0.17730712890625, -0.1577301025390625, -0.138153076171875, -0.1185760498046875, -0.0989990234375, -0.0794219970703125, -0.059844970703125, -0.0402679443359375, -0.02069091796875, -0.0011138916015625, 0.018463134765625, 0.0380401611328125, 0.0576171875, 0.0771942138671875, 0.096771240234375, 0.1163482666015625, 0.13592529296875, 0.1555023193359375, 0.175079345703125, 0.1946563720703125, 0.2142333984375, 0.2338104248046875, 0.253387451171875, 0.2729644775390625, 0.29254150390625, 0.3121185302734375, 0.331695556640625, 0.3512725830078125, 0.370849609375, 0.3904266357421875, 0.410003662109375, 0.4295806884765625, 0.44915771484375, 0.4687347412109375, 0.488311767578125, 0.5078887939453125, 0.5274658203125, 0.5470428466796875, 0.566619873046875, 0.5861968994140625, 0.60577392578125, 0.6253509521484375, 0.644927978515625, 0.6645050048828125, 0.68408203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 13.0, 26.0, 36.0, 53.0, 112.0, 240.0, 476.0, 1457.0, 9876.0, 466220.0, 556375.0, 11175.0, 1547.0, 469.0, 223.0, 111.0, 55.0, 29.0, 24.0, 17.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.761566162109375, -2.59930419921875, -2.437042236328125, -2.2747802734375, -2.112518310546875, -1.95025634765625, -1.787994384765625, -1.625732421875, -1.463470458984375, -1.30120849609375, -1.138946533203125, -0.9766845703125, -0.814422607421875, -0.65216064453125, -0.489898681640625, -0.32763671875, -0.165374755859375, -0.00311279296875, 0.159149169921875, 0.3214111328125, 0.483673095703125, 0.64593505859375, 0.808197021484375, 0.970458984375, 1.132720947265625, 1.29498291015625, 1.457244873046875, 1.6195068359375, 1.781768798828125, 1.94403076171875, 2.106292724609375, 2.2685546875, 2.430816650390625, 2.59307861328125, 2.755340576171875, 2.9176025390625, 3.079864501953125, 3.24212646484375, 3.404388427734375, 3.566650390625, 3.728912353515625, 3.89117431640625, 4.053436279296875, 4.2156982421875, 4.377960205078125, 4.54022216796875, 4.702484130859375, 4.86474609375, 5.027008056640625, 5.18927001953125, 5.351531982421875, 5.5137939453125, 5.676055908203125, 5.83831787109375, 6.000579833984375, 6.162841796875, 6.325103759765625, 6.48736572265625, 6.649627685546875, 6.8118896484375, 6.974151611328125, 7.13641357421875, 7.298675537109375, 7.4609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 2.0, 4.0, 8.0, 13.0, 15.0, 20.0, 22.0, 23.0, 30.0, 42.0, 49.0, 43.0, 38.0, 57.0, 44.0, 65.0, 58.0, 50.0, 58.0, 43.0, 42.0, 33.0, 43.0, 32.0, 41.0, 23.0, 19.0, 22.0, 13.0, 8.0, 7.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.06640625, -2.969482421875, -2.87255859375, -2.775634765625, -2.6787109375, -2.581787109375, -2.48486328125, -2.387939453125, -2.291015625, -2.194091796875, -2.09716796875, -2.000244140625, -1.9033203125, -1.806396484375, -1.70947265625, -1.612548828125, -1.515625, -1.418701171875, -1.32177734375, -1.224853515625, -1.1279296875, -1.031005859375, -0.93408203125, -0.837158203125, -0.740234375, -0.643310546875, -0.54638671875, -0.449462890625, -0.3525390625, -0.255615234375, -0.15869140625, -0.061767578125, 0.03515625, 0.132080078125, 0.22900390625, 0.325927734375, 0.4228515625, 0.519775390625, 0.61669921875, 0.713623046875, 0.810546875, 0.907470703125, 1.00439453125, 1.101318359375, 1.1982421875, 1.295166015625, 1.39208984375, 1.489013671875, 1.5859375, 1.682861328125, 1.77978515625, 1.876708984375, 1.9736328125, 2.070556640625, 2.16748046875, 2.264404296875, 2.361328125, 2.458251953125, 2.55517578125, 2.652099609375, 2.7490234375, 2.845947265625, 2.94287109375, 3.039794921875, 3.13671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 16.0, 13.0, 30.0, 32.0, 60.0, 92.0, 154.0, 276.0, 651.0, 1552.0, 5613.0, 39073.0, 792539.0, 190972.0, 12812.0, 2780.0, 920.0, 442.0, 197.0, 100.0, 73.0, 52.0, 26.0, 25.0, 13.0, 11.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.033203125, -1.97296142578125, -1.9127197265625, -1.85247802734375, -1.792236328125, -1.73199462890625, -1.6717529296875, -1.61151123046875, -1.55126953125, -1.49102783203125, -1.4307861328125, -1.37054443359375, -1.310302734375, -1.25006103515625, -1.1898193359375, -1.12957763671875, -1.0693359375, -1.00909423828125, -0.9488525390625, -0.88861083984375, -0.828369140625, -0.76812744140625, -0.7078857421875, -0.64764404296875, -0.58740234375, -0.52716064453125, -0.4669189453125, -0.40667724609375, -0.346435546875, -0.28619384765625, -0.2259521484375, -0.16571044921875, -0.10546875, -0.04522705078125, 0.0150146484375, 0.07525634765625, 0.135498046875, 0.19573974609375, 0.2559814453125, 0.31622314453125, 0.37646484375, 0.43670654296875, 0.4969482421875, 0.55718994140625, 0.617431640625, 0.67767333984375, 0.7379150390625, 0.79815673828125, 0.8583984375, 0.91864013671875, 0.9788818359375, 1.03912353515625, 1.099365234375, 1.15960693359375, 1.2198486328125, 1.28009033203125, 1.34033203125, 1.40057373046875, 1.4608154296875, 1.52105712890625, 1.581298828125, 1.64154052734375, 1.7017822265625, 1.76202392578125, 1.822265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 4.0, 4.0, 9.0, 6.0, 7.0, 16.0, 13.0, 23.0, 19.0, 34.0, 43.0, 64.0, 71.0, 85.0, 96.0, 104.0, 97.0, 70.0, 49.0, 53.0, 26.0, 21.0, 16.0, 5.0, 10.0, 5.0, 6.0, 8.0, 2.0, 5.0, 8.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017321109771728516, -0.00016699917614459991, -0.00016078725457191467, -0.00015457533299922943, -0.0001483634114265442, -0.00014215148985385895, -0.0001359395682811737, -0.00012972764670848846, -0.00012351572513580322, -0.00011730380356311798, -0.00011109188199043274, -0.0001048799604177475, -9.866803884506226e-05, -9.245611727237701e-05, -8.624419569969177e-05, -8.003227412700653e-05, -7.382035255432129e-05, -6.760843098163605e-05, -6.13965094089508e-05, -5.5184587836265564e-05, -4.897266626358032e-05, -4.276074469089508e-05, -3.654882311820984e-05, -3.0336901545524597e-05, -2.4124979972839355e-05, -1.7913058400154114e-05, -1.1701136827468872e-05, -5.48921525478363e-06, 7.227063179016113e-07, 6.934627890586853e-06, 1.3146549463272095e-05, 1.9358471035957336e-05, 2.5570392608642578e-05, 3.178231418132782e-05, 3.799423575401306e-05, 4.42061573266983e-05, 5.0418078899383545e-05, 5.663000047206879e-05, 6.284192204475403e-05, 6.905384361743927e-05, 7.526576519012451e-05, 8.147768676280975e-05, 8.7689608335495e-05, 9.390152990818024e-05, 0.00010011345148086548, 0.00010632537305355072, 0.00011253729462623596, 0.0001187492161989212, 0.00012496113777160645, 0.0001311730593442917, 0.00013738498091697693, 0.00014359690248966217, 0.0001498088240623474, 0.00015602074563503265, 0.0001622326672077179, 0.00016844458878040314, 0.00017465651035308838, 0.00018086843192577362, 0.00018708035349845886, 0.0001932922750711441, 0.00019950419664382935, 0.0002057161182165146, 0.00021192803978919983, 0.00021813996136188507, 0.0002243518829345703]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 6.0, 12.0, 13.0, 14.0, 16.0, 43.0, 89.0, 140.0, 260.0, 560.0, 1670.0, 9561.0, 483700.0, 539474.0, 10019.0, 1799.0, 569.0, 278.0, 130.0, 79.0, 35.0, 20.0, 23.0, 14.0, 7.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.130859375, -2.0421142578125, -1.953369140625, -1.8646240234375, -1.77587890625, -1.6871337890625, -1.598388671875, -1.5096435546875, -1.4208984375, -1.3321533203125, -1.243408203125, -1.1546630859375, -1.06591796875, -0.9771728515625, -0.888427734375, -0.7996826171875, -0.7109375, -0.6221923828125, -0.533447265625, -0.4447021484375, -0.35595703125, -0.2672119140625, -0.178466796875, -0.0897216796875, -0.0009765625, 0.0877685546875, 0.176513671875, 0.2652587890625, 0.35400390625, 0.4427490234375, 0.531494140625, 0.6202392578125, 0.708984375, 0.7977294921875, 0.886474609375, 0.9752197265625, 1.06396484375, 1.1527099609375, 1.241455078125, 1.3302001953125, 1.4189453125, 1.5076904296875, 1.596435546875, 1.6851806640625, 1.77392578125, 1.8626708984375, 1.951416015625, 2.0401611328125, 2.12890625, 2.2176513671875, 2.306396484375, 2.3951416015625, 2.48388671875, 2.5726318359375, 2.661376953125, 2.7501220703125, 2.8388671875, 2.9276123046875, 3.016357421875, 3.1051025390625, 3.19384765625, 3.2825927734375, 3.371337890625, 3.4600830078125, 3.548828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 13.0, 8.0, 19.0, 41.0, 76.0, 127.0, 165.0, 190.0, 151.0, 84.0, 63.0, 26.0, 12.0, 13.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.4765625, -3.4074172973632812, -3.3382720947265625, -3.2691268920898438, -3.199981689453125, -3.1308364868164062, -3.0616912841796875, -2.9925460815429688, -2.92340087890625, -2.8542556762695312, -2.7851104736328125, -2.7159652709960938, -2.646820068359375, -2.5776748657226562, -2.5085296630859375, -2.4393844604492188, -2.3702392578125, -2.3010940551757812, -2.2319488525390625, -2.1628036499023438, -2.093658447265625, -2.0245132446289062, -1.9553680419921875, -1.8862228393554688, -1.81707763671875, -1.7479324340820312, -1.6787872314453125, -1.6096420288085938, -1.540496826171875, -1.4713516235351562, -1.4022064208984375, -1.3330612182617188, -1.263916015625, -1.1947708129882812, -1.1256256103515625, -1.0564804077148438, -0.987335205078125, -0.9181900024414062, -0.8490447998046875, -0.7798995971679688, -0.71075439453125, -0.6416091918945312, -0.5724639892578125, -0.5033187866210938, -0.434173583984375, -0.36502838134765625, -0.2958831787109375, -0.22673797607421875, -0.1575927734375, -0.08844757080078125, -0.0193023681640625, 0.04984283447265625, 0.118988037109375, 0.18813323974609375, 0.2572784423828125, 0.32642364501953125, 0.39556884765625, 0.46471405029296875, 0.5338592529296875, 0.6030044555664062, 0.672149658203125, 0.7412948608398438, 0.8104400634765625, 0.8795852661132812, 0.94873046875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 13.0, 34.0, 74.0, 180.0, 286.0, 231.0, 122.0, 36.0, 12.0, 12.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.703693389892578, -15.476158142089844, -14.248623847961426, -13.021089553833008, -11.793554306030273, -10.566019058227539, -9.338484764099121, -8.110950469970703, -6.883415222167969, -5.655880451202393, -4.428345680236816, -3.2008109092712402, -1.973276138305664, -0.7457413673400879, 0.4817934036254883, 1.7093276977539062, 2.9368629455566406, 4.164397716522217, 5.391932487487793, 6.619467258453369, 7.847002029418945, 9.07453727722168, 10.302071571350098, 11.529605865478516, 12.75714111328125, 13.984676361083984, 15.212210655212402, 16.43974494934082, 17.667280197143555, 18.89481544494629, 20.12234878540039, 21.349884033203125, 22.577415466308594, 23.804950714111328, 25.032485961914062, 26.260019302368164, 27.4875545501709, 28.715089797973633, 29.942623138427734, 31.17015838623047, 32.3976936340332, 33.62522888183594, 34.85276412963867, 36.080299377441406, 37.307830810546875, 38.53536605834961, 39.762901306152344, 40.99043655395508, 42.21797180175781, 43.44550704956055, 44.67304229736328, 45.900577545166016, 47.12811279296875, 48.35564422607422, 49.58317947387695, 50.81071472167969, 52.03824996948242, 53.265785217285156, 54.49332046508789, 55.720855712890625, 56.948387145996094, 58.17592239379883, 59.40345764160156, 60.6309928894043, 61.85852813720703]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 9.0, 13.0, 22.0, 21.0, 19.0, 21.0, 35.0, 35.0, 29.0, 47.0, 55.0, 71.0, 53.0, 70.0, 53.0, 75.0, 52.0, 47.0, 47.0, 49.0, 32.0, 29.0, 17.0, 15.0, 16.0, 14.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.874217987060547, -18.343677520751953, -17.813138961791992, -17.2825984954834, -16.752058029174805, -16.221519470214844, -15.69097900390625, -15.160439491271973, -14.629899978637695, -14.099360466003418, -13.568819999694824, -13.038280487060547, -12.50774097442627, -11.977201461791992, -11.446660995483398, -10.916121482849121, -10.385581016540527, -9.85504150390625, -9.324501037597656, -8.793961524963379, -8.263422012329102, -7.732882022857666, -7.2023420333862305, -6.671802520751953, -6.141262531280518, -5.610722541809082, -5.080183029174805, -4.549643039703369, -4.019103050231934, -3.4885635375976562, -2.9580235481262207, -2.4274837970733643, -1.8969440460205078, -1.3664042949676514, -0.8358644247055054, -0.3053245544433594, 0.22521519660949707, 0.7557549476623535, 1.286294937133789, 1.8168346881866455, 2.347374439239502, 2.8779141902923584, 3.408453941345215, 3.9389939308166504, 4.469533920288086, 5.000073432922363, 5.530613422393799, 6.061153411865234, 6.591692924499512, 7.122232913970947, 7.652772426605225, 8.18331241607666, 8.713851928710938, 9.244392395019531, 9.774931907653809, 10.305471420288086, 10.83601188659668, 11.366551399230957, 11.89709186553955, 12.427631378173828, 12.958170890808105, 13.488710403442383, 14.019250869750977, 14.549790382385254, 15.080329895019531]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 7.0, 9.0, 12.0, 10.0, 25.0, 36.0, 37.0, 64.0, 76.0, 125.0, 161.0, 311.0, 541.0, 1045.0, 2609.0, 9764.0, 304368.0, 3857752.0, 11778.0, 2905.0, 1116.0, 563.0, 315.0, 220.0, 144.0, 82.0, 58.0, 35.0, 36.0, 27.0, 11.0, 9.0, 5.0, 9.0, 4.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.896484375, -1.823699951171875, -1.75091552734375, -1.678131103515625, -1.6053466796875, -1.532562255859375, -1.45977783203125, -1.386993408203125, -1.314208984375, -1.241424560546875, -1.16864013671875, -1.095855712890625, -1.0230712890625, -0.950286865234375, -0.87750244140625, -0.804718017578125, -0.73193359375, -0.659149169921875, -0.58636474609375, -0.513580322265625, -0.4407958984375, -0.368011474609375, -0.29522705078125, -0.222442626953125, -0.149658203125, -0.076873779296875, -0.00408935546875, 0.068695068359375, 0.1414794921875, 0.214263916015625, 0.28704833984375, 0.359832763671875, 0.4326171875, 0.505401611328125, 0.57818603515625, 0.650970458984375, 0.7237548828125, 0.796539306640625, 0.86932373046875, 0.942108154296875, 1.014892578125, 1.087677001953125, 1.16046142578125, 1.233245849609375, 1.3060302734375, 1.378814697265625, 1.45159912109375, 1.524383544921875, 1.59716796875, 1.669952392578125, 1.74273681640625, 1.815521240234375, 1.8883056640625, 1.961090087890625, 2.03387451171875, 2.106658935546875, 2.179443359375, 2.252227783203125, 2.32501220703125, 2.397796630859375, 2.4705810546875, 2.543365478515625, 2.61614990234375, 2.688934326171875, 2.76171875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 13.0, 7.0, 19.0, 27.0, 21.0, 29.0, 46.0, 67.0, 65.0, 67.0, 71.0, 62.0, 82.0, 71.0, 61.0, 54.0, 54.0, 40.0, 40.0, 21.0, 13.0, 12.0, 14.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8837890625, -0.8555984497070312, -0.8274078369140625, -0.7992172241210938, -0.771026611328125, -0.7428359985351562, -0.7146453857421875, -0.6864547729492188, -0.65826416015625, -0.6300735473632812, -0.6018829345703125, -0.5736923217773438, -0.545501708984375, -0.5173110961914062, -0.4891204833984375, -0.46092987060546875, -0.4327392578125, -0.40454864501953125, -0.3763580322265625, -0.34816741943359375, -0.319976806640625, -0.29178619384765625, -0.2635955810546875, -0.23540496826171875, -0.20721435546875, -0.17902374267578125, -0.1508331298828125, -0.12264251708984375, -0.094451904296875, -0.06626129150390625, -0.0380706787109375, -0.00988006591796875, 0.018310546875, 0.04650115966796875, 0.0746917724609375, 0.10288238525390625, 0.131072998046875, 0.15926361083984375, 0.1874542236328125, 0.21564483642578125, 0.24383544921875, 0.27202606201171875, 0.3002166748046875, 0.32840728759765625, 0.356597900390625, 0.38478851318359375, 0.4129791259765625, 0.44116973876953125, 0.4693603515625, 0.49755096435546875, 0.5257415771484375, 0.5539321899414062, 0.582122802734375, 0.6103134155273438, 0.6385040283203125, 0.6666946411132812, 0.69488525390625, 0.7230758666992188, 0.7512664794921875, 0.7794570922851562, 0.807647705078125, 0.8358383178710938, 0.8640289306640625, 0.8922195434570312, 0.92041015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 11.0, 8.0, 10.0, 16.0, 21.0, 22.0, 33.0, 22.0, 34.0, 51.0, 66.0, 103.0, 138.0, 251.0, 483.0, 914.0, 1985.0, 5531.0, 25656.0, 3917987.0, 219870.0, 13881.0, 3851.0, 1481.0, 722.0, 391.0, 211.0, 138.0, 103.0, 55.0, 51.0, 34.0, 29.0, 26.0, 24.0, 15.0, 13.0, 11.0, 9.0, 5.0, 5.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.845703125, -2.756317138671875, -2.66693115234375, -2.577545166015625, -2.4881591796875, -2.398773193359375, -2.30938720703125, -2.220001220703125, -2.130615234375, -2.041229248046875, -1.95184326171875, -1.862457275390625, -1.7730712890625, -1.683685302734375, -1.59429931640625, -1.504913330078125, -1.41552734375, -1.326141357421875, -1.23675537109375, -1.147369384765625, -1.0579833984375, -0.968597412109375, -0.87921142578125, -0.789825439453125, -0.700439453125, -0.611053466796875, -0.52166748046875, -0.432281494140625, -0.3428955078125, -0.253509521484375, -0.16412353515625, -0.074737548828125, 0.0146484375, 0.104034423828125, 0.19342041015625, 0.282806396484375, 0.3721923828125, 0.461578369140625, 0.55096435546875, 0.640350341796875, 0.729736328125, 0.819122314453125, 0.90850830078125, 0.997894287109375, 1.0872802734375, 1.176666259765625, 1.26605224609375, 1.355438232421875, 1.44482421875, 1.534210205078125, 1.62359619140625, 1.712982177734375, 1.8023681640625, 1.891754150390625, 1.98114013671875, 2.070526123046875, 2.159912109375, 2.249298095703125, 2.33868408203125, 2.428070068359375, 2.5174560546875, 2.606842041015625, 2.69622802734375, 2.785614013671875, 2.875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 6.0, 19.0, 26.0, 92.0, 497.0, 3242.0, 112.0, 41.0, 14.0, 15.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8322677612304688, -0.8046722412109375, -0.7770767211914062, -0.749481201171875, -0.7218856811523438, -0.6942901611328125, -0.6666946411132812, -0.63909912109375, -0.6115036010742188, -0.5839080810546875, -0.5563125610351562, -0.528717041015625, -0.5011215209960938, -0.4735260009765625, -0.44593048095703125, -0.4183349609375, -0.39073944091796875, -0.3631439208984375, -0.33554840087890625, -0.307952880859375, -0.28035736083984375, -0.2527618408203125, -0.22516632080078125, -0.19757080078125, -0.16997528076171875, -0.1423797607421875, -0.11478424072265625, -0.087188720703125, -0.05959320068359375, -0.0319976806640625, -0.00440216064453125, 0.023193359375, 0.05078887939453125, 0.0783843994140625, 0.10597991943359375, 0.133575439453125, 0.16117095947265625, 0.1887664794921875, 0.21636199951171875, 0.24395751953125, 0.27155303955078125, 0.2991485595703125, 0.32674407958984375, 0.354339599609375, 0.38193511962890625, 0.4095306396484375, 0.43712615966796875, 0.4647216796875, 0.49231719970703125, 0.5199127197265625, 0.5475082397460938, 0.575103759765625, 0.6026992797851562, 0.6302947998046875, 0.6578903198242188, 0.68548583984375, 0.7130813598632812, 0.7406768798828125, 0.7682723999023438, 0.795867919921875, 0.8234634399414062, 0.8510589599609375, 0.8786544799804688, 0.90625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 13.0, 28.0, 38.0, 57.0, 103.0, 162.0, 177.0, 158.0, 119.0, 56.0, 27.0, 14.0, 14.0, 10.0, 7.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.837955951690674, -2.7528116703033447, -2.6676676273345947, -2.5825233459472656, -2.4973790645599365, -2.4122347831726074, -2.3270907402038574, -2.2419464588165283, -2.156802177429199, -2.07165789604187, -1.9865137338638306, -1.901369571685791, -1.816225290298462, -1.7310811281204224, -1.6459369659423828, -1.5607926845550537, -1.4756485223770142, -1.3905043601989746, -1.3053600788116455, -1.220215916633606, -1.1350716352462769, -1.0499274730682373, -0.964783251285553, -0.8796390295028687, -0.7944948077201843, -0.7093505859375, -0.6242063641548157, -0.5390621423721313, -0.4539179503917694, -0.3687737286090851, -0.28362953662872314, -0.19848531484603882, -0.11334109306335449, -0.028196878731250763, 0.056947335600852966, 0.1420915424823761, 0.22723576426506042, 0.31237998604774475, 0.3975241780281067, 0.482668399810791, 0.5678126215934753, 0.6529568433761597, 0.738101065158844, 0.8232452869415283, 0.9083894491195679, 0.993533730506897, 1.0786778926849365, 1.1638221740722656, 1.2489663362503052, 1.3341104984283447, 1.4192547798156738, 1.5043989419937134, 1.5895432233810425, 1.674687385559082, 1.7598316669464111, 1.8449758291244507, 1.9301199913024902, 2.0152642726898193, 2.1004083156585693, 2.1855525970458984, 2.2706968784332275, 2.3558411598205566, 2.4409852027893066, 2.5261294841766357, 2.611273765563965]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 9.0, 5.0, 10.0, 3.0, 2.0, 10.0, 11.0, 13.0, 16.0, 19.0, 18.0, 18.0, 13.0, 16.0, 30.0, 36.0, 35.0, 28.0, 43.0, 48.0, 35.0, 52.0, 38.0, 46.0, 44.0, 51.0, 41.0, 44.0, 42.0, 30.0, 27.0, 25.0, 15.0, 25.0, 19.0, 15.0, 16.0, 10.0, 7.0, 10.0, 11.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.004260778427124, -0.9713153839111328, -0.9383699893951416, -0.9054246544837952, -0.872479259967804, -0.8395338654518127, -0.8065885305404663, -0.7736431360244751, -0.7406977415084839, -0.7077523469924927, -0.6748069524765015, -0.641861617565155, -0.6089162230491638, -0.5759708285331726, -0.5430254936218262, -0.510080099105835, -0.47713470458984375, -0.44418931007385254, -0.4112439453601837, -0.3782985806465149, -0.3453531861305237, -0.31240779161453247, -0.27946242690086365, -0.24651704728603363, -0.2135716676712036, -0.1806262880563736, -0.14768090844154358, -0.11473552882671356, -0.08179014921188354, -0.04884476959705353, -0.01589938998222351, 0.017045989632606506, 0.04999136924743652, 0.08293674886226654, 0.11588212847709656, 0.14882750809192657, 0.1817728877067566, 0.2147182673215866, 0.24766364693641663, 0.28060901165008545, 0.31355440616607666, 0.34649980068206787, 0.3794451653957367, 0.4123905301094055, 0.44533592462539673, 0.47828131914138794, 0.5112266540527344, 0.5441720485687256, 0.5771174430847168, 0.610062837600708, 0.6430082321166992, 0.6759535670280457, 0.7088989615440369, 0.7418443560600281, 0.7747896909713745, 0.8077350854873657, 0.8406804800033569, 0.8736258745193481, 0.9065712690353394, 0.9395166039466858, 0.972461998462677, 1.0054073333740234, 1.0383527278900146, 1.0712981224060059, 1.104243516921997]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 8.0, 7.0, 6.0, 9.0, 8.0, 20.0, 44.0, 54.0, 99.0, 187.0, 358.0, 706.0, 1509.0, 3615.0, 9928.0, 32428.0, 135364.0, 510995.0, 268633.0, 58627.0, 16090.0, 5502.0, 2235.0, 1005.0, 517.0, 268.0, 133.0, 80.0, 52.0, 25.0, 17.0, 12.0, 7.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.67413330078125, -1.6285400390625, -1.58294677734375, -1.537353515625, -1.49176025390625, -1.4461669921875, -1.40057373046875, -1.35498046875, -1.30938720703125, -1.2637939453125, -1.21820068359375, -1.172607421875, -1.12701416015625, -1.0814208984375, -1.03582763671875, -0.990234375, -0.94464111328125, -0.8990478515625, -0.85345458984375, -0.807861328125, -0.76226806640625, -0.7166748046875, -0.67108154296875, -0.62548828125, -0.57989501953125, -0.5343017578125, -0.48870849609375, -0.443115234375, -0.39752197265625, -0.3519287109375, -0.30633544921875, -0.2607421875, -0.21514892578125, -0.1695556640625, -0.12396240234375, -0.078369140625, -0.03277587890625, 0.0128173828125, 0.05841064453125, 0.10400390625, 0.14959716796875, 0.1951904296875, 0.24078369140625, 0.286376953125, 0.33197021484375, 0.3775634765625, 0.42315673828125, 0.46875, 0.51434326171875, 0.5599365234375, 0.60552978515625, 0.651123046875, 0.69671630859375, 0.7423095703125, 0.78790283203125, 0.83349609375, 0.87908935546875, 0.9246826171875, 0.97027587890625, 1.015869140625, 1.06146240234375, 1.1070556640625, 1.15264892578125, 1.1982421875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 9.0, 13.0, 19.0, 18.0, 25.0, 27.0, 33.0, 30.0, 56.0, 42.0, 54.0, 55.0, 52.0, 56.0, 57.0, 58.0, 49.0, 48.0, 50.0, 48.0, 43.0, 25.0, 26.0, 21.0, 11.0, 14.0, 7.0, 11.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73291015625, -0.7079238891601562, -0.6829376220703125, -0.6579513549804688, -0.632965087890625, -0.6079788208007812, -0.5829925537109375, -0.5580062866210938, -0.53302001953125, -0.5080337524414062, -0.4830474853515625, -0.45806121826171875, -0.433074951171875, -0.40808868408203125, -0.3831024169921875, -0.35811614990234375, -0.3331298828125, -0.30814361572265625, -0.2831573486328125, -0.25817108154296875, -0.233184814453125, -0.20819854736328125, -0.1832122802734375, -0.15822601318359375, -0.13323974609375, -0.10825347900390625, -0.0832672119140625, -0.05828094482421875, -0.033294677734375, -0.00830841064453125, 0.0166778564453125, 0.04166412353515625, 0.066650390625, 0.09163665771484375, 0.1166229248046875, 0.14160919189453125, 0.166595458984375, 0.19158172607421875, 0.2165679931640625, 0.24155426025390625, 0.26654052734375, 0.29152679443359375, 0.3165130615234375, 0.34149932861328125, 0.366485595703125, 0.39147186279296875, 0.4164581298828125, 0.44144439697265625, 0.4664306640625, 0.49141693115234375, 0.5164031982421875, 0.5413894653320312, 0.566375732421875, 0.5913619995117188, 0.6163482666015625, 0.6413345336914062, 0.66632080078125, 0.6913070678710938, 0.7162933349609375, 0.7412796020507812, 0.766265869140625, 0.7912521362304688, 0.8162384033203125, 0.8412246704101562, 0.8662109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 11.0, 19.0, 13.0, 37.0, 42.0, 69.0, 109.0, 216.0, 434.0, 911.0, 2455.0, 10777.0, 98940.0, 811096.0, 107570.0, 11226.0, 2640.0, 975.0, 446.0, 203.0, 122.0, 75.0, 50.0, 31.0, 22.0, 15.0, 14.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.93902587890625, -1.8565673828125, -1.77410888671875, -1.691650390625, -1.60919189453125, -1.5267333984375, -1.44427490234375, -1.36181640625, -1.27935791015625, -1.1968994140625, -1.11444091796875, -1.031982421875, -0.94952392578125, -0.8670654296875, -0.78460693359375, -0.7021484375, -0.61968994140625, -0.5372314453125, -0.45477294921875, -0.372314453125, -0.28985595703125, -0.2073974609375, -0.12493896484375, -0.04248046875, 0.03997802734375, 0.1224365234375, 0.20489501953125, 0.287353515625, 0.36981201171875, 0.4522705078125, 0.53472900390625, 0.6171875, 0.69964599609375, 0.7821044921875, 0.86456298828125, 0.947021484375, 1.02947998046875, 1.1119384765625, 1.19439697265625, 1.27685546875, 1.35931396484375, 1.4417724609375, 1.52423095703125, 1.606689453125, 1.68914794921875, 1.7716064453125, 1.85406494140625, 1.9365234375, 2.01898193359375, 2.1014404296875, 2.18389892578125, 2.266357421875, 2.34881591796875, 2.4312744140625, 2.51373291015625, 2.59619140625, 2.67864990234375, 2.7611083984375, 2.84356689453125, 2.926025390625, 3.00848388671875, 3.0909423828125, 3.17340087890625, 3.255859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 14.0, 16.0, 17.0, 20.0, 31.0, 42.0, 36.0, 52.0, 73.0, 67.0, 82.0, 77.0, 58.0, 58.0, 60.0, 67.0, 56.0, 52.0, 29.0, 27.0, 20.0, 14.0, 13.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.44140625, -6.291046142578125, -6.14068603515625, -5.990325927734375, -5.8399658203125, -5.689605712890625, -5.53924560546875, -5.388885498046875, -5.238525390625, -5.088165283203125, -4.93780517578125, -4.787445068359375, -4.6370849609375, -4.486724853515625, -4.33636474609375, -4.186004638671875, -4.03564453125, -3.885284423828125, -3.73492431640625, -3.584564208984375, -3.4342041015625, -3.283843994140625, -3.13348388671875, -2.983123779296875, -2.832763671875, -2.682403564453125, -2.53204345703125, -2.381683349609375, -2.2313232421875, -2.080963134765625, -1.93060302734375, -1.780242919921875, -1.6298828125, -1.479522705078125, -1.32916259765625, -1.178802490234375, -1.0284423828125, -0.878082275390625, -0.72772216796875, -0.577362060546875, -0.427001953125, -0.276641845703125, -0.12628173828125, 0.024078369140625, 0.1744384765625, 0.324798583984375, 0.47515869140625, 0.625518798828125, 0.77587890625, 0.926239013671875, 1.07659912109375, 1.226959228515625, 1.3773193359375, 1.527679443359375, 1.67803955078125, 1.828399658203125, 1.978759765625, 2.129119873046875, 2.27947998046875, 2.429840087890625, 2.5802001953125, 2.730560302734375, 2.88092041015625, 3.031280517578125, 3.181640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 9.0, 12.0, 13.0, 28.0, 46.0, 125.0, 325.0, 1548.0, 28577.0, 999236.0, 16801.0, 1319.0, 306.0, 99.0, 42.0, 13.0, 14.0, 15.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8828125, -2.8078155517578125, -2.732818603515625, -2.6578216552734375, -2.58282470703125, -2.5078277587890625, -2.432830810546875, -2.3578338623046875, -2.2828369140625, -2.2078399658203125, -2.132843017578125, -2.0578460693359375, -1.98284912109375, -1.9078521728515625, -1.832855224609375, -1.7578582763671875, -1.682861328125, -1.6078643798828125, -1.532867431640625, -1.4578704833984375, -1.38287353515625, -1.3078765869140625, -1.232879638671875, -1.1578826904296875, -1.0828857421875, -1.0078887939453125, -0.932891845703125, -0.8578948974609375, -0.78289794921875, -0.7079010009765625, -0.632904052734375, -0.5579071044921875, -0.48291015625, -0.4079132080078125, -0.332916259765625, -0.2579193115234375, -0.18292236328125, -0.1079254150390625, -0.032928466796875, 0.0420684814453125, 0.1170654296875, 0.1920623779296875, 0.267059326171875, 0.3420562744140625, 0.41705322265625, 0.4920501708984375, 0.567047119140625, 0.6420440673828125, 0.717041015625, 0.7920379638671875, 0.867034912109375, 0.9420318603515625, 1.01702880859375, 1.0920257568359375, 1.167022705078125, 1.2420196533203125, 1.3170166015625, 1.3920135498046875, 1.467010498046875, 1.5420074462890625, 1.61700439453125, 1.6920013427734375, 1.766998291015625, 1.8419952392578125, 1.9169921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 9.0, 11.0, 14.0, 37.0, 53.0, 100.0, 161.0, 207.0, 172.0, 100.0, 53.0, 40.0, 16.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002536773681640625, -0.00024447590112686157, -0.00023527443408966064, -0.00022607296705245972, -0.0002168715000152588, -0.00020767003297805786, -0.00019846856594085693, -0.000189267098903656, -0.00018006563186645508, -0.00017086416482925415, -0.00016166269779205322, -0.0001524612307548523, -0.00014325976371765137, -0.00013405829668045044, -0.0001248568296432495, -0.00011565536260604858, -0.00010645389556884766, -9.725242853164673e-05, -8.80509614944458e-05, -7.884949445724487e-05, -6.964802742004395e-05, -6.044656038284302e-05, -5.124509334564209e-05, -4.204362630844116e-05, -3.2842159271240234e-05, -2.3640692234039307e-05, -1.4439225196838379e-05, -5.237758159637451e-06, 3.9637088775634766e-06, 1.3165175914764404e-05, 2.2366642951965332e-05, 3.156810998916626e-05, 4.076957702636719e-05, 4.9971044063568115e-05, 5.917251110076904e-05, 6.837397813796997e-05, 7.75754451751709e-05, 8.677691221237183e-05, 9.597837924957275e-05, 0.00010517984628677368, 0.00011438131332397461, 0.00012358278036117554, 0.00013278424739837646, 0.0001419857144355774, 0.00015118718147277832, 0.00016038864850997925, 0.00016959011554718018, 0.0001787915825843811, 0.00018799304962158203, 0.00019719451665878296, 0.0002063959836959839, 0.00021559745073318481, 0.00022479891777038574, 0.00023400038480758667, 0.0002432018518447876, 0.0002524033188819885, 0.00026160478591918945, 0.0002708062529563904, 0.0002800077199935913, 0.00028920918703079224, 0.00029841065406799316, 0.0003076121211051941, 0.000316813588142395, 0.00032601505517959595, 0.0003352165222167969]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 15.0, 22.0, 37.0, 100.0, 216.0, 569.0, 1768.0, 9956.0, 290515.0, 724286.0, 17338.0, 2447.0, 734.0, 260.0, 124.0, 68.0, 36.0, 14.0, 11.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6318359375, -1.5793914794921875, -1.526947021484375, -1.4745025634765625, -1.42205810546875, -1.3696136474609375, -1.317169189453125, -1.2647247314453125, -1.2122802734375, -1.1598358154296875, -1.107391357421875, -1.0549468994140625, -1.00250244140625, -0.9500579833984375, -0.897613525390625, -0.8451690673828125, -0.792724609375, -0.7402801513671875, -0.687835693359375, -0.6353912353515625, -0.58294677734375, -0.5305023193359375, -0.478057861328125, -0.4256134033203125, -0.3731689453125, -0.3207244873046875, -0.268280029296875, -0.2158355712890625, -0.16339111328125, -0.1109466552734375, -0.058502197265625, -0.0060577392578125, 0.04638671875, 0.0988311767578125, 0.151275634765625, 0.2037200927734375, 0.25616455078125, 0.3086090087890625, 0.361053466796875, 0.4134979248046875, 0.4659423828125, 0.5183868408203125, 0.570831298828125, 0.6232757568359375, 0.67572021484375, 0.7281646728515625, 0.780609130859375, 0.8330535888671875, 0.885498046875, 0.9379425048828125, 0.990386962890625, 1.0428314208984375, 1.09527587890625, 1.1477203369140625, 1.200164794921875, 1.2526092529296875, 1.3050537109375, 1.3574981689453125, 1.409942626953125, 1.4623870849609375, 1.51483154296875, 1.5672760009765625, 1.619720458984375, 1.6721649169921875, 1.724609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 2.0, 12.0, 8.0, 24.0, 27.0, 48.0, 60.0, 84.0, 133.0, 130.0, 121.0, 112.0, 82.0, 55.0, 37.0, 23.0, 17.0, 6.0, 5.0, 8.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92626953125, -0.8916091918945312, -0.8569488525390625, -0.8222885131835938, -0.787628173828125, -0.7529678344726562, -0.7183074951171875, -0.6836471557617188, -0.64898681640625, -0.6143264770507812, -0.5796661376953125, -0.5450057983398438, -0.510345458984375, -0.47568511962890625, -0.4410247802734375, -0.40636444091796875, -0.3717041015625, -0.33704376220703125, -0.3023834228515625, -0.26772308349609375, -0.233062744140625, -0.19840240478515625, -0.1637420654296875, -0.12908172607421875, -0.09442138671875, -0.05976104736328125, -0.0251007080078125, 0.00955963134765625, 0.044219970703125, 0.07888031005859375, 0.1135406494140625, 0.14820098876953125, 0.182861328125, 0.21752166748046875, 0.2521820068359375, 0.28684234619140625, 0.321502685546875, 0.35616302490234375, 0.3908233642578125, 0.42548370361328125, 0.46014404296875, 0.49480438232421875, 0.5294647216796875, 0.5641250610351562, 0.598785400390625, 0.6334457397460938, 0.6681060791015625, 0.7027664184570312, 0.7374267578125, 0.7720870971679688, 0.8067474365234375, 0.8414077758789062, 0.876068115234375, 0.9107284545898438, 0.9453887939453125, 0.9800491333007812, 1.01470947265625, 1.0493698120117188, 1.0840301513671875, 1.1186904907226562, 1.153350830078125, 1.1880111694335938, 1.2226715087890625, 1.2573318481445312, 1.2919921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 3.0, 12.0, 25.0, 25.0, 47.0, 107.0, 141.0, 190.0, 191.0, 117.0, 54.0, 27.0, 25.0, 9.0, 6.0, 1.0, 5.0, 1.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.30942153930664, -13.776330947875977, -13.243239402770996, -12.710147857666016, -12.177057266235352, -11.643966674804688, -11.110875129699707, -10.577783584594727, -10.044692993164062, -9.511602401733398, -8.978510856628418, -8.445419311523438, -7.912328720092773, -7.379237651824951, -6.846146583557129, -6.313055515289307, -5.779964447021484, -5.246873378753662, -4.71378231048584, -4.180691242218018, -3.6476001739501953, -3.114509105682373, -2.581418037414551, -2.0483269691467285, -1.5152359008789062, -0.982144832611084, -0.4490537643432617, 0.08403730392456055, 0.6171283721923828, 1.150219440460205, 1.6833105087280273, 2.2164015769958496, 2.749490737915039, 3.2825818061828613, 3.8156728744506836, 4.348763942718506, 4.881855010986328, 5.41494607925415, 5.948037147521973, 6.481128215789795, 7.014219284057617, 7.5473103523254395, 8.080401420593262, 8.613492965698242, 9.146583557128906, 9.67967414855957, 10.21276569366455, 10.745857238769531, 11.278947830200195, 11.81203842163086, 12.34512996673584, 12.87822151184082, 13.411312103271484, 13.944402694702148, 14.477494239807129, 15.01058578491211, 15.543676376342773, 16.076766967773438, 16.609859466552734, 17.1429500579834, 17.676040649414062, 18.209131240844727, 18.74222183227539, 19.275314331054688, 19.80840492248535]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 11.0, 7.0, 7.0, 10.0, 12.0, 18.0, 22.0, 25.0, 26.0, 30.0, 30.0, 55.0, 53.0, 62.0, 64.0, 70.0, 56.0, 63.0, 53.0, 57.0, 51.0, 41.0, 32.0, 31.0, 19.0, 20.0, 16.0, 13.0, 10.0, 6.0, 6.0, 7.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.503167152404785, -14.96397590637207, -14.424785614013672, -13.885594367980957, -13.346403121948242, -12.807212829589844, -12.268021583557129, -11.728830337524414, -11.189640045166016, -10.6504487991333, -10.111258506774902, -9.572067260742188, -9.032876968383789, -8.493685722351074, -7.954494476318359, -7.415303707122803, -6.876112937927246, -6.3369221687316895, -5.797731399536133, -5.258540153503418, -4.719349384307861, -4.180158615112305, -3.640967607498169, -3.101776599884033, -2.5625858306884766, -2.02339506149292, -1.4842040538787842, -0.945013165473938, -0.4058222770690918, 0.13336849212646484, 0.6725594997406006, 1.2117505073547363, 1.7509422302246094, 2.290132999420166, 2.8293240070343018, 3.3685150146484375, 3.907705783843994, 4.446896553039551, 4.986087799072266, 5.525278568267822, 6.064469337463379, 6.6036601066589355, 7.142850875854492, 7.682042121887207, 8.221233367919922, 8.76042366027832, 9.299614906311035, 9.83880615234375, 10.377996444702148, 10.917187690734863, 11.456377983093262, 11.995569229125977, 12.534759521484375, 13.07395076751709, 13.613142013549805, 14.152332305908203, 14.691523551940918, 15.230714797973633, 15.769905090332031, 16.30909538269043, 16.84828758239746, 17.38747787475586, 17.926668167114258, 18.46586036682129, 19.005050659179688]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 16.0, 21.0, 32.0, 46.0, 53.0, 82.0, 118.0, 194.0, 353.0, 675.0, 1837.0, 6241.0, 85784.0, 4073411.0, 19542.0, 3417.0, 1171.0, 517.0, 279.0, 151.0, 108.0, 80.0, 52.0, 43.0, 21.0, 12.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.478515625, -2.3992919921875, -2.320068359375, -2.2408447265625, -2.16162109375, -2.0823974609375, -2.003173828125, -1.9239501953125, -1.8447265625, -1.7655029296875, -1.686279296875, -1.6070556640625, -1.52783203125, -1.4486083984375, -1.369384765625, -1.2901611328125, -1.2109375, -1.1317138671875, -1.052490234375, -0.9732666015625, -0.89404296875, -0.8148193359375, -0.735595703125, -0.6563720703125, -0.5771484375, -0.4979248046875, -0.418701171875, -0.3394775390625, -0.26025390625, -0.1810302734375, -0.101806640625, -0.0225830078125, 0.056640625, 0.1358642578125, 0.215087890625, 0.2943115234375, 0.37353515625, 0.4527587890625, 0.531982421875, 0.6112060546875, 0.6904296875, 0.7696533203125, 0.848876953125, 0.9281005859375, 1.00732421875, 1.0865478515625, 1.165771484375, 1.2449951171875, 1.32421875, 1.4034423828125, 1.482666015625, 1.5618896484375, 1.64111328125, 1.7203369140625, 1.799560546875, 1.8787841796875, 1.9580078125, 2.0372314453125, 2.116455078125, 2.1956787109375, 2.27490234375, 2.3541259765625, 2.433349609375, 2.5125732421875, 2.591796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 10.0, 25.0, 24.0, 41.0, 50.0, 74.0, 83.0, 108.0, 88.0, 105.0, 94.0, 78.0, 88.0, 46.0, 32.0, 14.0, 15.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.787109375, -1.7452392578125, -1.703369140625, -1.6614990234375, -1.61962890625, -1.5777587890625, -1.535888671875, -1.4940185546875, -1.4521484375, -1.4102783203125, -1.368408203125, -1.3265380859375, -1.28466796875, -1.2427978515625, -1.200927734375, -1.1590576171875, -1.1171875, -1.0753173828125, -1.033447265625, -0.9915771484375, -0.94970703125, -0.9078369140625, -0.865966796875, -0.8240966796875, -0.7822265625, -0.7403564453125, -0.698486328125, -0.6566162109375, -0.61474609375, -0.5728759765625, -0.531005859375, -0.4891357421875, -0.447265625, -0.4053955078125, -0.363525390625, -0.3216552734375, -0.27978515625, -0.2379150390625, -0.196044921875, -0.1541748046875, -0.1123046875, -0.0704345703125, -0.028564453125, 0.0133056640625, 0.05517578125, 0.0970458984375, 0.138916015625, 0.1807861328125, 0.22265625, 0.2645263671875, 0.306396484375, 0.3482666015625, 0.39013671875, 0.4320068359375, 0.473876953125, 0.5157470703125, 0.5576171875, 0.5994873046875, 0.641357421875, 0.6832275390625, 0.72509765625, 0.7669677734375, 0.808837890625, 0.8507080078125, 0.892578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 8.0, 7.0, 6.0, 8.0, 15.0, 19.0, 24.0, 35.0, 41.0, 69.0, 70.0, 120.0, 199.0, 254.0, 420.0, 735.0, 1528.0, 3866.0, 18520.0, 390544.0, 3734189.0, 33459.0, 5948.0, 1900.0, 833.0, 482.0, 316.0, 196.0, 126.0, 90.0, 61.0, 49.0, 28.0, 26.0, 25.0, 8.0, 19.0, 11.0, 8.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.015625, -1.94647216796875, -1.8773193359375, -1.80816650390625, -1.739013671875, -1.66986083984375, -1.6007080078125, -1.53155517578125, -1.46240234375, -1.39324951171875, -1.3240966796875, -1.25494384765625, -1.185791015625, -1.11663818359375, -1.0474853515625, -0.97833251953125, -0.9091796875, -0.84002685546875, -0.7708740234375, -0.70172119140625, -0.632568359375, -0.56341552734375, -0.4942626953125, -0.42510986328125, -0.35595703125, -0.28680419921875, -0.2176513671875, -0.14849853515625, -0.079345703125, -0.01019287109375, 0.0589599609375, 0.12811279296875, 0.197265625, 0.26641845703125, 0.3355712890625, 0.40472412109375, 0.473876953125, 0.54302978515625, 0.6121826171875, 0.68133544921875, 0.75048828125, 0.81964111328125, 0.8887939453125, 0.95794677734375, 1.027099609375, 1.09625244140625, 1.1654052734375, 1.23455810546875, 1.3037109375, 1.37286376953125, 1.4420166015625, 1.51116943359375, 1.580322265625, 1.64947509765625, 1.7186279296875, 1.78778076171875, 1.85693359375, 1.92608642578125, 1.9952392578125, 2.06439208984375, 2.133544921875, 2.20269775390625, 2.2718505859375, 2.34100341796875, 2.41015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 11.0, 16.0, 25.0, 56.0, 139.0, 593.0, 2767.0, 271.0, 96.0, 37.0, 19.0, 15.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -1.0012893676757812, -0.9703521728515625, -0.9394149780273438, -0.908477783203125, -0.8775405883789062, -0.8466033935546875, -0.8156661987304688, -0.78472900390625, -0.7537918090820312, -0.7228546142578125, -0.6919174194335938, -0.660980224609375, -0.6300430297851562, -0.5991058349609375, -0.5681686401367188, -0.5372314453125, -0.5062942504882812, -0.4753570556640625, -0.44441986083984375, -0.413482666015625, -0.38254547119140625, -0.3516082763671875, -0.32067108154296875, -0.28973388671875, -0.25879669189453125, -0.2278594970703125, -0.19692230224609375, -0.165985107421875, -0.13504791259765625, -0.1041107177734375, -0.07317352294921875, -0.042236328125, -0.01129913330078125, 0.0196380615234375, 0.05057525634765625, 0.081512451171875, 0.11244964599609375, 0.1433868408203125, 0.17432403564453125, 0.20526123046875, 0.23619842529296875, 0.2671356201171875, 0.29807281494140625, 0.329010009765625, 0.35994720458984375, 0.3908843994140625, 0.42182159423828125, 0.4527587890625, 0.48369598388671875, 0.5146331787109375, 0.5455703735351562, 0.576507568359375, 0.6074447631835938, 0.6383819580078125, 0.6693191528320312, 0.70025634765625, 0.7311935424804688, 0.7621307373046875, 0.7930679321289062, 0.824005126953125, 0.8549423217773438, 0.8858795166015625, 0.9168167114257812, 0.94775390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 15.0, 22.0, 48.0, 98.0, 176.0, 255.0, 221.0, 90.0, 49.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.740829467773438, -8.528131484985352, -8.315434455871582, -8.102736473083496, -7.89003849029541, -7.677340984344482, -7.464643478393555, -7.251945495605469, -7.039247989654541, -6.826550483703613, -6.613852500915527, -6.4011549949646, -6.188457489013672, -5.975759506225586, -5.763062000274658, -5.5503644943237305, -5.3376665115356445, -5.124969005584717, -4.912271022796631, -4.699573516845703, -4.486875534057617, -4.2741780281066895, -4.061480522155762, -3.848782777786255, -3.636085033416748, -3.423387289047241, -3.2106895446777344, -2.9979920387268066, -2.7852942943573, -2.572596549987793, -2.3598990440368652, -2.1472012996673584, -1.9345040321350098, -1.721806287765503, -1.5091086626052856, -1.2964110374450684, -1.0837132930755615, -0.8710155487060547, -0.6583179235458374, -0.4456202983856201, -0.23292255401611328, -0.02022486925125122, 0.19247281551361084, 0.4051705002784729, 0.617868185043335, 0.8305659294128418, 1.043263554573059, 1.2559611797332764, 1.4686589241027832, 1.68135666847229, 1.8940542936325073, 2.1067519187927246, 2.3194496631622314, 2.5321474075317383, 2.744844913482666, 2.957542657852173, 3.1702404022216797, 3.3829381465911865, 3.5956358909606934, 3.808333396911621, 4.021031379699707, 4.233728885650635, 4.4464263916015625, 4.659124374389648, 4.871821880340576]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 7.0, 5.0, 8.0, 7.0, 8.0, 10.0, 15.0, 14.0, 28.0, 25.0, 24.0, 19.0, 49.0, 31.0, 44.0, 51.0, 40.0, 30.0, 27.0, 43.0, 54.0, 43.0, 32.0, 35.0, 42.0, 41.0, 32.0, 32.0, 29.0, 24.0, 19.0, 24.0, 18.0, 22.0, 19.0, 11.0, 9.0, 6.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9902310371398926, -1.9276185035705566, -1.8650058507919312, -1.8023933172225952, -1.7397806644439697, -1.6771681308746338, -1.6145555973052979, -1.5519429445266724, -1.4893302917480469, -1.426717758178711, -1.3641051054000854, -1.3014925718307495, -1.238879919052124, -1.176267385482788, -1.1136548519134521, -1.0510421991348267, -0.9884296655654907, -0.92581707239151, -0.8632044792175293, -0.8005919456481934, -0.7379792928695679, -0.6753667593002319, -0.6127541661262512, -0.5501415729522705, -0.4875289797782898, -0.4249163866043091, -0.36230379343032837, -0.29969123005867004, -0.23707863688468933, -0.17446604371070862, -0.11185348033905029, -0.04924088716506958, 0.013371706008911133, 0.07598429173231125, 0.13859687745571136, 0.20120945572853088, 0.2638220489025116, 0.3264346420764923, 0.38904720544815063, 0.45165979862213135, 0.5142723917961121, 0.5768849849700928, 0.6394975781440735, 0.7021101713180542, 0.7647227048873901, 0.8273353576660156, 0.8899478912353516, 0.9525604844093323, 1.015173077583313, 1.077785611152649, 1.1403982639312744, 1.2030107975006104, 1.2656234502792358, 1.3282359838485718, 1.3908486366271973, 1.4534611701965332, 1.5160737037658691, 1.578686237335205, 1.6412988901138306, 1.7039114236831665, 1.766524076461792, 1.829136610031128, 1.8917491436004639, 1.9543617963790894, 2.016974449157715]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 4.0, 7.0, 14.0, 15.0, 33.0, 57.0, 45.0, 72.0, 122.0, 224.0, 413.0, 655.0, 1446.0, 2870.0, 6991.0, 20501.0, 71745.0, 277767.0, 460655.0, 145327.0, 38844.0, 11949.0, 4526.0, 1954.0, 984.0, 522.0, 305.0, 171.0, 95.0, 84.0, 41.0, 26.0, 21.0, 14.0, 16.0, 3.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1181640625, -1.0785980224609375, -1.039031982421875, -0.9994659423828125, -0.95989990234375, -0.9203338623046875, -0.880767822265625, -0.8412017822265625, -0.8016357421875, -0.7620697021484375, -0.722503662109375, -0.6829376220703125, -0.64337158203125, -0.6038055419921875, -0.564239501953125, -0.5246734619140625, -0.485107421875, -0.4455413818359375, -0.405975341796875, -0.3664093017578125, -0.32684326171875, -0.2872772216796875, -0.247711181640625, -0.2081451416015625, -0.1685791015625, -0.1290130615234375, -0.089447021484375, -0.0498809814453125, -0.01031494140625, 0.0292510986328125, 0.068817138671875, 0.1083831787109375, 0.14794921875, 0.1875152587890625, 0.227081298828125, 0.2666473388671875, 0.30621337890625, 0.3457794189453125, 0.385345458984375, 0.4249114990234375, 0.4644775390625, 0.5040435791015625, 0.543609619140625, 0.5831756591796875, 0.62274169921875, 0.6623077392578125, 0.701873779296875, 0.7414398193359375, 0.781005859375, 0.8205718994140625, 0.860137939453125, 0.8997039794921875, 0.93927001953125, 0.9788360595703125, 1.018402099609375, 1.0579681396484375, 1.0975341796875, 1.1371002197265625, 1.176666259765625, 1.2162322998046875, 1.25579833984375, 1.2953643798828125, 1.334930419921875, 1.3744964599609375, 1.4140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 9.0, 17.0, 31.0, 33.0, 53.0, 65.0, 74.0, 85.0, 91.0, 89.0, 88.0, 85.0, 74.0, 49.0, 59.0, 29.0, 19.0, 14.0, 9.0, 4.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.474609375, -1.435943603515625, -1.39727783203125, -1.358612060546875, -1.3199462890625, -1.281280517578125, -1.24261474609375, -1.203948974609375, -1.165283203125, -1.126617431640625, -1.08795166015625, -1.049285888671875, -1.0106201171875, -0.971954345703125, -0.93328857421875, -0.894622802734375, -0.85595703125, -0.817291259765625, -0.77862548828125, -0.739959716796875, -0.7012939453125, -0.662628173828125, -0.62396240234375, -0.585296630859375, -0.546630859375, -0.507965087890625, -0.46929931640625, -0.430633544921875, -0.3919677734375, -0.353302001953125, -0.31463623046875, -0.275970458984375, -0.2373046875, -0.198638916015625, -0.15997314453125, -0.121307373046875, -0.0826416015625, -0.043975830078125, -0.00531005859375, 0.033355712890625, 0.072021484375, 0.110687255859375, 0.14935302734375, 0.188018798828125, 0.2266845703125, 0.265350341796875, 0.30401611328125, 0.342681884765625, 0.38134765625, 0.420013427734375, 0.45867919921875, 0.497344970703125, 0.5360107421875, 0.574676513671875, 0.61334228515625, 0.652008056640625, 0.690673828125, 0.729339599609375, 0.76800537109375, 0.806671142578125, 0.8453369140625, 0.884002685546875, 0.92266845703125, 0.961334228515625, 1.0]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 3.0, 4.0, 10.0, 9.0, 15.0, 14.0, 19.0, 29.0, 33.0, 54.0, 62.0, 110.0, 154.0, 222.0, 330.0, 605.0, 1115.0, 2348.0, 6888.0, 29306.0, 211395.0, 659628.0, 109031.0, 17980.0, 4999.0, 1840.0, 913.0, 532.0, 284.0, 200.0, 126.0, 81.0, 45.0, 39.0, 28.0, 28.0, 21.0, 14.0, 6.0, 3.0, 6.0, 10.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.685546875, -1.6300048828125, -1.574462890625, -1.5189208984375, -1.46337890625, -1.4078369140625, -1.352294921875, -1.2967529296875, -1.2412109375, -1.1856689453125, -1.130126953125, -1.0745849609375, -1.01904296875, -0.9635009765625, -0.907958984375, -0.8524169921875, -0.796875, -0.7413330078125, -0.685791015625, -0.6302490234375, -0.57470703125, -0.5191650390625, -0.463623046875, -0.4080810546875, -0.3525390625, -0.2969970703125, -0.241455078125, -0.1859130859375, -0.13037109375, -0.0748291015625, -0.019287109375, 0.0362548828125, 0.091796875, 0.1473388671875, 0.202880859375, 0.2584228515625, 0.31396484375, 0.3695068359375, 0.425048828125, 0.4805908203125, 0.5361328125, 0.5916748046875, 0.647216796875, 0.7027587890625, 0.75830078125, 0.8138427734375, 0.869384765625, 0.9249267578125, 0.98046875, 1.0360107421875, 1.091552734375, 1.1470947265625, 1.20263671875, 1.2581787109375, 1.313720703125, 1.3692626953125, 1.4248046875, 1.4803466796875, 1.535888671875, 1.5914306640625, 1.64697265625, 1.7025146484375, 1.758056640625, 1.8135986328125, 1.869140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 8.0, 14.0, 9.0, 16.0, 19.0, 22.0, 27.0, 47.0, 47.0, 52.0, 56.0, 57.0, 57.0, 39.0, 46.0, 60.0, 59.0, 41.0, 47.0, 38.0, 36.0, 38.0, 34.0, 20.0, 26.0, 11.0, 16.0, 16.0, 7.0, 6.0, 5.0, 10.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.494140625, -2.395843505859375, -2.29754638671875, -2.199249267578125, -2.1009521484375, -2.002655029296875, -1.90435791015625, -1.806060791015625, -1.707763671875, -1.609466552734375, -1.51116943359375, -1.412872314453125, -1.3145751953125, -1.216278076171875, -1.11798095703125, -1.019683837890625, -0.92138671875, -0.823089599609375, -0.72479248046875, -0.626495361328125, -0.5281982421875, -0.429901123046875, -0.33160400390625, -0.233306884765625, -0.135009765625, -0.036712646484375, 0.06158447265625, 0.159881591796875, 0.2581787109375, 0.356475830078125, 0.45477294921875, 0.553070068359375, 0.6513671875, 0.749664306640625, 0.84796142578125, 0.946258544921875, 1.0445556640625, 1.142852783203125, 1.24114990234375, 1.339447021484375, 1.437744140625, 1.536041259765625, 1.63433837890625, 1.732635498046875, 1.8309326171875, 1.929229736328125, 2.02752685546875, 2.125823974609375, 2.22412109375, 2.322418212890625, 2.42071533203125, 2.519012451171875, 2.6173095703125, 2.715606689453125, 2.81390380859375, 2.912200927734375, 3.010498046875, 3.108795166015625, 3.20709228515625, 3.305389404296875, 3.4036865234375, 3.501983642578125, 3.60028076171875, 3.698577880859375, 3.796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 15.0, 27.0, 31.0, 65.0, 84.0, 152.0, 273.0, 662.0, 1614.0, 5531.0, 32070.0, 608253.0, 368223.0, 24293.0, 4656.0, 1405.0, 585.0, 259.0, 114.0, 79.0, 34.0, 30.0, 20.0, 15.0, 10.0, 13.0, 5.0, 5.0, 2.0, 2.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.216796875, -1.1863250732421875, -1.155853271484375, -1.1253814697265625, -1.09490966796875, -1.0644378662109375, -1.033966064453125, -1.0034942626953125, -0.9730224609375, -0.9425506591796875, -0.912078857421875, -0.8816070556640625, -0.85113525390625, -0.8206634521484375, -0.790191650390625, -0.7597198486328125, -0.729248046875, -0.6987762451171875, -0.668304443359375, -0.6378326416015625, -0.60736083984375, -0.5768890380859375, -0.546417236328125, -0.5159454345703125, -0.4854736328125, -0.4550018310546875, -0.424530029296875, -0.3940582275390625, -0.36358642578125, -0.3331146240234375, -0.302642822265625, -0.2721710205078125, -0.24169921875, -0.2112274169921875, -0.180755615234375, -0.1502838134765625, -0.11981201171875, -0.0893402099609375, -0.058868408203125, -0.0283966064453125, 0.0020751953125, 0.0325469970703125, 0.063018798828125, 0.0934906005859375, 0.12396240234375, 0.1544342041015625, 0.184906005859375, 0.2153778076171875, 0.245849609375, 0.2763214111328125, 0.306793212890625, 0.3372650146484375, 0.36773681640625, 0.3982086181640625, 0.428680419921875, 0.4591522216796875, 0.4896240234375, 0.5200958251953125, 0.550567626953125, 0.5810394287109375, 0.61151123046875, 0.6419830322265625, 0.672454833984375, 0.7029266357421875, 0.7333984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 12.0, 9.0, 2.0, 12.0, 12.0, 20.0, 26.0, 28.0, 47.0, 48.0, 82.0, 133.0, 167.0, 98.0, 69.0, 31.0, 41.0, 35.0, 27.0, 24.0, 18.0, 13.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00022590160369873047, -0.00021999888122081757, -0.00021409615874290466, -0.00020819343626499176, -0.00020229071378707886, -0.00019638799130916595, -0.00019048526883125305, -0.00018458254635334015, -0.00017867982387542725, -0.00017277710139751434, -0.00016687437891960144, -0.00016097165644168854, -0.00015506893396377563, -0.00014916621148586273, -0.00014326348900794983, -0.00013736076653003693, -0.00013145804405212402, -0.00012555532157421112, -0.00011965259909629822, -0.00011374987661838531, -0.00010784715414047241, -0.00010194443166255951, -9.60417091846466e-05, -9.01389867067337e-05, -8.42362642288208e-05, -7.83335417509079e-05, -7.2430819272995e-05, -6.652809679508209e-05, -6.062537431716919e-05, -5.472265183925629e-05, -4.8819929361343384e-05, -4.291720688343048e-05, -3.701448440551758e-05, -3.1111761927604675e-05, -2.5209039449691772e-05, -1.930631697177887e-05, -1.3403594493865967e-05, -7.500872015953064e-06, -1.5981495380401611e-06, 4.304572939872742e-06, 1.0207295417785645e-05, 1.6110017895698547e-05, 2.201274037361145e-05, 2.7915462851524353e-05, 3.3818185329437256e-05, 3.972090780735016e-05, 4.562363028526306e-05, 5.1526352763175964e-05, 5.742907524108887e-05, 6.333179771900177e-05, 6.923452019691467e-05, 7.513724267482758e-05, 8.103996515274048e-05, 8.694268763065338e-05, 9.284541010856628e-05, 9.874813258647919e-05, 0.00010465085506439209, 0.00011055357754230499, 0.0001164563000202179, 0.0001223590224981308, 0.0001282617449760437, 0.0001341644674539566, 0.0001400671899318695, 0.0001459699124097824, 0.0001518726348876953]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 4.0, 9.0, 22.0, 27.0, 45.0, 79.0, 139.0, 245.0, 523.0, 1334.0, 4683.0, 36203.0, 764433.0, 222998.0, 13369.0, 2660.0, 918.0, 382.0, 200.0, 104.0, 59.0, 35.0, 19.0, 19.0, 11.0, 7.0, 9.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.5498046875, -1.511810302734375, -1.47381591796875, -1.435821533203125, -1.3978271484375, -1.359832763671875, -1.32183837890625, -1.283843994140625, -1.245849609375, -1.207855224609375, -1.16986083984375, -1.131866455078125, -1.0938720703125, -1.055877685546875, -1.01788330078125, -0.979888916015625, -0.94189453125, -0.903900146484375, -0.86590576171875, -0.827911376953125, -0.7899169921875, -0.751922607421875, -0.71392822265625, -0.675933837890625, -0.637939453125, -0.599945068359375, -0.56195068359375, -0.523956298828125, -0.4859619140625, -0.447967529296875, -0.40997314453125, -0.371978759765625, -0.333984375, -0.295989990234375, -0.25799560546875, -0.220001220703125, -0.1820068359375, -0.144012451171875, -0.10601806640625, -0.068023681640625, -0.030029296875, 0.007965087890625, 0.04595947265625, 0.083953857421875, 0.1219482421875, 0.159942626953125, 0.19793701171875, 0.235931396484375, 0.27392578125, 0.311920166015625, 0.34991455078125, 0.387908935546875, 0.4259033203125, 0.463897705078125, 0.50189208984375, 0.539886474609375, 0.577880859375, 0.615875244140625, 0.65386962890625, 0.691864013671875, 0.7298583984375, 0.767852783203125, 0.80584716796875, 0.843841552734375, 0.8818359375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 2.0, 11.0, 13.0, 12.0, 25.0, 25.0, 31.0, 20.0, 50.0, 67.0, 96.0, 92.0, 92.0, 90.0, 76.0, 58.0, 44.0, 48.0, 32.0, 20.0, 22.0, 16.0, 14.0, 12.0, 9.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7099609375, -0.6882705688476562, -0.6665802001953125, -0.6448898315429688, -0.623199462890625, -0.6015090942382812, -0.5798187255859375, -0.5581283569335938, -0.53643798828125, -0.5147476196289062, -0.4930572509765625, -0.47136688232421875, -0.449676513671875, -0.42798614501953125, -0.4062957763671875, -0.38460540771484375, -0.3629150390625, -0.34122467041015625, -0.3195343017578125, -0.29784393310546875, -0.276153564453125, -0.25446319580078125, -0.2327728271484375, -0.21108245849609375, -0.18939208984375, -0.16770172119140625, -0.1460113525390625, -0.12432098388671875, -0.102630615234375, -0.08094024658203125, -0.0592498779296875, -0.03755950927734375, -0.015869140625, 0.00582122802734375, 0.0275115966796875, 0.04920196533203125, 0.070892333984375, 0.09258270263671875, 0.1142730712890625, 0.13596343994140625, 0.15765380859375, 0.17934417724609375, 0.2010345458984375, 0.22272491455078125, 0.244415283203125, 0.26610565185546875, 0.2877960205078125, 0.30948638916015625, 0.3311767578125, 0.35286712646484375, 0.3745574951171875, 0.39624786376953125, 0.417938232421875, 0.43962860107421875, 0.4613189697265625, 0.48300933837890625, 0.50469970703125, 0.5263900756835938, 0.5480804443359375, 0.5697708129882812, 0.591461181640625, 0.6131515502929688, 0.6348419189453125, 0.6565322875976562, 0.67822265625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 16.0, 41.0, 85.0, 145.0, 212.0, 209.0, 150.0, 56.0, 29.0, 16.0, 9.0, 9.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.551868438720703, -18.916439056396484, -18.281009674072266, -17.645578384399414, -17.010149002075195, -16.374719619750977, -15.739290237426758, -15.103860855102539, -14.468430519104004, -13.833001136779785, -13.19757080078125, -12.562141418457031, -11.926712036132812, -11.291281700134277, -10.655852317810059, -10.020421981811523, -9.384992599487305, -8.749563217163086, -8.11413288116455, -7.478703498840332, -6.843273639678955, -6.207843780517578, -5.572414398193359, -4.936984539031982, -4.3015546798706055, -3.6661248207092285, -3.0306951999664307, -2.395265579223633, -1.7598357200622559, -1.124405860900879, -0.48897624015808105, 0.1464533805847168, 0.7818832397460938, 1.4173129796981812, 2.0527427196502686, 2.6881723403930664, 3.3236021995544434, 3.9590320587158203, 4.594461441040039, 5.229891300201416, 5.865321159362793, 6.50075101852417, 7.136180877685547, 7.771610260009766, 8.407039642333984, 9.04246997833252, 9.677899360656738, 10.313329696655273, 10.948759078979492, 11.584188461303711, 12.219618797302246, 12.855048179626465, 13.490478515625, 14.125907897949219, 14.761337280273438, 15.396766662597656, 16.032196044921875, 16.667625427246094, 17.303054809570312, 17.938486099243164, 18.573915481567383, 19.2093448638916, 19.84477424621582, 20.48020362854004, 21.11563491821289]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 8.0, 13.0, 14.0, 15.0, 31.0, 23.0, 37.0, 36.0, 51.0, 66.0, 74.0, 67.0, 70.0, 62.0, 63.0, 67.0, 58.0, 46.0, 38.0, 30.0, 21.0, 28.0, 25.0, 9.0, 10.0, 11.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.532419204711914, -13.00814151763916, -12.48386287689209, -11.959585189819336, -11.435306549072266, -10.911028861999512, -10.386751174926758, -9.862472534179688, -9.338194847106934, -8.81391716003418, -8.28963851928711, -7.7653608322143555, -7.241082668304443, -6.716804504394531, -6.192526817321777, -5.668248653411865, -5.143970489501953, -4.619692325592041, -4.095414161682129, -3.571136474609375, -3.046858310699463, -2.522580146789551, -1.9983022212982178, -1.4740242958068848, -0.9497461318969727, -0.4254680871963501, 0.09880995750427246, 0.623088002204895, 1.1473660469055176, 1.6716442108154297, 2.1959221363067627, 2.7202000617980957, 3.244476318359375, 3.768754482269287, 4.293032646179199, 4.817310333251953, 5.341588497161865, 5.865866661071777, 6.390144348144531, 6.914422512054443, 7.4387006759643555, 7.962978839874268, 8.48725700378418, 9.011534690856934, 9.535812377929688, 10.060091018676758, 10.584368705749512, 11.108646392822266, 11.632925033569336, 12.15720272064209, 12.68148136138916, 13.205759048461914, 13.730037689208984, 14.254315376281738, 14.778593063354492, 15.302871704101562, 15.827149391174316, 16.35142707824707, 16.87570571899414, 17.39998435974121, 17.92426109313965, 18.44853973388672, 18.97281837463379, 19.497095108032227, 20.021373748779297]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 4.0, 4.0, 9.0, 6.0, 9.0, 21.0, 23.0, 32.0, 64.0, 95.0, 144.0, 219.0, 380.0, 520.0, 996.0, 1977.0, 4125.0, 12740.0, 71715.0, 2282186.0, 1737896.0, 61819.0, 11170.0, 3988.0, 1781.0, 930.0, 524.0, 319.0, 201.0, 123.0, 81.0, 53.0, 50.0, 20.0, 15.0, 11.0, 9.0, 5.0, 4.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4169921875, -1.3712310791015625, -1.325469970703125, -1.2797088623046875, -1.23394775390625, -1.1881866455078125, -1.142425537109375, -1.0966644287109375, -1.0509033203125, -1.0051422119140625, -0.959381103515625, -0.9136199951171875, -0.86785888671875, -0.8220977783203125, -0.776336669921875, -0.7305755615234375, -0.684814453125, -0.6390533447265625, -0.593292236328125, -0.5475311279296875, -0.50177001953125, -0.4560089111328125, -0.410247802734375, -0.3644866943359375, -0.3187255859375, -0.2729644775390625, -0.227203369140625, -0.1814422607421875, -0.13568115234375, -0.0899200439453125, -0.044158935546875, 0.0016021728515625, 0.04736328125, 0.0931243896484375, 0.138885498046875, 0.1846466064453125, 0.23040771484375, 0.2761688232421875, 0.321929931640625, 0.3676910400390625, 0.4134521484375, 0.4592132568359375, 0.504974365234375, 0.5507354736328125, 0.59649658203125, 0.6422576904296875, 0.688018798828125, 0.7337799072265625, 0.779541015625, 0.8253021240234375, 0.871063232421875, 0.9168243408203125, 0.96258544921875, 1.0083465576171875, 1.054107666015625, 1.0998687744140625, 1.1456298828125, 1.1913909912109375, 1.237152099609375, 1.2829132080078125, 1.32867431640625, 1.3744354248046875, 1.420196533203125, 1.4659576416015625, 1.51171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 8.0, 3.0, 17.0, 12.0, 14.0, 14.0, 34.0, 34.0, 47.0, 44.0, 59.0, 51.0, 55.0, 46.0, 60.0, 58.0, 55.0, 52.0, 46.0, 40.0, 33.0, 45.0, 34.0, 27.0, 25.0, 17.0, 13.0, 15.0, 8.0, 9.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.5403289794921875, -0.519622802734375, -0.4989166259765625, -0.47821044921875, -0.4575042724609375, -0.436798095703125, -0.4160919189453125, -0.3953857421875, -0.3746795654296875, -0.353973388671875, -0.3332672119140625, -0.31256103515625, -0.2918548583984375, -0.271148681640625, -0.2504425048828125, -0.229736328125, -0.2090301513671875, -0.188323974609375, -0.1676177978515625, -0.14691162109375, -0.1262054443359375, -0.105499267578125, -0.0847930908203125, -0.0640869140625, -0.0433807373046875, -0.022674560546875, -0.0019683837890625, 0.01873779296875, 0.0394439697265625, 0.060150146484375, 0.0808563232421875, 0.1015625, 0.1222686767578125, 0.142974853515625, 0.1636810302734375, 0.18438720703125, 0.2050933837890625, 0.225799560546875, 0.2465057373046875, 0.2672119140625, 0.2879180908203125, 0.308624267578125, 0.3293304443359375, 0.35003662109375, 0.3707427978515625, 0.391448974609375, 0.4121551513671875, 0.432861328125, 0.4535675048828125, 0.474273681640625, 0.4949798583984375, 0.51568603515625, 0.5363922119140625, 0.557098388671875, 0.5778045654296875, 0.5985107421875, 0.6192169189453125, 0.639923095703125, 0.6606292724609375, 0.68133544921875, 0.7020416259765625, 0.722747802734375, 0.7434539794921875, 0.76416015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 11.0, 1.0, 12.0, 19.0, 10.0, 29.0, 64.0, 91.0, 165.0, 285.0, 570.0, 1185.0, 2924.0, 8579.0, 36778.0, 1065065.0, 3008404.0, 53168.0, 10613.0, 3446.0, 1473.0, 617.0, 350.0, 169.0, 84.0, 60.0, 42.0, 19.0, 23.0, 8.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.162872314453125, -2.09332275390625, -2.023773193359375, -1.9542236328125, -1.884674072265625, -1.81512451171875, -1.745574951171875, -1.676025390625, -1.606475830078125, -1.53692626953125, -1.467376708984375, -1.3978271484375, -1.328277587890625, -1.25872802734375, -1.189178466796875, -1.11962890625, -1.050079345703125, -0.98052978515625, -0.910980224609375, -0.8414306640625, -0.771881103515625, -0.70233154296875, -0.632781982421875, -0.563232421875, -0.493682861328125, -0.42413330078125, -0.354583740234375, -0.2850341796875, -0.215484619140625, -0.14593505859375, -0.076385498046875, -0.0068359375, 0.062713623046875, 0.13226318359375, 0.201812744140625, 0.2713623046875, 0.340911865234375, 0.41046142578125, 0.480010986328125, 0.549560546875, 0.619110107421875, 0.68865966796875, 0.758209228515625, 0.8277587890625, 0.897308349609375, 0.96685791015625, 1.036407470703125, 1.10595703125, 1.175506591796875, 1.24505615234375, 1.314605712890625, 1.3841552734375, 1.453704833984375, 1.52325439453125, 1.592803955078125, 1.662353515625, 1.731903076171875, 1.80145263671875, 1.871002197265625, 1.9405517578125, 2.010101318359375, 2.07965087890625, 2.149200439453125, 2.21875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 9.0, 7.0, 11.0, 16.0, 19.0, 18.0, 39.0, 74.0, 129.0, 274.0, 649.0, 1176.0, 856.0, 375.0, 166.0, 84.0, 59.0, 23.0, 15.0, 16.0, 8.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.67578125, -1.617431640625, -1.55908203125, -1.500732421875, -1.4423828125, -1.384033203125, -1.32568359375, -1.267333984375, -1.208984375, -1.150634765625, -1.09228515625, -1.033935546875, -0.9755859375, -0.917236328125, -0.85888671875, -0.800537109375, -0.7421875, -0.683837890625, -0.62548828125, -0.567138671875, -0.5087890625, -0.450439453125, -0.39208984375, -0.333740234375, -0.275390625, -0.217041015625, -0.15869140625, -0.100341796875, -0.0419921875, 0.016357421875, 0.07470703125, 0.133056640625, 0.19140625, 0.249755859375, 0.30810546875, 0.366455078125, 0.4248046875, 0.483154296875, 0.54150390625, 0.599853515625, 0.658203125, 0.716552734375, 0.77490234375, 0.833251953125, 0.8916015625, 0.949951171875, 1.00830078125, 1.066650390625, 1.125, 1.183349609375, 1.24169921875, 1.300048828125, 1.3583984375, 1.416748046875, 1.47509765625, 1.533447265625, 1.591796875, 1.650146484375, 1.70849609375, 1.766845703125, 1.8251953125, 1.883544921875, 1.94189453125, 2.000244140625, 2.05859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 11.0, 28.0, 51.0, 87.0, 205.0, 238.0, 197.0, 96.0, 42.0, 17.0, 12.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.277074813842773, -26.692138671875, -26.107202529907227, -25.52226448059082, -24.937328338623047, -24.352392196655273, -23.7674560546875, -23.182518005371094, -22.59758186340332, -22.012645721435547, -21.427709579467773, -20.842771530151367, -20.257835388183594, -19.67289924621582, -19.087963104248047, -18.50302505493164, -17.9180908203125, -17.333154678344727, -16.748218536376953, -16.163280487060547, -15.578344345092773, -14.993408203125, -14.408472061157227, -13.823534965515137, -13.238597869873047, -12.653661727905273, -12.068724632263184, -11.48378849029541, -10.89885139465332, -10.313915252685547, -9.728979110717773, -9.144042015075684, -8.559103965759277, -7.974167346954346, -7.389230728149414, -6.804294586181641, -6.219357490539551, -5.634421348571777, -5.049484729766846, -4.464548110961914, -3.8796114921569824, -3.294674873352051, -2.709738254547119, -2.1248018741607666, -1.539865255355835, -0.9549286365509033, -0.3699922561645508, 0.21494436264038086, 0.7998809814453125, 1.3848176002502441, 1.9697540998458862, 2.5546905994415283, 3.13962721824646, 3.7245638370513916, 4.309500217437744, 4.894436836242676, 5.479373455047607, 6.064310073852539, 6.649246692657471, 7.234183311462402, 7.819119453430176, 8.404056549072266, 8.988992691040039, 9.573928833007812, 10.158865928649902]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 6.0, 9.0, 10.0, 16.0, 12.0, 19.0, 20.0, 21.0, 34.0, 33.0, 33.0, 30.0, 42.0, 35.0, 39.0, 50.0, 46.0, 57.0, 45.0, 57.0, 46.0, 43.0, 39.0, 25.0, 46.0, 33.0, 20.0, 26.0, 23.0, 19.0, 18.0, 8.0, 5.0, 11.0, 6.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.645757675170898, -6.436529159545898, -6.227300643920898, -6.018072128295898, -5.808843612670898, -5.599615097045898, -5.390387058258057, -5.181158542633057, -4.971930027008057, -4.762701511383057, -4.553472995758057, -4.344244480133057, -4.135016441345215, -3.9257876873016357, -3.716559410095215, -3.507330894470215, -3.298102378845215, -3.088873863220215, -2.879645347595215, -2.670417070388794, -2.461188554763794, -2.251960039138794, -2.042731761932373, -1.833503246307373, -1.624274730682373, -1.415046215057373, -1.2058178186416626, -0.9965893626213074, -0.7873609066009521, -0.5781323909759521, -0.3689039945602417, -0.15967559814453125, 0.04955291748046875, 0.258781373500824, 0.4680098295211792, 0.6772382855415344, 0.8864667415618896, 1.0956952571868896, 1.3049236536026, 1.5141520500183105, 1.7233805656433105, 1.9326090812683105, 2.1418375968933105, 2.3510658740997314, 2.5602943897247314, 2.7695229053497314, 2.9787511825561523, 3.1879796981811523, 3.3972082138061523, 3.6064367294311523, 3.8156652450561523, 4.024893760681152, 4.234122276306152, 4.443350791931152, 4.652578830718994, 4.861807346343994, 5.071035861968994, 5.280264377593994, 5.489492893218994, 5.698721408843994, 5.907949447631836, 6.117177963256836, 6.326406478881836, 6.535634994506836, 6.744863510131836]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 5.0, 3.0, 13.0, 22.0, 40.0, 51.0, 81.0, 142.0, 266.0, 438.0, 761.0, 1567.0, 3210.0, 7118.0, 16684.0, 44104.0, 131104.0, 377710.0, 306521.0, 99683.0, 34464.0, 13258.0, 5642.0, 2703.0, 1303.0, 681.0, 385.0, 221.0, 124.0, 79.0, 57.0, 30.0, 20.0, 21.0, 9.0, 5.0, 10.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98046875, -0.9487152099609375, -0.916961669921875, -0.8852081298828125, -0.85345458984375, -0.8217010498046875, -0.789947509765625, -0.7581939697265625, -0.7264404296875, -0.6946868896484375, -0.662933349609375, -0.6311798095703125, -0.59942626953125, -0.5676727294921875, -0.535919189453125, -0.5041656494140625, -0.472412109375, -0.4406585693359375, -0.408905029296875, -0.3771514892578125, -0.34539794921875, -0.3136444091796875, -0.281890869140625, -0.2501373291015625, -0.2183837890625, -0.1866302490234375, -0.154876708984375, -0.1231231689453125, -0.09136962890625, -0.0596160888671875, -0.027862548828125, 0.0038909912109375, 0.03564453125, 0.0673980712890625, 0.099151611328125, 0.1309051513671875, 0.16265869140625, 0.1944122314453125, 0.226165771484375, 0.2579193115234375, 0.2896728515625, 0.3214263916015625, 0.353179931640625, 0.3849334716796875, 0.41668701171875, 0.4484405517578125, 0.480194091796875, 0.5119476318359375, 0.543701171875, 0.5754547119140625, 0.607208251953125, 0.6389617919921875, 0.67071533203125, 0.7024688720703125, 0.734222412109375, 0.7659759521484375, 0.7977294921875, 0.8294830322265625, 0.861236572265625, 0.8929901123046875, 0.92474365234375, 0.9564971923828125, 0.988250732421875, 1.0200042724609375, 1.0517578125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 11.0, 12.0, 16.0, 23.0, 28.0, 31.0, 34.0, 42.0, 48.0, 66.0, 45.0, 55.0, 47.0, 60.0, 54.0, 56.0, 44.0, 55.0, 40.0, 31.0, 46.0, 30.0, 26.0, 21.0, 11.0, 8.0, 11.0, 16.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.590545654296875, -0.56976318359375, -0.548980712890625, -0.5281982421875, -0.507415771484375, -0.48663330078125, -0.465850830078125, -0.445068359375, -0.424285888671875, -0.40350341796875, -0.382720947265625, -0.3619384765625, -0.341156005859375, -0.32037353515625, -0.299591064453125, -0.27880859375, -0.258026123046875, -0.23724365234375, -0.216461181640625, -0.1956787109375, -0.174896240234375, -0.15411376953125, -0.133331298828125, -0.112548828125, -0.091766357421875, -0.07098388671875, -0.050201416015625, -0.0294189453125, -0.008636474609375, 0.01214599609375, 0.032928466796875, 0.0537109375, 0.074493408203125, 0.09527587890625, 0.116058349609375, 0.1368408203125, 0.157623291015625, 0.17840576171875, 0.199188232421875, 0.219970703125, 0.240753173828125, 0.26153564453125, 0.282318115234375, 0.3031005859375, 0.323883056640625, 0.34466552734375, 0.365447998046875, 0.38623046875, 0.407012939453125, 0.42779541015625, 0.448577880859375, 0.4693603515625, 0.490142822265625, 0.51092529296875, 0.531707763671875, 0.552490234375, 0.573272705078125, 0.59405517578125, 0.614837646484375, 0.6356201171875, 0.656402587890625, 0.67718505859375, 0.697967529296875, 0.71875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 4.0, 8.0, 9.0, 15.0, 14.0, 20.0, 24.0, 33.0, 58.0, 82.0, 136.0, 174.0, 295.0, 524.0, 1240.0, 3153.0, 13020.0, 122266.0, 808242.0, 83790.0, 10315.0, 2733.0, 1074.0, 513.0, 283.0, 183.0, 108.0, 63.0, 40.0, 37.0, 17.0, 13.0, 16.0, 15.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-2.419921875, -2.3475341796875, -2.275146484375, -2.2027587890625, -2.13037109375, -2.0579833984375, -1.985595703125, -1.9132080078125, -1.8408203125, -1.7684326171875, -1.696044921875, -1.6236572265625, -1.55126953125, -1.4788818359375, -1.406494140625, -1.3341064453125, -1.26171875, -1.1893310546875, -1.116943359375, -1.0445556640625, -0.97216796875, -0.8997802734375, -0.827392578125, -0.7550048828125, -0.6826171875, -0.6102294921875, -0.537841796875, -0.4654541015625, -0.39306640625, -0.3206787109375, -0.248291015625, -0.1759033203125, -0.103515625, -0.0311279296875, 0.041259765625, 0.1136474609375, 0.18603515625, 0.2584228515625, 0.330810546875, 0.4031982421875, 0.4755859375, 0.5479736328125, 0.620361328125, 0.6927490234375, 0.76513671875, 0.8375244140625, 0.909912109375, 0.9822998046875, 1.0546875, 1.1270751953125, 1.199462890625, 1.2718505859375, 1.34423828125, 1.4166259765625, 1.489013671875, 1.5614013671875, 1.6337890625, 1.7061767578125, 1.778564453125, 1.8509521484375, 1.92333984375, 1.9957275390625, 2.068115234375, 2.1405029296875, 2.212890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 8.0, 10.0, 20.0, 25.0, 28.0, 33.0, 41.0, 35.0, 44.0, 48.0, 53.0, 58.0, 65.0, 55.0, 49.0, 44.0, 50.0, 48.0, 41.0, 40.0, 34.0, 29.0, 25.0, 20.0, 18.0, 9.0, 7.0, 7.0, 7.0, 6.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.271148681640625, -2.18096923828125, -2.090789794921875, -2.0006103515625, -1.910430908203125, -1.82025146484375, -1.730072021484375, -1.639892578125, -1.549713134765625, -1.45953369140625, -1.369354248046875, -1.2791748046875, -1.188995361328125, -1.09881591796875, -1.008636474609375, -0.91845703125, -0.828277587890625, -0.73809814453125, -0.647918701171875, -0.5577392578125, -0.467559814453125, -0.37738037109375, -0.287200927734375, -0.197021484375, -0.106842041015625, -0.01666259765625, 0.073516845703125, 0.1636962890625, 0.253875732421875, 0.34405517578125, 0.434234619140625, 0.5244140625, 0.614593505859375, 0.70477294921875, 0.794952392578125, 0.8851318359375, 0.975311279296875, 1.06549072265625, 1.155670166015625, 1.245849609375, 1.336029052734375, 1.42620849609375, 1.516387939453125, 1.6065673828125, 1.696746826171875, 1.78692626953125, 1.877105712890625, 1.96728515625, 2.057464599609375, 2.14764404296875, 2.237823486328125, 2.3280029296875, 2.418182373046875, 2.50836181640625, 2.598541259765625, 2.688720703125, 2.778900146484375, 2.86907958984375, 2.959259033203125, 3.0494384765625, 3.139617919921875, 3.22979736328125, 3.319976806640625, 3.41015625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 10.0, 25.0, 32.0, 46.0, 108.0, 201.0, 460.0, 1262.0, 5820.0, 69834.0, 908248.0, 55364.0, 5108.0, 1215.0, 401.0, 188.0, 80.0, 53.0, 30.0, 17.0, 13.0, 7.0, 9.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3349609375, -1.2938385009765625, -1.252716064453125, -1.2115936279296875, -1.17047119140625, -1.1293487548828125, -1.088226318359375, -1.0471038818359375, -1.0059814453125, -0.9648590087890625, -0.923736572265625, -0.8826141357421875, -0.84149169921875, -0.8003692626953125, -0.759246826171875, -0.7181243896484375, -0.677001953125, -0.6358795166015625, -0.594757080078125, -0.5536346435546875, -0.51251220703125, -0.4713897705078125, -0.430267333984375, -0.3891448974609375, -0.3480224609375, -0.3069000244140625, -0.265777587890625, -0.2246551513671875, -0.18353271484375, -0.1424102783203125, -0.101287841796875, -0.0601654052734375, -0.01904296875, 0.0220794677734375, 0.063201904296875, 0.1043243408203125, 0.14544677734375, 0.1865692138671875, 0.227691650390625, 0.2688140869140625, 0.3099365234375, 0.3510589599609375, 0.392181396484375, 0.4333038330078125, 0.47442626953125, 0.5155487060546875, 0.556671142578125, 0.5977935791015625, 0.638916015625, 0.6800384521484375, 0.721160888671875, 0.7622833251953125, 0.80340576171875, 0.8445281982421875, 0.885650634765625, 0.9267730712890625, 0.9678955078125, 1.0090179443359375, 1.050140380859375, 1.0912628173828125, 1.13238525390625, 1.1735076904296875, 1.214630126953125, 1.2557525634765625, 1.296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 6.0, 3.0, 4.0, 4.0, 10.0, 5.0, 11.0, 14.0, 11.0, 20.0, 23.0, 31.0, 39.0, 94.0, 119.0, 145.0, 163.0, 74.0, 43.0, 50.0, 34.0, 24.0, 18.0, 18.0, 11.0, 8.0, 4.0, 5.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00025391578674316406, -0.0002478398382663727, -0.0002417638897895813, -0.00023568794131278992, -0.00022961199283599854, -0.00022353604435920715, -0.00021746009588241577, -0.0002113841474056244, -0.000205308198928833, -0.00019923225045204163, -0.00019315630197525024, -0.00018708035349845886, -0.00018100440502166748, -0.0001749284565448761, -0.00016885250806808472, -0.00016277655959129333, -0.00015670061111450195, -0.00015062466263771057, -0.0001445487141609192, -0.0001384727656841278, -0.00013239681720733643, -0.00012632086873054504, -0.00012024492025375366, -0.00011416897177696228, -0.0001080930233001709, -0.00010201707482337952, -9.594112634658813e-05, -8.986517786979675e-05, -8.378922939300537e-05, -7.771328091621399e-05, -7.163733243942261e-05, -6.556138396263123e-05, -5.9485435485839844e-05, -5.340948700904846e-05, -4.733353853225708e-05, -4.12575900554657e-05, -3.5181641578674316e-05, -2.9105693101882935e-05, -2.3029744625091553e-05, -1.695379614830017e-05, -1.0877847671508789e-05, -4.801899194717407e-06, 1.2740492820739746e-06, 7.3499977588653564e-06, 1.3425946235656738e-05, 1.950189471244812e-05, 2.5577843189239502e-05, 3.1653791666030884e-05, 3.7729740142822266e-05, 4.380568861961365e-05, 4.988163709640503e-05, 5.595758557319641e-05, 6.203353404998779e-05, 6.810948252677917e-05, 7.418543100357056e-05, 8.026137948036194e-05, 8.633732795715332e-05, 9.24132764339447e-05, 9.848922491073608e-05, 0.00010456517338752747, 0.00011064112186431885, 0.00011671707034111023, 0.0001227930188179016, 0.000128868967294693, 0.00013494491577148438]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 4.0, 6.0, 14.0, 15.0, 26.0, 30.0, 37.0, 47.0, 56.0, 89.0, 135.0, 182.0, 350.0, 551.0, 1055.0, 2117.0, 5610.0, 20081.0, 101511.0, 691769.0, 180445.0, 30734.0, 7885.0, 2733.0, 1226.0, 674.0, 349.0, 229.0, 149.0, 98.0, 74.0, 63.0, 40.0, 24.0, 31.0, 21.0, 11.0, 16.0, 10.0, 12.0, 7.0, 7.0, 3.0, 2.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.65087890625, -0.6264495849609375, -0.602020263671875, -0.5775909423828125, -0.55316162109375, -0.5287322998046875, -0.504302978515625, -0.4798736572265625, -0.4554443359375, -0.4310150146484375, -0.406585693359375, -0.3821563720703125, -0.35772705078125, -0.3332977294921875, -0.308868408203125, -0.2844390869140625, -0.260009765625, -0.2355804443359375, -0.211151123046875, -0.1867218017578125, -0.16229248046875, -0.1378631591796875, -0.113433837890625, -0.0890045166015625, -0.0645751953125, -0.0401458740234375, -0.015716552734375, 0.0087127685546875, 0.03314208984375, 0.0575714111328125, 0.082000732421875, 0.1064300537109375, 0.130859375, 0.1552886962890625, 0.179718017578125, 0.2041473388671875, 0.22857666015625, 0.2530059814453125, 0.277435302734375, 0.3018646240234375, 0.3262939453125, 0.3507232666015625, 0.375152587890625, 0.3995819091796875, 0.42401123046875, 0.4484405517578125, 0.472869873046875, 0.4972991943359375, 0.521728515625, 0.5461578369140625, 0.570587158203125, 0.5950164794921875, 0.61944580078125, 0.6438751220703125, 0.668304443359375, 0.6927337646484375, 0.7171630859375, 0.7415924072265625, 0.766021728515625, 0.7904510498046875, 0.81488037109375, 0.8393096923828125, 0.863739013671875, 0.8881683349609375, 0.91259765625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 14.0, 26.0, 26.0, 40.0, 49.0, 71.0, 97.0, 157.0, 157.0, 126.0, 76.0, 58.0, 32.0, 23.0, 17.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.431640625, -1.3940277099609375, -1.356414794921875, -1.3188018798828125, -1.28118896484375, -1.2435760498046875, -1.205963134765625, -1.1683502197265625, -1.1307373046875, -1.0931243896484375, -1.055511474609375, -1.0178985595703125, -0.98028564453125, -0.9426727294921875, -0.905059814453125, -0.8674468994140625, -0.829833984375, -0.7922210693359375, -0.754608154296875, -0.7169952392578125, -0.67938232421875, -0.6417694091796875, -0.604156494140625, -0.5665435791015625, -0.5289306640625, -0.4913177490234375, -0.453704833984375, -0.4160919189453125, -0.37847900390625, -0.3408660888671875, -0.303253173828125, -0.2656402587890625, -0.22802734375, -0.1904144287109375, -0.152801513671875, -0.1151885986328125, -0.07757568359375, -0.0399627685546875, -0.002349853515625, 0.0352630615234375, 0.0728759765625, 0.1104888916015625, 0.148101806640625, 0.1857147216796875, 0.22332763671875, 0.2609405517578125, 0.298553466796875, 0.3361663818359375, 0.373779296875, 0.4113922119140625, 0.449005126953125, 0.4866180419921875, 0.52423095703125, 0.5618438720703125, 0.599456787109375, 0.6370697021484375, 0.6746826171875, 0.7122955322265625, 0.749908447265625, 0.7875213623046875, 0.82513427734375, 0.8627471923828125, 0.900360107421875, 0.9379730224609375, 0.9755859375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 29.0, 65.0, 203.0, 354.0, 202.0, 82.0, 35.0, 12.0, 6.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.49456024169922, -29.683015823364258, -28.871469497680664, -28.059925079345703, -27.248380661010742, -26.43683624267578, -25.625289916992188, -24.813745498657227, -24.002201080322266, -23.190656661987305, -22.37911033630371, -21.56756591796875, -20.75602149963379, -19.944477081298828, -19.132930755615234, -18.321386337280273, -17.50984001159668, -16.69829559326172, -15.886750221252441, -15.075204849243164, -14.263660430908203, -13.452115058898926, -12.640569686889648, -11.829025268554688, -11.01747989654541, -10.205934524536133, -9.394390106201172, -8.582844734191895, -7.771299839019775, -6.959754943847656, -6.148209571838379, -5.33666467666626, -4.525121688842773, -3.7135767936706543, -2.902031660079956, -2.090486526489258, -1.2789416313171387, -0.46739673614501953, 0.3441486358642578, 1.155693531036377, 1.967238426208496, 2.7787833213806152, 3.5903284549713135, 4.401873588562012, 5.213418483734131, 6.02496337890625, 6.836508750915527, 7.6480536460876465, 8.459598541259766, 9.271143913269043, 10.082688331604004, 10.894233703613281, 11.705778121948242, 12.51732349395752, 13.328868865966797, 14.140413284301758, 14.951958656311035, 15.763504028320312, 16.575048446655273, 17.386592864990234, 18.198139190673828, 19.00968360900879, 19.82122802734375, 20.632774353027344, 21.444318771362305]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 13.0, 12.0, 17.0, 15.0, 20.0, 23.0, 25.0, 37.0, 24.0, 39.0, 30.0, 42.0, 58.0, 58.0, 60.0, 59.0, 56.0, 54.0, 37.0, 42.0, 43.0, 28.0, 28.0, 29.0, 22.0, 26.0, 17.0, 16.0, 10.0, 7.0, 11.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.786921501159668, -11.452144622802734, -11.1173677444458, -10.782590866088867, -10.447813987731934, -10.113037109375, -9.778260231018066, -9.443483352661133, -9.1087064743042, -8.773929595947266, -8.439152717590332, -8.104375839233398, -7.769598960876465, -7.434822082519531, -7.100045204162598, -6.765268325805664, -6.430490970611572, -6.095714092254639, -5.760937213897705, -5.4261603355407715, -5.091383457183838, -4.756606578826904, -4.4218292236328125, -4.087052345275879, -3.7522757053375244, -3.417498826980591, -3.0827219486236572, -2.7479448318481445, -2.413167953491211, -2.0783910751342773, -1.7436141967773438, -1.4088373184204102, -1.0740604400634766, -0.739283561706543, -0.4045066237449646, -0.06972968578338623, 0.26504719257354736, 0.599824070930481, 0.9346010684967041, 1.2693779468536377, 1.6041548252105713, 1.9389317035675049, 2.2737085819244385, 2.608485698699951, 2.9432625770568848, 3.2780394554138184, 3.612816333770752, 3.9475932121276855, 4.282370090484619, 4.617146968841553, 4.951923847198486, 5.28670072555542, 5.6214776039123535, 5.956254482269287, 6.291031837463379, 6.6258087158203125, 6.960585594177246, 7.29536247253418, 7.630139350891113, 7.964916229248047, 8.29969310760498, 8.634469985961914, 8.969246864318848, 9.304023742675781, 9.638800621032715]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 14.0, 18.0, 41.0, 62.0, 127.0, 284.0, 548.0, 1415.0, 5396.0, 85282.0, 4047531.0, 47111.0, 4241.0, 1214.0, 490.0, 243.0, 97.0, 49.0, 45.0, 21.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.78619384765625, -2.6915283203125, -2.59686279296875, -2.502197265625, -2.40753173828125, -2.3128662109375, -2.21820068359375, -2.12353515625, -2.02886962890625, -1.9342041015625, -1.83953857421875, -1.744873046875, -1.65020751953125, -1.5555419921875, -1.46087646484375, -1.3662109375, -1.27154541015625, -1.1768798828125, -1.08221435546875, -0.987548828125, -0.89288330078125, -0.7982177734375, -0.70355224609375, -0.60888671875, -0.51422119140625, -0.4195556640625, -0.32489013671875, -0.230224609375, -0.13555908203125, -0.0408935546875, 0.05377197265625, 0.1484375, 0.24310302734375, 0.3377685546875, 0.43243408203125, 0.527099609375, 0.62176513671875, 0.7164306640625, 0.81109619140625, 0.90576171875, 1.00042724609375, 1.0950927734375, 1.18975830078125, 1.284423828125, 1.37908935546875, 1.4737548828125, 1.56842041015625, 1.6630859375, 1.75775146484375, 1.8524169921875, 1.94708251953125, 2.041748046875, 2.13641357421875, 2.2310791015625, 2.32574462890625, 2.42041015625, 2.51507568359375, 2.6097412109375, 2.70440673828125, 2.799072265625, 2.89373779296875, 2.9884033203125, 3.08306884765625, 3.177734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 9.0, 18.0, 11.0, 19.0, 30.0, 28.0, 38.0, 39.0, 42.0, 39.0, 46.0, 52.0, 45.0, 52.0, 50.0, 48.0, 46.0, 42.0, 41.0, 36.0, 33.0, 37.0, 24.0, 26.0, 26.0, 17.0, 20.0, 14.0, 6.0, 10.0, 7.0, 11.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5048828125, -0.48712158203125, -0.4693603515625, -0.45159912109375, -0.433837890625, -0.41607666015625, -0.3983154296875, -0.38055419921875, -0.36279296875, -0.34503173828125, -0.3272705078125, -0.30950927734375, -0.291748046875, -0.27398681640625, -0.2562255859375, -0.23846435546875, -0.220703125, -0.20294189453125, -0.1851806640625, -0.16741943359375, -0.149658203125, -0.13189697265625, -0.1141357421875, -0.09637451171875, -0.07861328125, -0.06085205078125, -0.0430908203125, -0.02532958984375, -0.007568359375, 0.01019287109375, 0.0279541015625, 0.04571533203125, 0.0634765625, 0.08123779296875, 0.0989990234375, 0.11676025390625, 0.134521484375, 0.15228271484375, 0.1700439453125, 0.18780517578125, 0.20556640625, 0.22332763671875, 0.2410888671875, 0.25885009765625, 0.276611328125, 0.29437255859375, 0.3121337890625, 0.32989501953125, 0.34765625, 0.36541748046875, 0.3831787109375, 0.40093994140625, 0.418701171875, 0.43646240234375, 0.4542236328125, 0.47198486328125, 0.48974609375, 0.50750732421875, 0.5252685546875, 0.54302978515625, 0.560791015625, 0.57855224609375, 0.5963134765625, 0.61407470703125, 0.6318359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 5.0, 2.0, 9.0, 14.0, 13.0, 14.0, 38.0, 51.0, 77.0, 106.0, 152.0, 262.0, 371.0, 601.0, 966.0, 1648.0, 3163.0, 6618.0, 18303.0, 81299.0, 1502227.0, 2430995.0, 108641.0, 22412.0, 7917.0, 3600.0, 1884.0, 1064.0, 667.0, 406.0, 252.0, 166.0, 106.0, 83.0, 51.0, 45.0, 13.0, 14.0, 13.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.4572296142578125, -1.414459228515625, -1.3716888427734375, -1.32891845703125, -1.2861480712890625, -1.243377685546875, -1.2006072998046875, -1.1578369140625, -1.1150665283203125, -1.072296142578125, -1.0295257568359375, -0.98675537109375, -0.9439849853515625, -0.901214599609375, -0.8584442138671875, -0.815673828125, -0.7729034423828125, -0.730133056640625, -0.6873626708984375, -0.64459228515625, -0.6018218994140625, -0.559051513671875, -0.5162811279296875, -0.4735107421875, -0.4307403564453125, -0.387969970703125, -0.3451995849609375, -0.30242919921875, -0.2596588134765625, -0.216888427734375, -0.1741180419921875, -0.13134765625, -0.0885772705078125, -0.045806884765625, -0.0030364990234375, 0.03973388671875, 0.0825042724609375, 0.125274658203125, 0.1680450439453125, 0.2108154296875, 0.2535858154296875, 0.296356201171875, 0.3391265869140625, 0.38189697265625, 0.4246673583984375, 0.467437744140625, 0.5102081298828125, 0.552978515625, 0.5957489013671875, 0.638519287109375, 0.6812896728515625, 0.72406005859375, 0.7668304443359375, 0.809600830078125, 0.8523712158203125, 0.8951416015625, 0.9379119873046875, 0.980682373046875, 1.0234527587890625, 1.06622314453125, 1.1089935302734375, 1.151763916015625, 1.1945343017578125, 1.2373046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 8.0, 8.0, 14.0, 31.0, 49.0, 104.0, 253.0, 723.0, 1447.0, 887.0, 268.0, 122.0, 53.0, 29.0, 22.0, 11.0, 12.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.556640625, -2.488616943359375, -2.42059326171875, -2.352569580078125, -2.2845458984375, -2.216522216796875, -2.14849853515625, -2.080474853515625, -2.012451171875, -1.944427490234375, -1.87640380859375, -1.808380126953125, -1.7403564453125, -1.672332763671875, -1.60430908203125, -1.536285400390625, -1.46826171875, -1.400238037109375, -1.33221435546875, -1.264190673828125, -1.1961669921875, -1.128143310546875, -1.06011962890625, -0.992095947265625, -0.924072265625, -0.856048583984375, -0.78802490234375, -0.720001220703125, -0.6519775390625, -0.583953857421875, -0.51593017578125, -0.447906494140625, -0.3798828125, -0.311859130859375, -0.24383544921875, -0.175811767578125, -0.1077880859375, -0.039764404296875, 0.02825927734375, 0.096282958984375, 0.164306640625, 0.232330322265625, 0.30035400390625, 0.368377685546875, 0.4364013671875, 0.504425048828125, 0.57244873046875, 0.640472412109375, 0.70849609375, 0.776519775390625, 0.84454345703125, 0.912567138671875, 0.9805908203125, 1.048614501953125, 1.11663818359375, 1.184661865234375, 1.252685546875, 1.320709228515625, 1.38873291015625, 1.456756591796875, 1.5247802734375, 1.592803955078125, 1.66082763671875, 1.728851318359375, 1.796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 11.0, 15.0, 23.0, 46.0, 65.0, 89.0, 125.0, 150.0, 148.0, 96.0, 86.0, 36.0, 23.0, 16.0, 12.0, 9.0, 8.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.69163990020752, -8.415185928344727, -8.138731002807617, -7.862277030944824, -7.585823059082031, -7.309369087219238, -7.032914638519287, -6.756460189819336, -6.480006217956543, -6.20355224609375, -5.927097797393799, -5.650643348693848, -5.374189376831055, -5.097735404968262, -4.8212809562683105, -4.544826507568359, -4.268372535705566, -3.9919183254241943, -3.7154641151428223, -3.43900990486145, -3.162555694580078, -2.886101484298706, -2.609647274017334, -2.333193063735962, -2.05673885345459, -1.7802846431732178, -1.5038304328918457, -1.2273762226104736, -0.9509220123291016, -0.6744678020477295, -0.3980135917663574, -0.12155938148498535, 0.1548938751220703, 0.4313480854034424, 0.7078022956848145, 0.9842565059661865, 1.2607107162475586, 1.5371649265289307, 1.8136191368103027, 2.090073347091675, 2.366527557373047, 2.642981767654419, 2.919435977935791, 3.195890188217163, 3.472344398498535, 3.7487986087799072, 4.025252819061279, 4.3017072677612305, 4.578161239624023, 4.854615211486816, 5.131069660186768, 5.407524108886719, 5.683978080749512, 5.960432052612305, 6.236886501312256, 6.513340950012207, 6.789794921875, 7.066248893737793, 7.342703342437744, 7.619157791137695, 7.895611763000488, 8.172065734863281, 8.44852066040039, 8.724974632263184, 9.001428604125977]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 3.0, 7.0, 6.0, 10.0, 10.0, 7.0, 11.0, 15.0, 15.0, 18.0, 27.0, 23.0, 29.0, 25.0, 41.0, 35.0, 39.0, 39.0, 45.0, 42.0, 41.0, 55.0, 37.0, 42.0, 49.0, 32.0, 26.0, 40.0, 26.0, 32.0, 23.0, 17.0, 20.0, 17.0, 25.0, 14.0, 9.0, 8.0, 7.0, 7.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-5.3482346534729, -5.184440612792969, -5.020646095275879, -4.856852054595947, -4.693058013916016, -4.529263973236084, -4.365469455718994, -4.2016754150390625, -4.037881374359131, -3.87408709526062, -3.7102930545806885, -3.5464987754821777, -3.382704734802246, -3.2189104557037354, -3.0551161766052246, -2.891322135925293, -2.7275278568267822, -2.5637335777282715, -2.39993953704834, -2.236145257949829, -2.0723512172698975, -1.9085569381713867, -1.7447627782821655, -1.5809686183929443, -1.4171744585037231, -1.253380298614502, -1.0895861387252808, -0.9257919192314148, -0.7619977593421936, -0.5982035994529724, -0.43440937995910645, -0.27061522006988525, -0.10682106018066406, 0.05697311460971832, 0.2207672894001007, 0.3845614790916443, 0.5483556389808655, 0.7121497988700867, 0.8759440183639526, 1.0397381782531738, 1.203532338142395, 1.3673264980316162, 1.5311206579208374, 1.6949148178100586, 1.8587090969085693, 2.022503137588501, 2.1862974166870117, 2.3500914573669434, 2.513885736465454, 2.677680015563965, 2.8414740562438965, 3.0052683353424072, 3.169062376022339, 3.3328566551208496, 3.4966506958007812, 3.660444974899292, 3.8242392539978027, 3.9880335330963135, 4.151827812194824, 4.315621852874756, 4.4794158935546875, 4.643209934234619, 4.807004451751709, 4.970798492431641, 5.134592533111572]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 8.0, 10.0, 10.0, 18.0, 29.0, 34.0, 54.0, 105.0, 129.0, 214.0, 398.0, 676.0, 1184.0, 2176.0, 4484.0, 9252.0, 21273.0, 54457.0, 157816.0, 410868.0, 247789.0, 82031.0, 30511.0, 12682.0, 5880.0, 2912.0, 1518.0, 796.0, 483.0, 272.0, 153.0, 118.0, 69.0, 41.0, 31.0, 18.0, 17.0, 12.0, 3.0, 3.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.85693359375, -0.8290176391601562, -0.8011016845703125, -0.7731857299804688, -0.745269775390625, -0.7173538208007812, -0.6894378662109375, -0.6615219116210938, -0.63360595703125, -0.6056900024414062, -0.5777740478515625, -0.5498580932617188, -0.521942138671875, -0.49402618408203125, -0.4661102294921875, -0.43819427490234375, -0.4102783203125, -0.38236236572265625, -0.3544464111328125, -0.32653045654296875, -0.298614501953125, -0.27069854736328125, -0.2427825927734375, -0.21486663818359375, -0.18695068359375, -0.15903472900390625, -0.1311187744140625, -0.10320281982421875, -0.075286865234375, -0.04737091064453125, -0.0194549560546875, 0.00846099853515625, 0.036376953125, 0.06429290771484375, 0.0922088623046875, 0.12012481689453125, 0.148040771484375, 0.17595672607421875, 0.2038726806640625, 0.23178863525390625, 0.25970458984375, 0.28762054443359375, 0.3155364990234375, 0.34345245361328125, 0.371368408203125, 0.39928436279296875, 0.4272003173828125, 0.45511627197265625, 0.4830322265625, 0.5109481811523438, 0.5388641357421875, 0.5667800903320312, 0.594696044921875, 0.6226119995117188, 0.6505279541015625, 0.6784439086914062, 0.70635986328125, 0.7342758178710938, 0.7621917724609375, 0.7901077270507812, 0.818023681640625, 0.8459396362304688, 0.8738555908203125, 0.9017715454101562, 0.9296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 7.0, 5.0, 13.0, 18.0, 14.0, 25.0, 14.0, 24.0, 18.0, 34.0, 39.0, 31.0, 29.0, 40.0, 61.0, 50.0, 55.0, 64.0, 38.0, 40.0, 43.0, 41.0, 38.0, 29.0, 31.0, 24.0, 28.0, 21.0, 9.0, 24.0, 13.0, 17.0, 8.0, 11.0, 10.0, 6.0, 7.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.556640625, -0.5389938354492188, -0.5213470458984375, -0.5037002563476562, -0.486053466796875, -0.46840667724609375, -0.4507598876953125, -0.43311309814453125, -0.41546630859375, -0.39781951904296875, -0.3801727294921875, -0.36252593994140625, -0.344879150390625, -0.32723236083984375, -0.3095855712890625, -0.29193878173828125, -0.2742919921875, -0.25664520263671875, -0.2389984130859375, -0.22135162353515625, -0.203704833984375, -0.18605804443359375, -0.1684112548828125, -0.15076446533203125, -0.13311767578125, -0.11547088623046875, -0.0978240966796875, -0.08017730712890625, -0.062530517578125, -0.04488372802734375, -0.0272369384765625, -0.00959014892578125, 0.008056640625, 0.02570343017578125, 0.0433502197265625, 0.06099700927734375, 0.078643798828125, 0.09629058837890625, 0.1139373779296875, 0.13158416748046875, 0.14923095703125, 0.16687774658203125, 0.1845245361328125, 0.20217132568359375, 0.219818115234375, 0.23746490478515625, 0.2551116943359375, 0.27275848388671875, 0.2904052734375, 0.30805206298828125, 0.3256988525390625, 0.34334564208984375, 0.360992431640625, 0.37863922119140625, 0.3962860107421875, 0.41393280029296875, 0.43157958984375, 0.44922637939453125, 0.4668731689453125, 0.48451995849609375, 0.502166748046875, 0.5198135375976562, 0.5374603271484375, 0.5551071166992188, 0.57275390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 12.0, 4.0, 6.0, 11.0, 15.0, 21.0, 32.0, 30.0, 40.0, 67.0, 106.0, 158.0, 254.0, 416.0, 890.0, 1881.0, 5218.0, 18570.0, 107643.0, 725971.0, 152599.0, 23829.0, 6206.0, 2269.0, 1008.0, 500.0, 280.0, 163.0, 107.0, 80.0, 46.0, 33.0, 23.0, 19.0, 12.0, 10.0, 9.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6845703125, -1.629486083984375, -1.57440185546875, -1.519317626953125, -1.4642333984375, -1.409149169921875, -1.35406494140625, -1.298980712890625, -1.243896484375, -1.188812255859375, -1.13372802734375, -1.078643798828125, -1.0235595703125, -0.968475341796875, -0.91339111328125, -0.858306884765625, -0.80322265625, -0.748138427734375, -0.69305419921875, -0.637969970703125, -0.5828857421875, -0.527801513671875, -0.47271728515625, -0.417633056640625, -0.362548828125, -0.307464599609375, -0.25238037109375, -0.197296142578125, -0.1422119140625, -0.087127685546875, -0.03204345703125, 0.023040771484375, 0.078125, 0.133209228515625, 0.18829345703125, 0.243377685546875, 0.2984619140625, 0.353546142578125, 0.40863037109375, 0.463714599609375, 0.518798828125, 0.573883056640625, 0.62896728515625, 0.684051513671875, 0.7391357421875, 0.794219970703125, 0.84930419921875, 0.904388427734375, 0.95947265625, 1.014556884765625, 1.06964111328125, 1.124725341796875, 1.1798095703125, 1.234893798828125, 1.28997802734375, 1.345062255859375, 1.400146484375, 1.455230712890625, 1.51031494140625, 1.565399169921875, 1.6204833984375, 1.675567626953125, 1.73065185546875, 1.785736083984375, 1.8408203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 18.0, 13.0, 28.0, 24.0, 24.0, 30.0, 34.0, 32.0, 40.0, 30.0, 42.0, 48.0, 56.0, 43.0, 59.0, 41.0, 52.0, 47.0, 38.0, 34.0, 43.0, 24.0, 29.0, 16.0, 20.0, 16.0, 13.0, 19.0, 8.0, 5.0, 6.0, 3.0, 3.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.21484375, -2.1429443359375, -2.071044921875, -1.9991455078125, -1.92724609375, -1.8553466796875, -1.783447265625, -1.7115478515625, -1.6396484375, -1.5677490234375, -1.495849609375, -1.4239501953125, -1.35205078125, -1.2801513671875, -1.208251953125, -1.1363525390625, -1.064453125, -0.9925537109375, -0.920654296875, -0.8487548828125, -0.77685546875, -0.7049560546875, -0.633056640625, -0.5611572265625, -0.4892578125, -0.4173583984375, -0.345458984375, -0.2735595703125, -0.20166015625, -0.1297607421875, -0.057861328125, 0.0140380859375, 0.0859375, 0.1578369140625, 0.229736328125, 0.3016357421875, 0.37353515625, 0.4454345703125, 0.517333984375, 0.5892333984375, 0.6611328125, 0.7330322265625, 0.804931640625, 0.8768310546875, 0.94873046875, 1.0206298828125, 1.092529296875, 1.1644287109375, 1.236328125, 1.3082275390625, 1.380126953125, 1.4520263671875, 1.52392578125, 1.5958251953125, 1.667724609375, 1.7396240234375, 1.8115234375, 1.8834228515625, 1.955322265625, 2.0272216796875, 2.09912109375, 2.1710205078125, 2.242919921875, 2.3148193359375, 2.38671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 5.0, 13.0, 10.0, 9.0, 22.0, 54.0, 86.0, 197.0, 575.0, 2242.0, 20413.0, 878815.0, 138108.0, 6191.0, 1119.0, 339.0, 173.0, 70.0, 44.0, 23.0, 14.0, 4.0, 7.0, 7.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6923828125, -1.635528564453125, -1.57867431640625, -1.521820068359375, -1.4649658203125, -1.408111572265625, -1.35125732421875, -1.294403076171875, -1.237548828125, -1.180694580078125, -1.12384033203125, -1.066986083984375, -1.0101318359375, -0.953277587890625, -0.89642333984375, -0.839569091796875, -0.78271484375, -0.725860595703125, -0.66900634765625, -0.612152099609375, -0.5552978515625, -0.498443603515625, -0.44158935546875, -0.384735107421875, -0.327880859375, -0.271026611328125, -0.21417236328125, -0.157318115234375, -0.1004638671875, -0.043609619140625, 0.01324462890625, 0.070098876953125, 0.126953125, 0.183807373046875, 0.24066162109375, 0.297515869140625, 0.3543701171875, 0.411224365234375, 0.46807861328125, 0.524932861328125, 0.581787109375, 0.638641357421875, 0.69549560546875, 0.752349853515625, 0.8092041015625, 0.866058349609375, 0.92291259765625, 0.979766845703125, 1.03662109375, 1.093475341796875, 1.15032958984375, 1.207183837890625, 1.2640380859375, 1.320892333984375, 1.37774658203125, 1.434600830078125, 1.491455078125, 1.548309326171875, 1.60516357421875, 1.662017822265625, 1.7188720703125, 1.775726318359375, 1.83258056640625, 1.889434814453125, 1.9462890625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 2.0, 6.0, 4.0, 10.0, 10.0, 6.0, 18.0, 27.0, 25.0, 40.0, 59.0, 99.0, 150.0, 184.0, 109.0, 69.0, 52.0, 40.0, 20.0, 20.0, 13.0, 10.0, 8.0, 8.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029730796813964844, -0.000290602445602417, -0.00028389692306518555, -0.0002771914005279541, -0.00027048587799072266, -0.0002637803554534912, -0.00025707483291625977, -0.0002503693103790283, -0.00024366378784179688, -0.00023695826530456543, -0.00023025274276733398, -0.00022354722023010254, -0.0002168416976928711, -0.00021013617515563965, -0.0002034306526184082, -0.00019672513008117676, -0.0001900196075439453, -0.00018331408500671387, -0.00017660856246948242, -0.00016990303993225098, -0.00016319751739501953, -0.00015649199485778809, -0.00014978647232055664, -0.0001430809497833252, -0.00013637542724609375, -0.0001296699047088623, -0.00012296438217163086, -0.00011625885963439941, -0.00010955333709716797, -0.00010284781455993652, -9.614229202270508e-05, -8.943676948547363e-05, -8.273124694824219e-05, -7.602572441101074e-05, -6.93202018737793e-05, -6.261467933654785e-05, -5.5909156799316406e-05, -4.920363426208496e-05, -4.2498111724853516e-05, -3.579258918762207e-05, -2.9087066650390625e-05, -2.238154411315918e-05, -1.5676021575927734e-05, -8.970499038696289e-06, -2.2649765014648438e-06, 4.4405460357666016e-06, 1.1146068572998047e-05, 1.7851591110229492e-05, 2.4557113647460938e-05, 3.126263618469238e-05, 3.796815872192383e-05, 4.4673681259155273e-05, 5.137920379638672e-05, 5.8084726333618164e-05, 6.479024887084961e-05, 7.149577140808105e-05, 7.82012939453125e-05, 8.490681648254395e-05, 9.161233901977539e-05, 9.831786155700684e-05, 0.00010502338409423828, 0.00011172890663146973, 0.00011843442916870117, 0.00012513995170593262, 0.00013184547424316406]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 7.0, 6.0, 7.0, 14.0, 11.0, 28.0, 43.0, 50.0, 64.0, 98.0, 156.0, 232.0, 396.0, 649.0, 1379.0, 3070.0, 7905.0, 29195.0, 221613.0, 692624.0, 67927.0, 14154.0, 4615.0, 1978.0, 947.0, 494.0, 315.0, 174.0, 118.0, 87.0, 45.0, 36.0, 33.0, 19.0, 15.0, 10.0, 8.0, 4.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.822265625, -0.7941436767578125, -0.766021728515625, -0.7378997802734375, -0.70977783203125, -0.6816558837890625, -0.653533935546875, -0.6254119873046875, -0.5972900390625, -0.5691680908203125, -0.541046142578125, -0.5129241943359375, -0.48480224609375, -0.4566802978515625, -0.428558349609375, -0.4004364013671875, -0.372314453125, -0.3441925048828125, -0.316070556640625, -0.2879486083984375, -0.25982666015625, -0.2317047119140625, -0.203582763671875, -0.1754608154296875, -0.1473388671875, -0.1192169189453125, -0.091094970703125, -0.0629730224609375, -0.03485107421875, -0.0067291259765625, 0.021392822265625, 0.0495147705078125, 0.07763671875, 0.1057586669921875, 0.133880615234375, 0.1620025634765625, 0.19012451171875, 0.2182464599609375, 0.246368408203125, 0.2744903564453125, 0.3026123046875, 0.3307342529296875, 0.358856201171875, 0.3869781494140625, 0.41510009765625, 0.4432220458984375, 0.471343994140625, 0.4994659423828125, 0.527587890625, 0.5557098388671875, 0.583831787109375, 0.6119537353515625, 0.64007568359375, 0.6681976318359375, 0.696319580078125, 0.7244415283203125, 0.7525634765625, 0.7806854248046875, 0.808807373046875, 0.8369293212890625, 0.86505126953125, 0.8931732177734375, 0.921295166015625, 0.9494171142578125, 0.9775390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 9.0, 8.0, 15.0, 22.0, 25.0, 32.0, 56.0, 58.0, 80.0, 134.0, 159.0, 118.0, 90.0, 34.0, 46.0, 30.0, 16.0, 16.0, 17.0, 9.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7724609375, -0.7419891357421875, -0.711517333984375, -0.6810455322265625, -0.65057373046875, -0.6201019287109375, -0.589630126953125, -0.5591583251953125, -0.5286865234375, -0.4982147216796875, -0.467742919921875, -0.4372711181640625, -0.40679931640625, -0.3763275146484375, -0.345855712890625, -0.3153839111328125, -0.284912109375, -0.2544403076171875, -0.223968505859375, -0.1934967041015625, -0.16302490234375, -0.1325531005859375, -0.102081298828125, -0.0716094970703125, -0.0411376953125, -0.0106658935546875, 0.019805908203125, 0.0502777099609375, 0.08074951171875, 0.1112213134765625, 0.141693115234375, 0.1721649169921875, 0.20263671875, 0.2331085205078125, 0.263580322265625, 0.2940521240234375, 0.32452392578125, 0.3549957275390625, 0.385467529296875, 0.4159393310546875, 0.4464111328125, 0.4768829345703125, 0.507354736328125, 0.5378265380859375, 0.56829833984375, 0.5987701416015625, 0.629241943359375, 0.6597137451171875, 0.690185546875, 0.7206573486328125, 0.751129150390625, 0.7816009521484375, 0.81207275390625, 0.8425445556640625, 0.873016357421875, 0.9034881591796875, 0.9339599609375, 0.9644317626953125, 0.994903564453125, 1.0253753662109375, 1.05584716796875, 1.0863189697265625, 1.116790771484375, 1.1472625732421875, 1.177734375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 9.0, 23.0, 14.0, 55.0, 158.0, 350.0, 253.0, 83.0, 36.0, 10.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.84917449951172, -35.09694290161133, -34.34470748901367, -33.59247589111328, -32.84024429321289, -32.0880126953125, -31.335779190063477, -30.583545684814453, -29.831314086914062, -29.07908058166504, -28.32684898376465, -27.574615478515625, -26.822383880615234, -26.07015037536621, -25.31791877746582, -24.565685272216797, -23.813453674316406, -23.061220169067383, -22.308988571166992, -21.55675506591797, -20.804523468017578, -20.052289962768555, -19.300058364868164, -18.54782485961914, -17.795591354370117, -17.043357849121094, -16.291126251220703, -15.538893699645996, -14.786661148071289, -14.034428596496582, -13.282196044921875, -12.529962539672852, -11.777731895446777, -11.02549934387207, -10.273266792297363, -9.521034240722656, -8.76880168914795, -8.016569137573242, -7.264336109161377, -6.51210355758667, -5.759871006011963, -5.007638454437256, -4.255405902862549, -3.5031731128692627, -2.7509405612945557, -1.9987080097198486, -1.2464752197265625, -0.49424266815185547, 0.25798988342285156, 1.0102224349975586, 1.7624551057815552, 2.5146877765655518, 3.266920328140259, 4.019152641296387, 4.771385669708252, 5.523618221282959, 6.275850772857666, 7.028083324432373, 7.78031587600708, 8.532548904418945, 9.284781455993652, 10.03701400756836, 10.789246559143066, 11.541479110717773, 12.29371166229248]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 10.0, 7.0, 9.0, 13.0, 15.0, 23.0, 22.0, 33.0, 36.0, 21.0, 32.0, 31.0, 43.0, 42.0, 58.0, 65.0, 59.0, 57.0, 50.0, 38.0, 51.0, 34.0, 37.0, 27.0, 33.0, 26.0, 24.0, 17.0, 17.0, 16.0, 7.0, 9.0, 9.0, 4.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.269038200378418, -8.945643424987793, -8.622248649597168, -8.298853874206543, -7.975459575653076, -7.652064800262451, -7.328670501708984, -7.005275726318359, -6.681880950927734, -6.358486175537109, -6.035091400146484, -5.711697101593018, -5.388302326202393, -5.064907550811768, -4.741513252258301, -4.418118476867676, -4.094723701477051, -3.771328926086426, -3.44793438911438, -3.124539852142334, -2.801145076751709, -2.477750301361084, -2.154355764389038, -1.8309612274169922, -1.5075664520263672, -1.1841717958450317, -0.8607771396636963, -0.5373824834823608, -0.2139878273010254, 0.10940682888031006, 0.4328014850616455, 0.7561960220336914, 1.07958984375, 1.4029844999313354, 1.726379156112671, 2.049773693084717, 2.373168468475342, 2.696563243865967, 3.0199577808380127, 3.3433523178100586, 3.6667470932006836, 3.9901418685913086, 4.313536643981934, 4.6369309425354, 4.960325717926025, 5.28372049331665, 5.607114791870117, 5.930509567260742, 6.253904342651367, 6.577299118041992, 6.900693893432617, 7.224088191986084, 7.547482967376709, 7.870877742767334, 8.1942720413208, 8.517666816711426, 8.84106159210205, 9.164456367492676, 9.4878511428833, 9.811245918273926, 10.134639739990234, 10.45803451538086, 10.781429290771484, 11.10482406616211, 11.428218841552734]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 6.0, 8.0, 14.0, 17.0, 30.0, 59.0, 91.0, 134.0, 225.0, 310.0, 523.0, 770.0, 1381.0, 2586.0, 5966.0, 17684.0, 106410.0, 1815875.0, 2100445.0, 111956.0, 17080.0, 5817.0, 2771.0, 1514.0, 968.0, 543.0, 358.0, 237.0, 164.0, 104.0, 68.0, 37.0, 46.0, 23.0, 16.0, 8.0, 10.0, 6.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.283203125, -1.243133544921875, -1.20306396484375, -1.162994384765625, -1.1229248046875, -1.082855224609375, -1.04278564453125, -1.002716064453125, -0.962646484375, -0.922576904296875, -0.88250732421875, -0.842437744140625, -0.8023681640625, -0.762298583984375, -0.72222900390625, -0.682159423828125, -0.64208984375, -0.602020263671875, -0.56195068359375, -0.521881103515625, -0.4818115234375, -0.441741943359375, -0.40167236328125, -0.361602783203125, -0.321533203125, -0.281463623046875, -0.24139404296875, -0.201324462890625, -0.1612548828125, -0.121185302734375, -0.08111572265625, -0.041046142578125, -0.0009765625, 0.039093017578125, 0.07916259765625, 0.119232177734375, 0.1593017578125, 0.199371337890625, 0.23944091796875, 0.279510498046875, 0.319580078125, 0.359649658203125, 0.39971923828125, 0.439788818359375, 0.4798583984375, 0.519927978515625, 0.55999755859375, 0.600067138671875, 0.64013671875, 0.680206298828125, 0.72027587890625, 0.760345458984375, 0.8004150390625, 0.840484619140625, 0.88055419921875, 0.920623779296875, 0.960693359375, 1.000762939453125, 1.04083251953125, 1.080902099609375, 1.1209716796875, 1.161041259765625, 1.20111083984375, 1.241180419921875, 1.28125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 9.0, 14.0, 22.0, 21.0, 25.0, 39.0, 59.0, 44.0, 62.0, 83.0, 80.0, 81.0, 91.0, 72.0, 61.0, 44.0, 43.0, 51.0, 33.0, 21.0, 12.0, 12.0, 12.0, 6.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.666015625, -0.637908935546875, -0.60980224609375, -0.581695556640625, -0.5535888671875, -0.525482177734375, -0.49737548828125, -0.469268798828125, -0.441162109375, -0.413055419921875, -0.38494873046875, -0.356842041015625, -0.3287353515625, -0.300628662109375, -0.27252197265625, -0.244415283203125, -0.21630859375, -0.188201904296875, -0.16009521484375, -0.131988525390625, -0.1038818359375, -0.075775146484375, -0.04766845703125, -0.019561767578125, 0.008544921875, 0.036651611328125, 0.06475830078125, 0.092864990234375, 0.1209716796875, 0.149078369140625, 0.17718505859375, 0.205291748046875, 0.2333984375, 0.261505126953125, 0.28961181640625, 0.317718505859375, 0.3458251953125, 0.373931884765625, 0.40203857421875, 0.430145263671875, 0.458251953125, 0.486358642578125, 0.51446533203125, 0.542572021484375, 0.5706787109375, 0.598785400390625, 0.62689208984375, 0.654998779296875, 0.68310546875, 0.711212158203125, 0.73931884765625, 0.767425537109375, 0.7955322265625, 0.823638916015625, 0.85174560546875, 0.879852294921875, 0.907958984375, 0.936065673828125, 0.96417236328125, 0.992279052734375, 1.0203857421875, 1.048492431640625, 1.07659912109375, 1.104705810546875, 1.1328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 9.0, 8.0, 13.0, 11.0, 17.0, 25.0, 34.0, 50.0, 65.0, 77.0, 113.0, 194.0, 288.0, 404.0, 659.0, 1071.0, 2064.0, 4078.0, 10145.0, 35197.0, 271918.0, 3510002.0, 300056.0, 38480.0, 10759.0, 4087.0, 1900.0, 1029.0, 595.0, 295.0, 219.0, 141.0, 90.0, 58.0, 32.0, 34.0, 19.0, 16.0, 7.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.685546875, -1.63525390625, -1.5849609375, -1.53466796875, -1.484375, -1.43408203125, -1.3837890625, -1.33349609375, -1.283203125, -1.23291015625, -1.1826171875, -1.13232421875, -1.08203125, -1.03173828125, -0.9814453125, -0.93115234375, -0.880859375, -0.83056640625, -0.7802734375, -0.72998046875, -0.6796875, -0.62939453125, -0.5791015625, -0.52880859375, -0.478515625, -0.42822265625, -0.3779296875, -0.32763671875, -0.27734375, -0.22705078125, -0.1767578125, -0.12646484375, -0.076171875, -0.02587890625, 0.0244140625, 0.07470703125, 0.125, 0.17529296875, 0.2255859375, 0.27587890625, 0.326171875, 0.37646484375, 0.4267578125, 0.47705078125, 0.52734375, 0.57763671875, 0.6279296875, 0.67822265625, 0.728515625, 0.77880859375, 0.8291015625, 0.87939453125, 0.9296875, 0.97998046875, 1.0302734375, 1.08056640625, 1.130859375, 1.18115234375, 1.2314453125, 1.28173828125, 1.33203125, 1.38232421875, 1.4326171875, 1.48291015625, 1.533203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 10.0, 13.0, 11.0, 22.0, 33.0, 46.0, 100.0, 224.0, 474.0, 1006.0, 1088.0, 522.0, 225.0, 102.0, 45.0, 49.0, 23.0, 19.0, 18.0, 10.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.6510009765625, -2.581298828125, -2.5115966796875, -2.44189453125, -2.3721923828125, -2.302490234375, -2.2327880859375, -2.1630859375, -2.0933837890625, -2.023681640625, -1.9539794921875, -1.88427734375, -1.8145751953125, -1.744873046875, -1.6751708984375, -1.60546875, -1.5357666015625, -1.466064453125, -1.3963623046875, -1.32666015625, -1.2569580078125, -1.187255859375, -1.1175537109375, -1.0478515625, -0.9781494140625, -0.908447265625, -0.8387451171875, -0.76904296875, -0.6993408203125, -0.629638671875, -0.5599365234375, -0.490234375, -0.4205322265625, -0.350830078125, -0.2811279296875, -0.21142578125, -0.1417236328125, -0.072021484375, -0.0023193359375, 0.0673828125, 0.1370849609375, 0.206787109375, 0.2764892578125, 0.34619140625, 0.4158935546875, 0.485595703125, 0.5552978515625, 0.625, 0.6947021484375, 0.764404296875, 0.8341064453125, 0.90380859375, 0.9735107421875, 1.043212890625, 1.1129150390625, 1.1826171875, 1.2523193359375, 1.322021484375, 1.3917236328125, 1.46142578125, 1.5311279296875, 1.600830078125, 1.6705322265625, 1.740234375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 8.0, 9.0, 24.0, 63.0, 155.0, 295.0, 215.0, 131.0, 45.0, 22.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.463030815124512, -14.75528335571289, -14.047536849975586, -13.339789390563965, -12.632041931152344, -11.924294471740723, -11.216547012329102, -10.508800506591797, -9.801053047180176, -9.093305587768555, -8.38555908203125, -7.677811622619629, -6.970064163208008, -6.262316703796387, -5.554569721221924, -4.846822738647461, -4.13907527923584, -3.431328058242798, -2.723580837249756, -2.015833616256714, -1.3080863952636719, -0.6003391742706299, 0.10740804672241211, 0.815155029296875, 1.522902488708496, 2.230649709701538, 2.93839693069458, 3.646144151687622, 4.353891372680664, 5.061638832092285, 5.769385814666748, 6.477132797241211, 7.184881210327148, 7.8926286697387695, 8.60037612915039, 9.308122634887695, 10.015870094299316, 10.723617553710938, 11.431364059448242, 12.139111518859863, 12.846858978271484, 13.554606437683105, 14.262353897094727, 14.970100402832031, 15.677847862243652, 16.385595321655273, 17.093341827392578, 17.801090240478516, 18.50883674621582, 19.216583251953125, 19.924331665039062, 20.632078170776367, 21.339824676513672, 22.04757308959961, 22.755319595336914, 23.46306610107422, 24.170814514160156, 24.87856101989746, 25.5863094329834, 26.294055938720703, 27.00180435180664, 27.709550857543945, 28.41729736328125, 29.125045776367188, 29.832792282104492]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 7.0, 14.0, 15.0, 20.0, 21.0, 22.0, 28.0, 36.0, 38.0, 44.0, 58.0, 52.0, 49.0, 57.0, 52.0, 44.0, 59.0, 47.0, 37.0, 40.0, 36.0, 44.0, 27.0, 22.0, 23.0, 18.0, 12.0, 15.0, 12.0, 16.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-9.771305084228516, -9.531112670898438, -9.290921211242676, -9.050728797912598, -8.81053638458252, -8.570343971252441, -8.33015251159668, -8.089960098266602, -7.849767684936523, -7.6095757484436035, -7.369383335113525, -7.1291913986206055, -6.888998985290527, -6.648807048797607, -6.4086151123046875, -6.168422698974609, -5.9282307624816895, -5.6880388259887695, -5.447846412658691, -5.2076544761657715, -4.967462062835693, -4.727270126342773, -4.487077713012695, -4.246885776519775, -4.0066938400268555, -3.7665016651153564, -3.5263094902038574, -3.2861175537109375, -3.0459251403808594, -2.8057332038879395, -2.5655410289764404, -2.3253488540649414, -2.0851564407348633, -1.8449642658233643, -1.6047720909118652, -1.3645800352096558, -1.1243878602981567, -0.8841956853866577, -0.6440036296844482, -0.4038114547729492, -0.1636192798614502, 0.07657286524772644, 0.3167650103569031, 0.5569571256637573, 0.7971493005752563, 1.0373414754867554, 1.2775335311889648, 1.5177257061004639, 1.757917881011963, 1.998110055923462, 2.238302230834961, 2.478494167327881, 2.718686580657959, 2.958878517150879, 3.199070692062378, 3.439262866973877, 3.679455041885376, 3.919647216796875, 4.159839153289795, 4.400031566619873, 4.640223503112793, 4.880415916442871, 5.120607852935791, 5.360799789428711, 5.600992202758789]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 7.0, 5.0, 6.0, 8.0, 17.0, 31.0, 37.0, 57.0, 86.0, 145.0, 207.0, 340.0, 600.0, 1032.0, 1963.0, 4017.0, 9525.0, 26811.0, 96410.0, 417357.0, 366105.0, 83375.0, 23787.0, 8662.0, 3681.0, 1825.0, 976.0, 581.0, 301.0, 214.0, 128.0, 73.0, 64.0, 36.0, 23.0, 18.0, 14.0, 3.0, 3.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.4931640625, -1.447845458984375, -1.40252685546875, -1.357208251953125, -1.3118896484375, -1.266571044921875, -1.22125244140625, -1.175933837890625, -1.130615234375, -1.085296630859375, -1.03997802734375, -0.994659423828125, -0.9493408203125, -0.904022216796875, -0.85870361328125, -0.813385009765625, -0.76806640625, -0.722747802734375, -0.67742919921875, -0.632110595703125, -0.5867919921875, -0.541473388671875, -0.49615478515625, -0.450836181640625, -0.405517578125, -0.360198974609375, -0.31488037109375, -0.269561767578125, -0.2242431640625, -0.178924560546875, -0.13360595703125, -0.088287353515625, -0.04296875, 0.002349853515625, 0.04766845703125, 0.092987060546875, 0.1383056640625, 0.183624267578125, 0.22894287109375, 0.274261474609375, 0.319580078125, 0.364898681640625, 0.41021728515625, 0.455535888671875, 0.5008544921875, 0.546173095703125, 0.59149169921875, 0.636810302734375, 0.68212890625, 0.727447509765625, 0.77276611328125, 0.818084716796875, 0.8634033203125, 0.908721923828125, 0.95404052734375, 0.999359130859375, 1.044677734375, 1.089996337890625, 1.13531494140625, 1.180633544921875, 1.2259521484375, 1.271270751953125, 1.31658935546875, 1.361907958984375, 1.4072265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 12.0, 11.0, 18.0, 9.0, 34.0, 26.0, 24.0, 29.0, 42.0, 39.0, 45.0, 45.0, 56.0, 52.0, 51.0, 36.0, 46.0, 54.0, 37.0, 52.0, 31.0, 36.0, 40.0, 22.0, 22.0, 18.0, 15.0, 16.0, 17.0, 12.0, 13.0, 9.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5654296875, -0.5472869873046875, -0.529144287109375, -0.5110015869140625, -0.49285888671875, -0.4747161865234375, -0.456573486328125, -0.4384307861328125, -0.4202880859375, -0.4021453857421875, -0.384002685546875, -0.3658599853515625, -0.34771728515625, -0.3295745849609375, -0.311431884765625, -0.2932891845703125, -0.275146484375, -0.2570037841796875, -0.238861083984375, -0.2207183837890625, -0.20257568359375, -0.1844329833984375, -0.166290283203125, -0.1481475830078125, -0.1300048828125, -0.1118621826171875, -0.093719482421875, -0.0755767822265625, -0.05743408203125, -0.0392913818359375, -0.021148681640625, -0.0030059814453125, 0.01513671875, 0.0332794189453125, 0.051422119140625, 0.0695648193359375, 0.08770751953125, 0.1058502197265625, 0.123992919921875, 0.1421356201171875, 0.1602783203125, 0.1784210205078125, 0.196563720703125, 0.2147064208984375, 0.23284912109375, 0.2509918212890625, 0.269134521484375, 0.2872772216796875, 0.305419921875, 0.3235626220703125, 0.341705322265625, 0.3598480224609375, 0.37799072265625, 0.3961334228515625, 0.414276123046875, 0.4324188232421875, 0.4505615234375, 0.4687042236328125, 0.486846923828125, 0.5049896240234375, 0.52313232421875, 0.5412750244140625, 0.559417724609375, 0.5775604248046875, 0.595703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 10.0, 2.0, 16.0, 18.0, 27.0, 31.0, 54.0, 64.0, 131.0, 208.0, 306.0, 615.0, 1194.0, 2994.0, 10079.0, 72844.0, 852478.0, 90033.0, 11403.0, 3241.0, 1296.0, 597.0, 363.0, 200.0, 115.0, 86.0, 34.0, 35.0, 18.0, 15.0, 11.0, 7.0, 7.0, 8.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.193359375, -3.09521484375, -2.9970703125, -2.89892578125, -2.80078125, -2.70263671875, -2.6044921875, -2.50634765625, -2.408203125, -2.31005859375, -2.2119140625, -2.11376953125, -2.015625, -1.91748046875, -1.8193359375, -1.72119140625, -1.623046875, -1.52490234375, -1.4267578125, -1.32861328125, -1.23046875, -1.13232421875, -1.0341796875, -0.93603515625, -0.837890625, -0.73974609375, -0.6416015625, -0.54345703125, -0.4453125, -0.34716796875, -0.2490234375, -0.15087890625, -0.052734375, 0.04541015625, 0.1435546875, 0.24169921875, 0.33984375, 0.43798828125, 0.5361328125, 0.63427734375, 0.732421875, 0.83056640625, 0.9287109375, 1.02685546875, 1.125, 1.22314453125, 1.3212890625, 1.41943359375, 1.517578125, 1.61572265625, 1.7138671875, 1.81201171875, 1.91015625, 2.00830078125, 2.1064453125, 2.20458984375, 2.302734375, 2.40087890625, 2.4990234375, 2.59716796875, 2.6953125, 2.79345703125, 2.8916015625, 2.98974609375, 3.087890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 8.0, 12.0, 11.0, 20.0, 21.0, 30.0, 28.0, 28.0, 38.0, 32.0, 33.0, 43.0, 51.0, 48.0, 48.0, 47.0, 53.0, 47.0, 48.0, 42.0, 46.0, 48.0, 34.0, 31.0, 37.0, 29.0, 21.0, 16.0, 16.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.763671875, -2.68365478515625, -2.6036376953125, -2.52362060546875, -2.443603515625, -2.36358642578125, -2.2835693359375, -2.20355224609375, -2.12353515625, -2.04351806640625, -1.9635009765625, -1.88348388671875, -1.803466796875, -1.72344970703125, -1.6434326171875, -1.56341552734375, -1.4833984375, -1.40338134765625, -1.3233642578125, -1.24334716796875, -1.163330078125, -1.08331298828125, -1.0032958984375, -0.92327880859375, -0.84326171875, -0.76324462890625, -0.6832275390625, -0.60321044921875, -0.523193359375, -0.44317626953125, -0.3631591796875, -0.28314208984375, -0.203125, -0.12310791015625, -0.0430908203125, 0.03692626953125, 0.116943359375, 0.19696044921875, 0.2769775390625, 0.35699462890625, 0.43701171875, 0.51702880859375, 0.5970458984375, 0.67706298828125, 0.757080078125, 0.83709716796875, 0.9171142578125, 0.99713134765625, 1.0771484375, 1.15716552734375, 1.2371826171875, 1.31719970703125, 1.397216796875, 1.47723388671875, 1.5572509765625, 1.63726806640625, 1.71728515625, 1.79730224609375, 1.8773193359375, 1.95733642578125, 2.037353515625, 2.11737060546875, 2.1973876953125, 2.27740478515625, 2.357421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 10.0, 12.0, 7.0, 19.0, 12.0, 15.0, 15.0, 35.0, 40.0, 50.0, 72.0, 90.0, 159.0, 284.0, 497.0, 855.0, 1740.0, 4025.0, 11750.0, 44916.0, 293621.0, 602937.0, 62765.0, 15081.0, 4992.0, 2126.0, 988.0, 529.0, 293.0, 192.0, 107.0, 82.0, 46.0, 34.0, 41.0, 25.0, 25.0, 14.0, 22.0, 4.0, 7.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.8740234375, -0.8483963012695312, -0.8227691650390625, -0.7971420288085938, -0.771514892578125, -0.7458877563476562, -0.7202606201171875, -0.6946334838867188, -0.66900634765625, -0.6433792114257812, -0.6177520751953125, -0.5921249389648438, -0.566497802734375, -0.5408706665039062, -0.5152435302734375, -0.48961639404296875, -0.4639892578125, -0.43836212158203125, -0.4127349853515625, -0.38710784912109375, -0.361480712890625, -0.33585357666015625, -0.3102264404296875, -0.28459930419921875, -0.25897216796875, -0.23334503173828125, -0.2077178955078125, -0.18209075927734375, -0.156463623046875, -0.13083648681640625, -0.1052093505859375, -0.07958221435546875, -0.053955078125, -0.02832794189453125, -0.0027008056640625, 0.02292633056640625, 0.048553466796875, 0.07418060302734375, 0.0998077392578125, 0.12543487548828125, 0.15106201171875, 0.17668914794921875, 0.2023162841796875, 0.22794342041015625, 0.253570556640625, 0.27919769287109375, 0.3048248291015625, 0.33045196533203125, 0.3560791015625, 0.38170623779296875, 0.4073333740234375, 0.43296051025390625, 0.458587646484375, 0.48421478271484375, 0.5098419189453125, 0.5354690551757812, 0.56109619140625, 0.5867233276367188, 0.6123504638671875, 0.6379776000976562, 0.663604736328125, 0.6892318725585938, 0.7148590087890625, 0.7404861450195312, 0.76611328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 5.0, 3.0, 4.0, 7.0, 9.0, 12.0, 14.0, 20.0, 30.0, 29.0, 35.0, 54.0, 68.0, 88.0, 132.0, 132.0, 85.0, 52.0, 36.0, 38.0, 29.0, 29.0, 17.0, 16.0, 11.0, 11.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001933574676513672, -0.00018686801195144653, -0.00018037855625152588, -0.00017388910055160522, -0.00016739964485168457, -0.00016091018915176392, -0.00015442073345184326, -0.0001479312777519226, -0.00014144182205200195, -0.0001349523663520813, -0.00012846291065216064, -0.00012197345495223999, -0.00011548399925231934, -0.00010899454355239868, -0.00010250508785247803, -9.601563215255737e-05, -8.952617645263672e-05, -8.303672075271606e-05, -7.654726505279541e-05, -7.005780935287476e-05, -6.35683536529541e-05, -5.707889795303345e-05, -5.058944225311279e-05, -4.409998655319214e-05, -3.7610530853271484e-05, -3.112107515335083e-05, -2.4631619453430176e-05, -1.814216375350952e-05, -1.1652708053588867e-05, -5.163252353668213e-06, 1.3262033462524414e-06, 7.815659046173096e-06, 1.430511474609375e-05, 2.0794570446014404e-05, 2.728402614593506e-05, 3.377348184585571e-05, 4.026293754577637e-05, 4.675239324569702e-05, 5.3241848945617676e-05, 5.973130464553833e-05, 6.622076034545898e-05, 7.271021604537964e-05, 7.919967174530029e-05, 8.568912744522095e-05, 9.21785831451416e-05, 9.866803884506226e-05, 0.00010515749454498291, 0.00011164695024490356, 0.00011813640594482422, 0.00012462586164474487, 0.00013111531734466553, 0.00013760477304458618, 0.00014409422874450684, 0.0001505836844444275, 0.00015707314014434814, 0.0001635625958442688, 0.00017005205154418945, 0.0001765415072441101, 0.00018303096294403076, 0.00018952041864395142, 0.00019600987434387207, 0.00020249933004379272, 0.00020898878574371338, 0.00021547824144363403, 0.0002219676971435547]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 11.0, 9.0, 22.0, 15.0, 32.0, 67.0, 79.0, 114.0, 193.0, 298.0, 503.0, 954.0, 2253.0, 5921.0, 23047.0, 175689.0, 758186.0, 62133.0, 11939.0, 3717.0, 1568.0, 704.0, 435.0, 233.0, 147.0, 93.0, 47.0, 48.0, 26.0, 14.0, 13.0, 10.0, 11.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0859375, -1.0488433837890625, -1.011749267578125, -0.9746551513671875, -0.93756103515625, -0.9004669189453125, -0.863372802734375, -0.8262786865234375, -0.7891845703125, -0.7520904541015625, -0.714996337890625, -0.6779022216796875, -0.64080810546875, -0.6037139892578125, -0.566619873046875, -0.5295257568359375, -0.492431640625, -0.4553375244140625, -0.418243408203125, -0.3811492919921875, -0.34405517578125, -0.3069610595703125, -0.269866943359375, -0.2327728271484375, -0.1956787109375, -0.1585845947265625, -0.121490478515625, -0.0843963623046875, -0.04730224609375, -0.0102081298828125, 0.026885986328125, 0.0639801025390625, 0.10107421875, 0.1381683349609375, 0.175262451171875, 0.2123565673828125, 0.24945068359375, 0.2865447998046875, 0.323638916015625, 0.3607330322265625, 0.3978271484375, 0.4349212646484375, 0.472015380859375, 0.5091094970703125, 0.54620361328125, 0.5832977294921875, 0.620391845703125, 0.6574859619140625, 0.694580078125, 0.7316741943359375, 0.768768310546875, 0.8058624267578125, 0.84295654296875, 0.8800506591796875, 0.917144775390625, 0.9542388916015625, 0.9913330078125, 1.0284271240234375, 1.065521240234375, 1.1026153564453125, 1.13970947265625, 1.1768035888671875, 1.213897705078125, 1.2509918212890625, 1.2880859375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 1.0, 7.0, 2.0, 3.0, 9.0, 9.0, 17.0, 23.0, 22.0, 23.0, 28.0, 50.0, 54.0, 69.0, 75.0, 99.0, 111.0, 86.0, 72.0, 39.0, 30.0, 39.0, 21.0, 11.0, 18.0, 9.0, 10.0, 9.0, 7.0, 13.0, 6.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8662109375, -0.8399276733398438, -0.8136444091796875, -0.7873611450195312, -0.761077880859375, -0.7347946166992188, -0.7085113525390625, -0.6822280883789062, -0.65594482421875, -0.6296615600585938, -0.6033782958984375, -0.5770950317382812, -0.550811767578125, -0.5245285034179688, -0.4982452392578125, -0.47196197509765625, -0.4456787109375, -0.41939544677734375, -0.3931121826171875, -0.36682891845703125, -0.340545654296875, -0.31426239013671875, -0.2879791259765625, -0.26169586181640625, -0.23541259765625, -0.20912933349609375, -0.1828460693359375, -0.15656280517578125, -0.130279541015625, -0.10399627685546875, -0.0777130126953125, -0.05142974853515625, -0.025146484375, 0.00113677978515625, 0.0274200439453125, 0.05370330810546875, 0.079986572265625, 0.10626983642578125, 0.1325531005859375, 0.15883636474609375, 0.18511962890625, 0.21140289306640625, 0.2376861572265625, 0.26396942138671875, 0.290252685546875, 0.31653594970703125, 0.3428192138671875, 0.36910247802734375, 0.3953857421875, 0.42166900634765625, 0.4479522705078125, 0.47423553466796875, 0.500518798828125, 0.5268020629882812, 0.5530853271484375, 0.5793685913085938, 0.60565185546875, 0.6319351196289062, 0.6582183837890625, 0.6845016479492188, 0.710784912109375, 0.7370681762695312, 0.7633514404296875, 0.7896347045898438, 0.81591796875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 10.0, 13.0, 45.0, 121.0, 376.0, 259.0, 97.0, 46.0, 18.0, 7.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.516643524169922, -26.525775909423828, -25.534910202026367, -24.544042587280273, -23.55317497253418, -22.56230926513672, -21.571441650390625, -20.58057403564453, -19.58970832824707, -18.598840713500977, -17.607975006103516, -16.617107391357422, -15.626240730285645, -14.635374069213867, -13.644506454467773, -12.653639793395996, -11.662772178649902, -10.671905517578125, -9.681037902832031, -8.690171241760254, -7.699304580688477, -6.708437442779541, -5.7175703048706055, -4.726703643798828, -3.7358365058898926, -2.744969606399536, -1.7541025876998901, -0.7632355690002441, 0.2276313304901123, 1.2184982299804688, 2.2093653678894043, 3.2002320289611816, 4.191099166870117, 5.181966304779053, 6.17283296585083, 7.163700103759766, 8.154566764831543, 9.14543342590332, 10.136301040649414, 11.127167701721191, 12.118034362792969, 13.108901023864746, 14.09976863861084, 15.090635299682617, 16.08150291442871, 17.072368621826172, 18.063236236572266, 19.05410385131836, 20.044971466064453, 21.035839080810547, 22.026704788208008, 23.0175724029541, 24.008440017700195, 24.999305725097656, 25.99017333984375, 26.981040954589844, 27.971906661987305, 28.9627742767334, 29.95363998413086, 30.944507598876953, 31.935375213623047, 32.92624282836914, 33.91710662841797, 34.90797424316406, 35.898841857910156]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 11.0, 7.0, 12.0, 19.0, 23.0, 19.0, 21.0, 31.0, 30.0, 31.0, 29.0, 47.0, 50.0, 38.0, 63.0, 76.0, 67.0, 46.0, 38.0, 38.0, 31.0, 41.0, 27.0, 20.0, 28.0, 29.0, 15.0, 16.0, 13.0, 13.0, 15.0, 9.0, 5.0, 7.0, 9.0, 8.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.68444538116455, -9.389105796813965, -9.093766212463379, -8.798426628112793, -8.503087043762207, -8.207747459411621, -7.912407875061035, -7.617068290710449, -7.321728706359863, -7.026389122009277, -6.731049537658691, -6.4357099533081055, -6.1403703689575195, -5.845030784606934, -5.549691200256348, -5.254351615905762, -4.959011554718018, -4.663671970367432, -4.368332386016846, -4.07299280166626, -3.777653217315674, -3.482313632965088, -3.186973810195923, -2.891634225845337, -2.596294641494751, -2.300955057144165, -2.005615472793579, -1.7102757692337036, -1.4149361848831177, -1.1195966005325317, -0.8242568969726562, -0.5289173126220703, -0.23357772827148438, 0.06176188588142395, 0.3571015000343323, 0.652441143989563, 0.9477807283401489, 1.2431203126907349, 1.5384600162506104, 1.8337996006011963, 2.1291391849517822, 2.424478769302368, 2.719818353652954, 3.015158176422119, 3.310497760772705, 3.605837345123291, 3.901176929473877, 4.196516513824463, 4.491856098175049, 4.787195682525635, 5.082535266876221, 5.377874851226807, 5.673214435577393, 5.9685540199279785, 6.263894081115723, 6.559233665466309, 6.8545732498168945, 7.1499128341674805, 7.445252418518066, 7.740592002868652, 8.035931587219238, 8.331271171569824, 8.62661075592041, 8.921950340270996, 9.217289924621582]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 10.0, 6.0, 12.0, 29.0, 36.0, 45.0, 70.0, 108.0, 199.0, 319.0, 512.0, 928.0, 1693.0, 3945.0, 10292.0, 61104.0, 1343213.0, 2632096.0, 115136.0, 14820.0, 4803.0, 2151.0, 1124.0, 667.0, 338.0, 245.0, 146.0, 73.0, 37.0, 31.0, 24.0, 23.0, 13.0, 7.0, 3.0, 4.0, 6.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5302734375, -1.482635498046875, -1.43499755859375, -1.387359619140625, -1.3397216796875, -1.292083740234375, -1.24444580078125, -1.196807861328125, -1.149169921875, -1.101531982421875, -1.05389404296875, -1.006256103515625, -0.9586181640625, -0.910980224609375, -0.86334228515625, -0.815704345703125, -0.76806640625, -0.720428466796875, -0.67279052734375, -0.625152587890625, -0.5775146484375, -0.529876708984375, -0.48223876953125, -0.434600830078125, -0.386962890625, -0.339324951171875, -0.29168701171875, -0.244049072265625, -0.1964111328125, -0.148773193359375, -0.10113525390625, -0.053497314453125, -0.005859375, 0.041778564453125, 0.08941650390625, 0.137054443359375, 0.1846923828125, 0.232330322265625, 0.27996826171875, 0.327606201171875, 0.375244140625, 0.422882080078125, 0.47052001953125, 0.518157958984375, 0.5657958984375, 0.613433837890625, 0.66107177734375, 0.708709716796875, 0.75634765625, 0.803985595703125, 0.85162353515625, 0.899261474609375, 0.9468994140625, 0.994537353515625, 1.04217529296875, 1.089813232421875, 1.137451171875, 1.185089111328125, 1.23272705078125, 1.280364990234375, 1.3280029296875, 1.375640869140625, 1.42327880859375, 1.470916748046875, 1.5185546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 6.0, 13.0, 12.0, 15.0, 16.0, 39.0, 30.0, 29.0, 36.0, 49.0, 49.0, 53.0, 56.0, 64.0, 54.0, 57.0, 53.0, 48.0, 40.0, 47.0, 34.0, 33.0, 34.0, 24.0, 14.0, 19.0, 15.0, 11.0, 13.0, 9.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486328125, -0.466522216796875, -0.44671630859375, -0.426910400390625, -0.4071044921875, -0.387298583984375, -0.36749267578125, -0.347686767578125, -0.327880859375, -0.308074951171875, -0.28826904296875, -0.268463134765625, -0.2486572265625, -0.228851318359375, -0.20904541015625, -0.189239501953125, -0.16943359375, -0.149627685546875, -0.12982177734375, -0.110015869140625, -0.0902099609375, -0.070404052734375, -0.05059814453125, -0.030792236328125, -0.010986328125, 0.008819580078125, 0.02862548828125, 0.048431396484375, 0.0682373046875, 0.088043212890625, 0.10784912109375, 0.127655029296875, 0.1474609375, 0.167266845703125, 0.18707275390625, 0.206878662109375, 0.2266845703125, 0.246490478515625, 0.26629638671875, 0.286102294921875, 0.305908203125, 0.325714111328125, 0.34552001953125, 0.365325927734375, 0.3851318359375, 0.404937744140625, 0.42474365234375, 0.444549560546875, 0.46435546875, 0.484161376953125, 0.50396728515625, 0.523773193359375, 0.5435791015625, 0.563385009765625, 0.58319091796875, 0.602996826171875, 0.622802734375, 0.642608642578125, 0.66241455078125, 0.682220458984375, 0.7020263671875, 0.721832275390625, 0.74163818359375, 0.761444091796875, 0.78125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 7.0, 3.0, 10.0, 15.0, 18.0, 30.0, 25.0, 52.0, 67.0, 82.0, 135.0, 201.0, 305.0, 453.0, 709.0, 1215.0, 2107.0, 4187.0, 9529.0, 31476.0, 231390.0, 3440104.0, 410822.0, 39873.0, 10911.0, 4519.0, 2339.0, 1376.0, 802.0, 523.0, 336.0, 207.0, 126.0, 96.0, 72.0, 47.0, 25.0, 30.0, 18.0, 8.0, 10.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7060546875, -1.6552734375, -1.6044921875, -1.5537109375, -1.5029296875, -1.4521484375, -1.4013671875, -1.3505859375, -1.2998046875, -1.2490234375, -1.1982421875, -1.1474609375, -1.0966796875, -1.0458984375, -0.9951171875, -0.9443359375, -0.8935546875, -0.8427734375, -0.7919921875, -0.7412109375, -0.6904296875, -0.6396484375, -0.5888671875, -0.5380859375, -0.4873046875, -0.4365234375, -0.3857421875, -0.3349609375, -0.2841796875, -0.2333984375, -0.1826171875, -0.1318359375, -0.0810546875, -0.0302734375, 0.0205078125, 0.0712890625, 0.1220703125, 0.1728515625, 0.2236328125, 0.2744140625, 0.3251953125, 0.3759765625, 0.4267578125, 0.4775390625, 0.5283203125, 0.5791015625, 0.6298828125, 0.6806640625, 0.7314453125, 0.7822265625, 0.8330078125, 0.8837890625, 0.9345703125, 0.9853515625, 1.0361328125, 1.0869140625, 1.1376953125, 1.1884765625, 1.2392578125, 1.2900390625, 1.3408203125, 1.3916015625, 1.4423828125, 1.4931640625, 1.5439453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 11.0, 14.0, 17.0, 23.0, 51.0, 65.0, 125.0, 208.0, 412.0, 911.0, 1002.0, 625.0, 267.0, 161.0, 52.0, 38.0, 17.0, 15.0, 13.0, 9.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.287109375, -2.2202301025390625, -2.153350830078125, -2.0864715576171875, -2.01959228515625, -1.9527130126953125, -1.885833740234375, -1.8189544677734375, -1.7520751953125, -1.6851959228515625, -1.618316650390625, -1.5514373779296875, -1.48455810546875, -1.4176788330078125, -1.350799560546875, -1.2839202880859375, -1.217041015625, -1.1501617431640625, -1.083282470703125, -1.0164031982421875, -0.94952392578125, -0.8826446533203125, -0.815765380859375, -0.7488861083984375, -0.6820068359375, -0.6151275634765625, -0.548248291015625, -0.4813690185546875, -0.41448974609375, -0.3476104736328125, -0.280731201171875, -0.2138519287109375, -0.14697265625, -0.0800933837890625, -0.013214111328125, 0.0536651611328125, 0.12054443359375, 0.1874237060546875, 0.254302978515625, 0.3211822509765625, 0.3880615234375, 0.4549407958984375, 0.521820068359375, 0.5886993408203125, 0.65557861328125, 0.7224578857421875, 0.789337158203125, 0.8562164306640625, 0.923095703125, 0.9899749755859375, 1.056854248046875, 1.1237335205078125, 1.19061279296875, 1.2574920654296875, 1.324371337890625, 1.3912506103515625, 1.4581298828125, 1.5250091552734375, 1.591888427734375, 1.6587677001953125, 1.72564697265625, 1.7925262451171875, 1.859405517578125, 1.9262847900390625, 1.9931640625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 9.0, 19.0, 38.0, 119.0, 267.0, 291.0, 136.0, 72.0, 22.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.20813751220703, -32.40103530883789, -31.59393310546875, -30.786828994750977, -29.979726791381836, -29.172624588012695, -28.365520477294922, -27.55841827392578, -26.75131607055664, -25.9442138671875, -25.13711166381836, -24.330007553100586, -23.522905349731445, -22.715803146362305, -21.90869903564453, -21.10159683227539, -20.29449462890625, -19.48739242553711, -18.68029022216797, -17.873186111450195, -17.066083908081055, -16.258981704711914, -15.451878547668457, -14.644775390625, -13.83767318725586, -13.030570983886719, -12.223467826843262, -11.416364669799805, -10.609262466430664, -9.802160263061523, -8.995057106018066, -8.18795394897461, -7.380851745605469, -6.57374906539917, -5.766646385192871, -4.959543704986572, -4.152441024780273, -3.3453383445739746, -2.538235664367676, -1.731132984161377, -0.9240303039550781, -0.1169276237487793, 0.6901750564575195, 1.4972777366638184, 2.304380416870117, 3.111483097076416, 3.918585777282715, 4.725688457489014, 5.5327911376953125, 6.339893817901611, 7.14699649810791, 7.954099178314209, 8.761201858520508, 9.568304061889648, 10.375407218933105, 11.182510375976562, 11.989612579345703, 12.796714782714844, 13.6038179397583, 14.410921096801758, 15.218023300170898, 16.02512550354004, 16.832229614257812, 17.639331817626953, 18.446434020996094]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 15.0, 3.0, 11.0, 6.0, 9.0, 13.0, 20.0, 23.0, 24.0, 24.0, 29.0, 28.0, 30.0, 42.0, 28.0, 42.0, 43.0, 33.0, 45.0, 43.0, 43.0, 49.0, 38.0, 48.0, 48.0, 36.0, 33.0, 35.0, 32.0, 23.0, 17.0, 23.0, 9.0, 5.0, 11.0, 8.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.239570617675781, -7.022808074951172, -6.8060455322265625, -6.589283466339111, -6.372520923614502, -6.155758380889893, -5.938996315002441, -5.722233772277832, -5.505471229553223, -5.288708686828613, -5.071946144104004, -4.855184078216553, -4.638421535491943, -4.421658992767334, -4.204896926879883, -3.9881343841552734, -3.771371841430664, -3.5546092987060547, -3.3378469944000244, -3.121084690093994, -2.9043221473693848, -2.6875596046447754, -2.470797300338745, -2.254034996032715, -2.0372724533081055, -1.8205100297927856, -1.6037476062774658, -1.386985182762146, -1.1702227592468262, -0.9534603357315063, -0.7366979122161865, -0.5199354887008667, -0.3031735420227051, -0.08641111850738525, 0.13035130500793457, 0.3471137285232544, 0.5638761520385742, 0.780638575553894, 0.9974009990692139, 1.2141634225845337, 1.4309258460998535, 1.6476882696151733, 1.8644506931304932, 2.0812129974365234, 2.297975540161133, 2.514738082885742, 2.7315003871917725, 2.9482626914978027, 3.165025234222412, 3.3817877769470215, 3.5985500812530518, 3.815312385559082, 4.032074928283691, 4.248837471008301, 4.46560001373291, 4.682362079620361, 4.899124622344971, 5.11588716506958, 5.332649230957031, 5.549411773681641, 5.76617431640625, 5.982936859130859, 6.199699401855469, 6.41646146774292, 6.633224010467529]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 12.0, 10.0, 31.0, 24.0, 49.0, 77.0, 143.0, 211.0, 411.0, 699.0, 1383.0, 2591.0, 5972.0, 16099.0, 66514.0, 479124.0, 394107.0, 56020.0, 14340.0, 5366.0, 2487.0, 1236.0, 680.0, 398.0, 218.0, 117.0, 79.0, 53.0, 17.0, 13.0, 17.0, 14.0, 9.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.95587158203125, -1.8883056640625, -1.82073974609375, -1.753173828125, -1.68560791015625, -1.6180419921875, -1.55047607421875, -1.48291015625, -1.41534423828125, -1.3477783203125, -1.28021240234375, -1.212646484375, -1.14508056640625, -1.0775146484375, -1.00994873046875, -0.9423828125, -0.87481689453125, -0.8072509765625, -0.73968505859375, -0.672119140625, -0.60455322265625, -0.5369873046875, -0.46942138671875, -0.40185546875, -0.33428955078125, -0.2667236328125, -0.19915771484375, -0.131591796875, -0.06402587890625, 0.0035400390625, 0.07110595703125, 0.138671875, 0.20623779296875, 0.2738037109375, 0.34136962890625, 0.408935546875, 0.47650146484375, 0.5440673828125, 0.61163330078125, 0.67919921875, 0.74676513671875, 0.8143310546875, 0.88189697265625, 0.949462890625, 1.01702880859375, 1.0845947265625, 1.15216064453125, 1.2197265625, 1.28729248046875, 1.3548583984375, 1.42242431640625, 1.489990234375, 1.55755615234375, 1.6251220703125, 1.69268798828125, 1.76025390625, 1.82781982421875, 1.8953857421875, 1.96295166015625, 2.030517578125, 2.09808349609375, 2.1656494140625, 2.23321533203125, 2.30078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 12.0, 14.0, 23.0, 19.0, 23.0, 26.0, 33.0, 51.0, 39.0, 48.0, 46.0, 54.0, 52.0, 58.0, 61.0, 48.0, 56.0, 45.0, 34.0, 46.0, 26.0, 28.0, 31.0, 24.0, 16.0, 7.0, 14.0, 15.0, 15.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5726242065429688, -0.5519866943359375, -0.5313491821289062, -0.510711669921875, -0.49007415771484375, -0.4694366455078125, -0.44879913330078125, -0.42816162109375, -0.40752410888671875, -0.3868865966796875, -0.36624908447265625, -0.345611572265625, -0.32497406005859375, -0.3043365478515625, -0.28369903564453125, -0.2630615234375, -0.24242401123046875, -0.2217864990234375, -0.20114898681640625, -0.180511474609375, -0.15987396240234375, -0.1392364501953125, -0.11859893798828125, -0.09796142578125, -0.07732391357421875, -0.0566864013671875, -0.03604888916015625, -0.015411376953125, 0.00522613525390625, 0.0258636474609375, 0.04650115966796875, 0.067138671875, 0.08777618408203125, 0.1084136962890625, 0.12905120849609375, 0.149688720703125, 0.17032623291015625, 0.1909637451171875, 0.21160125732421875, 0.23223876953125, 0.25287628173828125, 0.2735137939453125, 0.29415130615234375, 0.314788818359375, 0.33542633056640625, 0.3560638427734375, 0.37670135498046875, 0.3973388671875, 0.41797637939453125, 0.4386138916015625, 0.45925140380859375, 0.479888916015625, 0.5005264282226562, 0.5211639404296875, 0.5418014526367188, 0.56243896484375, 0.5830764770507812, 0.6037139892578125, 0.6243515014648438, 0.644989013671875, 0.6656265258789062, 0.6862640380859375, 0.7069015502929688, 0.7275390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 17.0, 12.0, 27.0, 26.0, 30.0, 54.0, 78.0, 96.0, 162.0, 242.0, 402.0, 777.0, 1779.0, 4791.0, 19646.0, 235089.0, 741192.0, 32610.0, 6869.0, 2321.0, 974.0, 490.0, 280.0, 173.0, 121.0, 84.0, 61.0, 35.0, 22.0, 21.0, 22.0, 15.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.34765625, -4.22735595703125, -4.1070556640625, -3.98675537109375, -3.866455078125, -3.74615478515625, -3.6258544921875, -3.50555419921875, -3.38525390625, -3.26495361328125, -3.1446533203125, -3.02435302734375, -2.904052734375, -2.78375244140625, -2.6634521484375, -2.54315185546875, -2.4228515625, -2.30255126953125, -2.1822509765625, -2.06195068359375, -1.941650390625, -1.82135009765625, -1.7010498046875, -1.58074951171875, -1.46044921875, -1.34014892578125, -1.2198486328125, -1.09954833984375, -0.979248046875, -0.85894775390625, -0.7386474609375, -0.61834716796875, -0.498046875, -0.37774658203125, -0.2574462890625, -0.13714599609375, -0.016845703125, 0.10345458984375, 0.2237548828125, 0.34405517578125, 0.46435546875, 0.58465576171875, 0.7049560546875, 0.82525634765625, 0.945556640625, 1.06585693359375, 1.1861572265625, 1.30645751953125, 1.4267578125, 1.54705810546875, 1.6673583984375, 1.78765869140625, 1.907958984375, 2.02825927734375, 2.1485595703125, 2.26885986328125, 2.38916015625, 2.50946044921875, 2.6297607421875, 2.75006103515625, 2.870361328125, 2.99066162109375, 3.1109619140625, 3.23126220703125, 3.3515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 3.0, 11.0, 6.0, 14.0, 10.0, 14.0, 16.0, 19.0, 20.0, 35.0, 36.0, 41.0, 51.0, 41.0, 62.0, 56.0, 48.0, 47.0, 58.0, 52.0, 62.0, 56.0, 39.0, 27.0, 38.0, 24.0, 15.0, 11.0, 22.0, 6.0, 14.0, 6.0, 2.0, 10.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.734375, -2.646759033203125, -2.55914306640625, -2.471527099609375, -2.3839111328125, -2.296295166015625, -2.20867919921875, -2.121063232421875, -2.033447265625, -1.945831298828125, -1.85821533203125, -1.770599365234375, -1.6829833984375, -1.595367431640625, -1.50775146484375, -1.420135498046875, -1.33251953125, -1.244903564453125, -1.15728759765625, -1.069671630859375, -0.9820556640625, -0.894439697265625, -0.80682373046875, -0.719207763671875, -0.631591796875, -0.543975830078125, -0.45635986328125, -0.368743896484375, -0.2811279296875, -0.193511962890625, -0.10589599609375, -0.018280029296875, 0.0693359375, 0.156951904296875, 0.24456787109375, 0.332183837890625, 0.4197998046875, 0.507415771484375, 0.59503173828125, 0.682647705078125, 0.770263671875, 0.857879638671875, 0.94549560546875, 1.033111572265625, 1.1207275390625, 1.208343505859375, 1.29595947265625, 1.383575439453125, 1.47119140625, 1.558807373046875, 1.64642333984375, 1.734039306640625, 1.8216552734375, 1.909271240234375, 1.99688720703125, 2.084503173828125, 2.172119140625, 2.259735107421875, 2.34735107421875, 2.434967041015625, 2.5225830078125, 2.610198974609375, 2.69781494140625, 2.785430908203125, 2.873046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 14.0, 13.0, 21.0, 52.0, 67.0, 162.0, 273.0, 716.0, 2161.0, 9675.0, 396768.0, 624794.0, 10187.0, 2201.0, 763.0, 309.0, 153.0, 76.0, 42.0, 20.0, 17.0, 12.0, 9.0, 3.0, 7.0, 6.0, 0.0, 7.0, 1.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.12109375, -3.036773681640625, -2.95245361328125, -2.868133544921875, -2.7838134765625, -2.699493408203125, -2.61517333984375, -2.530853271484375, -2.446533203125, -2.362213134765625, -2.27789306640625, -2.193572998046875, -2.1092529296875, -2.024932861328125, -1.94061279296875, -1.856292724609375, -1.77197265625, -1.687652587890625, -1.60333251953125, -1.519012451171875, -1.4346923828125, -1.350372314453125, -1.26605224609375, -1.181732177734375, -1.097412109375, -1.013092041015625, -0.92877197265625, -0.844451904296875, -0.7601318359375, -0.675811767578125, -0.59149169921875, -0.507171630859375, -0.4228515625, -0.338531494140625, -0.25421142578125, -0.169891357421875, -0.0855712890625, -0.001251220703125, 0.08306884765625, 0.167388916015625, 0.251708984375, 0.336029052734375, 0.42034912109375, 0.504669189453125, 0.5889892578125, 0.673309326171875, 0.75762939453125, 0.841949462890625, 0.92626953125, 1.010589599609375, 1.09490966796875, 1.179229736328125, 1.2635498046875, 1.347869873046875, 1.43218994140625, 1.516510009765625, 1.600830078125, 1.685150146484375, 1.76947021484375, 1.853790283203125, 1.9381103515625, 2.022430419921875, 2.10675048828125, 2.191070556640625, 2.275390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 15.0, 22.0, 27.0, 44.0, 67.0, 175.0, 293.0, 149.0, 67.0, 37.0, 37.0, 16.0, 15.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003523826599121094, -0.00033731013536453247, -0.00032223761081695557, -0.00030716508626937866, -0.00029209256172180176, -0.00027702003717422485, -0.00026194751262664795, -0.00024687498807907104, -0.00023180246353149414, -0.00021672993898391724, -0.00020165741443634033, -0.00018658488988876343, -0.00017151236534118652, -0.00015643984079360962, -0.00014136731624603271, -0.0001262947916984558, -0.0001112222671508789, -9.6149742603302e-05, -8.10772180557251e-05, -6.60046935081482e-05, -5.093216896057129e-05, -3.5859644412994385e-05, -2.078711986541748e-05, -5.714595317840576e-06, 9.357929229736328e-06, 2.4430453777313232e-05, 3.950297832489014e-05, 5.457550287246704e-05, 6.964802742004395e-05, 8.472055196762085e-05, 9.979307651519775e-05, 0.00011486560106277466, 0.00012993812561035156, 0.00014501065015792847, 0.00016008317470550537, 0.00017515569925308228, 0.00019022822380065918, 0.00020530074834823608, 0.000220373272895813, 0.0002354457974433899, 0.0002505183219909668, 0.0002655908465385437, 0.0002806633710861206, 0.0002957358956336975, 0.0003108084201812744, 0.0003258809447288513, 0.0003409534692764282, 0.0003560259938240051, 0.00037109851837158203, 0.00038617104291915894, 0.00040124356746673584, 0.00041631609201431274, 0.00043138861656188965, 0.00044646114110946655, 0.00046153366565704346, 0.00047660619020462036, 0.0004916787147521973, 0.0005067512392997742, 0.0005218237638473511, 0.000536896288394928, 0.0005519688129425049, 0.0005670413374900818, 0.0005821138620376587, 0.0005971863865852356, 0.0006122589111328125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 5.0, 1.0, 9.0, 14.0, 8.0, 20.0, 35.0, 59.0, 93.0, 164.0, 347.0, 762.0, 1931.0, 7267.0, 85358.0, 905701.0, 39114.0, 4907.0, 1499.0, 605.0, 270.0, 154.0, 75.0, 49.0, 37.0, 17.0, 16.0, 13.0, 6.0, 5.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.32110595703125, -2.2554931640625, -2.18988037109375, -2.124267578125, -2.05865478515625, -1.9930419921875, -1.92742919921875, -1.86181640625, -1.79620361328125, -1.7305908203125, -1.66497802734375, -1.599365234375, -1.53375244140625, -1.4681396484375, -1.40252685546875, -1.3369140625, -1.27130126953125, -1.2056884765625, -1.14007568359375, -1.074462890625, -1.00885009765625, -0.9432373046875, -0.87762451171875, -0.81201171875, -0.74639892578125, -0.6807861328125, -0.61517333984375, -0.549560546875, -0.48394775390625, -0.4183349609375, -0.35272216796875, -0.287109375, -0.22149658203125, -0.1558837890625, -0.09027099609375, -0.024658203125, 0.04095458984375, 0.1065673828125, 0.17218017578125, 0.23779296875, 0.30340576171875, 0.3690185546875, 0.43463134765625, 0.500244140625, 0.56585693359375, 0.6314697265625, 0.69708251953125, 0.7626953125, 0.82830810546875, 0.8939208984375, 0.95953369140625, 1.025146484375, 1.09075927734375, 1.1563720703125, 1.22198486328125, 1.28759765625, 1.35321044921875, 1.4188232421875, 1.48443603515625, 1.550048828125, 1.61566162109375, 1.6812744140625, 1.74688720703125, 1.8125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 8.0, 4.0, 14.0, 15.0, 26.0, 38.0, 41.0, 73.0, 116.0, 176.0, 167.0, 103.0, 86.0, 48.0, 29.0, 20.0, 15.0, 9.0, 7.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2345428466796875, -1.186859130859375, -1.1391754150390625, -1.09149169921875, -1.0438079833984375, -0.996124267578125, -0.9484405517578125, -0.9007568359375, -0.8530731201171875, -0.805389404296875, -0.7577056884765625, -0.71002197265625, -0.6623382568359375, -0.614654541015625, -0.5669708251953125, -0.519287109375, -0.4716033935546875, -0.423919677734375, -0.3762359619140625, -0.32855224609375, -0.2808685302734375, -0.233184814453125, -0.1855010986328125, -0.1378173828125, -0.0901336669921875, -0.042449951171875, 0.0052337646484375, 0.05291748046875, 0.1006011962890625, 0.148284912109375, 0.1959686279296875, 0.24365234375, 0.2913360595703125, 0.339019775390625, 0.3867034912109375, 0.43438720703125, 0.4820709228515625, 0.529754638671875, 0.5774383544921875, 0.6251220703125, 0.6728057861328125, 0.720489501953125, 0.7681732177734375, 0.81585693359375, 0.8635406494140625, 0.911224365234375, 0.9589080810546875, 1.006591796875, 1.0542755126953125, 1.101959228515625, 1.1496429443359375, 1.19732666015625, 1.2450103759765625, 1.292694091796875, 1.3403778076171875, 1.3880615234375, 1.4357452392578125, 1.483428955078125, 1.5311126708984375, 1.57879638671875, 1.6264801025390625, 1.674163818359375, 1.7218475341796875, 1.76953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 14.0, 31.0, 70.0, 177.0, 387.0, 173.0, 62.0, 41.0, 10.0, 11.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.612131118774414, -28.675294876098633, -27.73845863342285, -26.80162239074707, -25.86478614807129, -24.927949905395508, -23.991113662719727, -23.054277420043945, -22.117441177368164, -21.180604934692383, -20.2437686920166, -19.30693244934082, -18.37009620666504, -17.433259963989258, -16.496423721313477, -15.559587478637695, -14.622751235961914, -13.685914993286133, -12.749078750610352, -11.81224250793457, -10.875406265258789, -9.938570022583008, -9.001733779907227, -8.064897537231445, -7.128061294555664, -6.191225051879883, -5.254388809204102, -4.31755256652832, -3.380716323852539, -2.443880081176758, -1.5070438385009766, -0.5702075958251953, 0.36663055419921875, 1.303466796875, 2.2403030395507812, 3.1771392822265625, 4.113975524902344, 5.050811767578125, 5.987648010253906, 6.9244842529296875, 7.861320495605469, 8.79815673828125, 9.734992980957031, 10.671829223632812, 11.608665466308594, 12.545501708984375, 13.482337951660156, 14.419174194335938, 15.356010437011719, 16.2928466796875, 17.22968292236328, 18.166519165039062, 19.103355407714844, 20.040191650390625, 20.977027893066406, 21.913864135742188, 22.85070037841797, 23.78753662109375, 24.72437286376953, 25.661209106445312, 26.598045349121094, 27.534881591796875, 28.471717834472656, 29.408554077148438, 30.34539031982422]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 2.0, 5.0, 7.0, 3.0, 9.0, 8.0, 9.0, 12.0, 24.0, 26.0, 19.0, 30.0, 34.0, 43.0, 35.0, 45.0, 61.0, 61.0, 75.0, 90.0, 60.0, 56.0, 46.0, 41.0, 28.0, 32.0, 17.0, 29.0, 28.0, 14.0, 13.0, 12.0, 9.0, 8.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.289093017578125, -15.860479354858398, -15.431865692138672, -15.003252983093262, -14.574639320373535, -14.146025657653809, -13.717411994934082, -13.288799285888672, -12.860185623168945, -12.431571960449219, -12.002958297729492, -11.574345588684082, -11.145731925964355, -10.717118263244629, -10.288504600524902, -9.859891891479492, -9.431278228759766, -9.002664566040039, -8.574050903320312, -8.145438194274902, -7.716824531555176, -7.288210868835449, -6.859597206115723, -6.430984020233154, -6.0023698806762695, -5.573756217956543, -5.145143032073975, -4.716529369354248, -4.28791618347168, -3.859302520751953, -3.4306890964508057, -3.002075672149658, -2.57346248626709, -2.1448490619659424, -1.716235637664795, -1.287622094154358, -0.8590086698532104, -0.43039512634277344, -0.0017817020416259766, 0.4268317222595215, 0.855445146560669, 1.2840585708618164, 1.7126719951629639, 2.1412854194641113, 2.569899082183838, 2.9985125064849854, 3.427125930786133, 3.8557393550872803, 4.284352779388428, 4.712966442108154, 5.141579627990723, 5.570193290710449, 5.998806476593018, 6.427420139312744, 6.8560333251953125, 7.284646987915039, 7.713260650634766, 8.141874313354492, 8.570487976074219, 8.999100685119629, 9.427714347839355, 9.856328010559082, 10.284941673278809, 10.713554382324219, 11.142168045043945]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 11.0, 12.0, 26.0, 43.0, 65.0, 99.0, 148.0, 259.0, 450.0, 875.0, 1949.0, 5273.0, 25367.0, 417320.0, 3476781.0, 238772.0, 18603.0, 4680.0, 1748.0, 770.0, 419.0, 237.0, 143.0, 83.0, 53.0, 21.0, 19.0, 24.0, 11.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.21484375, -2.1613616943359375, -2.107879638671875, -2.0543975830078125, -2.00091552734375, -1.9474334716796875, -1.893951416015625, -1.8404693603515625, -1.7869873046875, -1.7335052490234375, -1.680023193359375, -1.6265411376953125, -1.57305908203125, -1.5195770263671875, -1.466094970703125, -1.4126129150390625, -1.359130859375, -1.3056488037109375, -1.252166748046875, -1.1986846923828125, -1.14520263671875, -1.0917205810546875, -1.038238525390625, -0.9847564697265625, -0.9312744140625, -0.8777923583984375, -0.824310302734375, -0.7708282470703125, -0.71734619140625, -0.6638641357421875, -0.610382080078125, -0.5569000244140625, -0.50341796875, -0.4499359130859375, -0.396453857421875, -0.3429718017578125, -0.28948974609375, -0.2360076904296875, -0.182525634765625, -0.1290435791015625, -0.0755615234375, -0.0220794677734375, 0.031402587890625, 0.0848846435546875, 0.13836669921875, 0.1918487548828125, 0.245330810546875, 0.2988128662109375, 0.352294921875, 0.4057769775390625, 0.459259033203125, 0.5127410888671875, 0.56622314453125, 0.6197052001953125, 0.673187255859375, 0.7266693115234375, 0.7801513671875, 0.8336334228515625, 0.887115478515625, 0.9405975341796875, 0.99407958984375, 1.0475616455078125, 1.101043701171875, 1.1545257568359375, 1.2080078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 0.0, 3.0, 7.0, 8.0, 10.0, 26.0, 18.0, 30.0, 29.0, 45.0, 54.0, 48.0, 53.0, 70.0, 59.0, 73.0, 70.0, 71.0, 58.0, 51.0, 46.0, 31.0, 32.0, 27.0, 24.0, 23.0, 12.0, 11.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9306640625, -0.9037399291992188, -0.8768157958984375, -0.8498916625976562, -0.822967529296875, -0.7960433959960938, -0.7691192626953125, -0.7421951293945312, -0.71527099609375, -0.6883468627929688, -0.6614227294921875, -0.6344985961914062, -0.607574462890625, -0.5806503295898438, -0.5537261962890625, -0.5268020629882812, -0.4998779296875, -0.47295379638671875, -0.4460296630859375, -0.41910552978515625, -0.392181396484375, -0.36525726318359375, -0.3383331298828125, -0.31140899658203125, -0.28448486328125, -0.25756072998046875, -0.2306365966796875, -0.20371246337890625, -0.176788330078125, -0.14986419677734375, -0.1229400634765625, -0.09601593017578125, -0.069091796875, -0.04216766357421875, -0.0152435302734375, 0.01168060302734375, 0.038604736328125, 0.06552886962890625, 0.0924530029296875, 0.11937713623046875, 0.14630126953125, 0.17322540283203125, 0.2001495361328125, 0.22707366943359375, 0.253997802734375, 0.28092193603515625, 0.3078460693359375, 0.33477020263671875, 0.3616943359375, 0.38861846923828125, 0.4155426025390625, 0.44246673583984375, 0.469390869140625, 0.49631500244140625, 0.5232391357421875, 0.5501632690429688, 0.57708740234375, 0.6040115356445312, 0.6309356689453125, 0.6578598022460938, 0.684783935546875, 0.7117080688476562, 0.7386322021484375, 0.7655563354492188, 0.79248046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 9.0, 11.0, 28.0, 35.0, 76.0, 141.0, 289.0, 654.0, 1646.0, 4527.0, 17918.0, 333963.0, 3768645.0, 52389.0, 8940.0, 2844.0, 1179.0, 491.0, 225.0, 115.0, 67.0, 29.0, 27.0, 9.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.8050537109375, -2.705810546875, -2.6065673828125, -2.50732421875, -2.4080810546875, -2.308837890625, -2.2095947265625, -2.1103515625, -2.0111083984375, -1.911865234375, -1.8126220703125, -1.71337890625, -1.6141357421875, -1.514892578125, -1.4156494140625, -1.31640625, -1.2171630859375, -1.117919921875, -1.0186767578125, -0.91943359375, -0.8201904296875, -0.720947265625, -0.6217041015625, -0.5224609375, -0.4232177734375, -0.323974609375, -0.2247314453125, -0.12548828125, -0.0262451171875, 0.072998046875, 0.1722412109375, 0.271484375, 0.3707275390625, 0.469970703125, 0.5692138671875, 0.66845703125, 0.7677001953125, 0.866943359375, 0.9661865234375, 1.0654296875, 1.1646728515625, 1.263916015625, 1.3631591796875, 1.46240234375, 1.5616455078125, 1.660888671875, 1.7601318359375, 1.859375, 1.9586181640625, 2.057861328125, 2.1571044921875, 2.25634765625, 2.3555908203125, 2.454833984375, 2.5540771484375, 2.6533203125, 2.7525634765625, 2.851806640625, 2.9510498046875, 3.05029296875, 3.1495361328125, 3.248779296875, 3.3480224609375, 3.447265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 10.0, 10.0, 20.0, 19.0, 35.0, 53.0, 132.0, 388.0, 957.0, 1293.0, 696.0, 225.0, 88.0, 52.0, 25.0, 13.0, 16.0, 12.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.1817626953125, -2.092041015625, -2.0023193359375, -1.91259765625, -1.8228759765625, -1.733154296875, -1.6434326171875, -1.5537109375, -1.4639892578125, -1.374267578125, -1.2845458984375, -1.19482421875, -1.1051025390625, -1.015380859375, -0.9256591796875, -0.8359375, -0.7462158203125, -0.656494140625, -0.5667724609375, -0.47705078125, -0.3873291015625, -0.297607421875, -0.2078857421875, -0.1181640625, -0.0284423828125, 0.061279296875, 0.1510009765625, 0.24072265625, 0.3304443359375, 0.420166015625, 0.5098876953125, 0.599609375, 0.6893310546875, 0.779052734375, 0.8687744140625, 0.95849609375, 1.0482177734375, 1.137939453125, 1.2276611328125, 1.3173828125, 1.4071044921875, 1.496826171875, 1.5865478515625, 1.67626953125, 1.7659912109375, 1.855712890625, 1.9454345703125, 2.03515625, 2.1248779296875, 2.214599609375, 2.3043212890625, 2.39404296875, 2.4837646484375, 2.573486328125, 2.6632080078125, 2.7529296875, 2.8426513671875, 2.932373046875, 3.0220947265625, 3.11181640625, 3.2015380859375, 3.291259765625, 3.3809814453125, 3.470703125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 9.0, 5.0, 19.0, 40.0, 81.0, 143.0, 263.0, 210.0, 107.0, 60.0, 26.0, 15.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.807705879211426, -13.204265594482422, -12.600826263427734, -11.99738597869873, -11.393945693969727, -10.790505409240723, -10.187065124511719, -9.583625793457031, -8.980185508728027, -8.376745223999023, -7.773305416107178, -7.169865608215332, -6.566425323486328, -5.962985038757324, -5.3595452308654785, -4.756105422973633, -4.152665138244629, -3.549225091934204, -2.9457850456237793, -2.3423449993133545, -1.7389049530029297, -1.1354649066925049, -0.5320248603820801, 0.07141494750976562, 0.6748552322387695, 1.2782952785491943, 1.8817353248596191, 2.485175371170044, 3.0886154174804688, 3.6920554637908936, 4.295495510101318, 4.898935317993164, 5.502376556396484, 6.105816841125488, 6.709256649017334, 7.31269645690918, 7.916136741638184, 8.519577026367188, 9.123016357421875, 9.726456642150879, 10.329896926879883, 10.933337211608887, 11.53677749633789, 12.140216827392578, 12.743657112121582, 13.347097396850586, 13.950536727905273, 14.553977012634277, 15.157417297363281, 15.760857582092285, 16.36429786682129, 16.967737197875977, 17.571178436279297, 18.174617767333984, 18.778057098388672, 19.38149642944336, 19.98493766784668, 20.588376998901367, 21.191818237304688, 21.795257568359375, 22.398696899414062, 23.002138137817383, 23.60557746887207, 24.20901870727539, 24.812458038330078]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 7.0, 8.0, 12.0, 14.0, 7.0, 17.0, 19.0, 27.0, 30.0, 29.0, 33.0, 46.0, 52.0, 51.0, 52.0, 58.0, 50.0, 51.0, 66.0, 60.0, 50.0, 56.0, 32.0, 27.0, 20.0, 25.0, 25.0, 14.0, 10.0, 11.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0], "bins": [-10.857721328735352, -10.576395034790039, -10.295068740844727, -10.013742446899414, -9.732416152954102, -9.451089859008789, -9.169763565063477, -8.888437271118164, -8.607110977172852, -8.325784683227539, -8.044458389282227, -7.763132095336914, -7.481805801391602, -7.200479507446289, -6.919153213500977, -6.637826919555664, -6.35650110244751, -6.075174808502197, -5.793848514556885, -5.512522220611572, -5.23119592666626, -4.949869632720947, -4.668543815612793, -4.3872175216674805, -4.105891227722168, -3.8245649337768555, -3.543238639831543, -3.2619123458862305, -2.980586051940918, -2.6992597579956055, -2.417933702468872, -2.1366074085235596, -1.8552813529968262, -1.5739550590515137, -1.2926287651062012, -1.0113025903701782, -0.7299762964248657, -0.4486500024795532, -0.16732382774353027, 0.11400246620178223, 0.3953287601470947, 0.6766550540924072, 0.957981288433075, 1.2393075227737427, 1.5206338167190552, 1.8019601106643677, 2.0832862854003906, 2.364612579345703, 2.6459388732910156, 2.927265167236328, 3.2085914611816406, 3.489917755126953, 3.7712440490722656, 4.052570343017578, 4.333896636962891, 4.615222930908203, 4.896549224853516, 5.177875518798828, 5.459201812744141, 5.740528106689453, 6.021854400634766, 6.303180694580078, 6.584506988525391, 6.865833282470703, 7.147159099578857]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 8.0, 5.0, 18.0, 23.0, 41.0, 73.0, 82.0, 215.0, 436.0, 1104.0, 3213.0, 12837.0, 72858.0, 512777.0, 380237.0, 50828.0, 9542.0, 2545.0, 933.0, 368.0, 158.0, 103.0, 70.0, 31.0, 16.0, 13.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.0769195556640625, -2.019073486328125, -1.9612274169921875, -1.90338134765625, -1.8455352783203125, -1.787689208984375, -1.7298431396484375, -1.6719970703125, -1.6141510009765625, -1.556304931640625, -1.4984588623046875, -1.44061279296875, -1.3827667236328125, -1.324920654296875, -1.2670745849609375, -1.209228515625, -1.1513824462890625, -1.093536376953125, -1.0356903076171875, -0.97784423828125, -0.9199981689453125, -0.862152099609375, -0.8043060302734375, -0.7464599609375, -0.6886138916015625, -0.630767822265625, -0.5729217529296875, -0.51507568359375, -0.4572296142578125, -0.399383544921875, -0.3415374755859375, -0.28369140625, -0.2258453369140625, -0.167999267578125, -0.1101531982421875, -0.05230712890625, 0.0055389404296875, 0.063385009765625, 0.1212310791015625, 0.1790771484375, 0.2369232177734375, 0.294769287109375, 0.3526153564453125, 0.41046142578125, 0.4683074951171875, 0.526153564453125, 0.5839996337890625, 0.641845703125, 0.6996917724609375, 0.757537841796875, 0.8153839111328125, 0.87322998046875, 0.9310760498046875, 0.988922119140625, 1.0467681884765625, 1.1046142578125, 1.1624603271484375, 1.220306396484375, 1.2781524658203125, 1.33599853515625, 1.3938446044921875, 1.451690673828125, 1.5095367431640625, 1.5673828125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 10.0, 3.0, 9.0, 16.0, 16.0, 20.0, 26.0, 25.0, 31.0, 25.0, 44.0, 38.0, 50.0, 41.0, 55.0, 50.0, 43.0, 45.0, 48.0, 57.0, 35.0, 41.0, 26.0, 31.0, 33.0, 21.0, 37.0, 26.0, 20.0, 11.0, 17.0, 8.0, 6.0, 15.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5380859375, -0.5165557861328125, -0.495025634765625, -0.4734954833984375, -0.45196533203125, -0.4304351806640625, -0.408905029296875, -0.3873748779296875, -0.3658447265625, -0.3443145751953125, -0.322784423828125, -0.3012542724609375, -0.27972412109375, -0.2581939697265625, -0.236663818359375, -0.2151336669921875, -0.193603515625, -0.1720733642578125, -0.150543212890625, -0.1290130615234375, -0.10748291015625, -0.0859527587890625, -0.064422607421875, -0.0428924560546875, -0.0213623046875, 0.0001678466796875, 0.021697998046875, 0.0432281494140625, 0.06475830078125, 0.0862884521484375, 0.107818603515625, 0.1293487548828125, 0.15087890625, 0.1724090576171875, 0.193939208984375, 0.2154693603515625, 0.23699951171875, 0.2585296630859375, 0.280059814453125, 0.3015899658203125, 0.3231201171875, 0.3446502685546875, 0.366180419921875, 0.3877105712890625, 0.40924072265625, 0.4307708740234375, 0.452301025390625, 0.4738311767578125, 0.495361328125, 0.5168914794921875, 0.538421630859375, 0.5599517822265625, 0.58148193359375, 0.6030120849609375, 0.624542236328125, 0.6460723876953125, 0.6676025390625, 0.6891326904296875, 0.710662841796875, 0.7321929931640625, 0.75372314453125, 0.7752532958984375, 0.796783447265625, 0.8183135986328125, 0.83984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 12.0, 14.0, 27.0, 34.0, 53.0, 114.0, 189.0, 419.0, 1182.0, 4838.0, 32359.0, 591457.0, 382970.0, 28495.0, 4434.0, 1106.0, 402.0, 188.0, 95.0, 50.0, 43.0, 24.0, 16.0, 8.0, 5.0, 8.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7822265625, -1.7046356201171875, -1.627044677734375, -1.5494537353515625, -1.47186279296875, -1.3942718505859375, -1.316680908203125, -1.2390899658203125, -1.1614990234375, -1.0839080810546875, -1.006317138671875, -0.9287261962890625, -0.85113525390625, -0.7735443115234375, -0.695953369140625, -0.6183624267578125, -0.540771484375, -0.4631805419921875, -0.385589599609375, -0.3079986572265625, -0.23040771484375, -0.1528167724609375, -0.075225830078125, 0.0023651123046875, 0.0799560546875, 0.1575469970703125, 0.235137939453125, 0.3127288818359375, 0.39031982421875, 0.4679107666015625, 0.545501708984375, 0.6230926513671875, 0.70068359375, 0.7782745361328125, 0.855865478515625, 0.9334564208984375, 1.01104736328125, 1.0886383056640625, 1.166229248046875, 1.2438201904296875, 1.3214111328125, 1.3990020751953125, 1.476593017578125, 1.5541839599609375, 1.63177490234375, 1.7093658447265625, 1.786956787109375, 1.8645477294921875, 1.942138671875, 2.0197296142578125, 2.097320556640625, 2.1749114990234375, 2.25250244140625, 2.3300933837890625, 2.407684326171875, 2.4852752685546875, 2.5628662109375, 2.6404571533203125, 2.718048095703125, 2.7956390380859375, 2.87322998046875, 2.9508209228515625, 3.028411865234375, 3.1060028076171875, 3.18359375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 12.0, 18.0, 18.0, 24.0, 40.0, 43.0, 45.0, 54.0, 50.0, 60.0, 68.0, 66.0, 57.0, 66.0, 73.0, 53.0, 43.0, 43.0, 29.0, 21.0, 16.0, 19.0, 13.0, 14.0, 12.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.905181884765625, -3.79473876953125, -3.684295654296875, -3.5738525390625, -3.463409423828125, -3.35296630859375, -3.242523193359375, -3.132080078125, -3.021636962890625, -2.91119384765625, -2.800750732421875, -2.6903076171875, -2.579864501953125, -2.46942138671875, -2.358978271484375, -2.24853515625, -2.138092041015625, -2.02764892578125, -1.917205810546875, -1.8067626953125, -1.696319580078125, -1.58587646484375, -1.475433349609375, -1.364990234375, -1.254547119140625, -1.14410400390625, -1.033660888671875, -0.9232177734375, -0.812774658203125, -0.70233154296875, -0.591888427734375, -0.4814453125, -0.371002197265625, -0.26055908203125, -0.150115966796875, -0.0396728515625, 0.070770263671875, 0.18121337890625, 0.291656494140625, 0.402099609375, 0.512542724609375, 0.62298583984375, 0.733428955078125, 0.8438720703125, 0.954315185546875, 1.06475830078125, 1.175201416015625, 1.28564453125, 1.396087646484375, 1.50653076171875, 1.616973876953125, 1.7274169921875, 1.837860107421875, 1.94830322265625, 2.058746337890625, 2.169189453125, 2.279632568359375, 2.39007568359375, 2.500518798828125, 2.6109619140625, 2.721405029296875, 2.83184814453125, 2.942291259765625, 3.052734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 4.0, 10.0, 9.0, 16.0, 23.0, 45.0, 57.0, 102.0, 142.0, 257.0, 491.0, 1126.0, 2827.0, 8767.0, 33654.0, 172064.0, 671198.0, 121223.0, 25231.0, 6877.0, 2426.0, 988.0, 463.0, 220.0, 110.0, 81.0, 44.0, 23.0, 17.0, 15.0, 12.0, 8.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65185546875, -0.6310958862304688, -0.6103363037109375, -0.5895767211914062, -0.568817138671875, -0.5480575561523438, -0.5272979736328125, -0.5065383911132812, -0.48577880859375, -0.46501922607421875, -0.4442596435546875, -0.42350006103515625, -0.402740478515625, -0.38198089599609375, -0.3612213134765625, -0.34046173095703125, -0.3197021484375, -0.29894256591796875, -0.2781829833984375, -0.25742340087890625, -0.236663818359375, -0.21590423583984375, -0.1951446533203125, -0.17438507080078125, -0.15362548828125, -0.13286590576171875, -0.1121063232421875, -0.09134674072265625, -0.070587158203125, -0.04982757568359375, -0.0290679931640625, -0.00830841064453125, 0.012451171875, 0.03321075439453125, 0.0539703369140625, 0.07472991943359375, 0.095489501953125, 0.11624908447265625, 0.1370086669921875, 0.15776824951171875, 0.17852783203125, 0.19928741455078125, 0.2200469970703125, 0.24080657958984375, 0.261566162109375, 0.28232574462890625, 0.3030853271484375, 0.32384490966796875, 0.3446044921875, 0.36536407470703125, 0.3861236572265625, 0.40688323974609375, 0.427642822265625, 0.44840240478515625, 0.4691619873046875, 0.48992156982421875, 0.51068115234375, 0.5314407348632812, 0.5522003173828125, 0.5729598999023438, 0.593719482421875, 0.6144790649414062, 0.6352386474609375, 0.6559982299804688, 0.6767578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 2.0, 4.0, 3.0, 5.0, 11.0, 3.0, 8.0, 15.0, 18.0, 26.0, 23.0, 40.0, 49.0, 59.0, 71.0, 76.0, 74.0, 67.0, 86.0, 67.0, 59.0, 57.0, 29.0, 33.0, 24.0, 16.0, 20.0, 11.0, 8.0, 4.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001366138458251953, -0.0001324079930782318, -0.0001282021403312683, -0.0001239962875843048, -0.00011979043483734131, -0.00011558458209037781, -0.0001113787293434143, -0.0001071728765964508, -0.0001029670238494873, -9.87611711025238e-05, -9.45553183555603e-05, -9.03494656085968e-05, -8.61436128616333e-05, -8.19377601146698e-05, -7.77319073677063e-05, -7.35260546207428e-05, -6.93202018737793e-05, -6.51143491268158e-05, -6.0908496379852295e-05, -5.6702643632888794e-05, -5.249679088592529e-05, -4.829093813896179e-05, -4.408508539199829e-05, -3.987923264503479e-05, -3.567337989807129e-05, -3.146752715110779e-05, -2.7261674404144287e-05, -2.3055821657180786e-05, -1.8849968910217285e-05, -1.4644116163253784e-05, -1.0438263416290283e-05, -6.232410669326782e-06, -2.0265579223632812e-06, 2.1792948246002197e-06, 6.385147571563721e-06, 1.0591000318527222e-05, 1.4796853065490723e-05, 1.9002705812454224e-05, 2.3208558559417725e-05, 2.7414411306381226e-05, 3.1620264053344727e-05, 3.582611680030823e-05, 4.003196954727173e-05, 4.423782229423523e-05, 4.844367504119873e-05, 5.264952778816223e-05, 5.685538053512573e-05, 6.106123328208923e-05, 6.526708602905273e-05, 6.947293877601624e-05, 7.367879152297974e-05, 7.788464426994324e-05, 8.209049701690674e-05, 8.629634976387024e-05, 9.050220251083374e-05, 9.470805525779724e-05, 9.891390800476074e-05, 0.00010311976075172424, 0.00010732561349868774, 0.00011153146624565125, 0.00011573731899261475, 0.00011994317173957825, 0.00012414902448654175, 0.00012835487723350525, 0.00013256072998046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 13.0, 14.0, 22.0, 29.0, 48.0, 78.0, 211.0, 496.0, 1613.0, 7460.0, 69919.0, 850436.0, 105754.0, 9483.0, 1868.0, 586.0, 226.0, 120.0, 53.0, 41.0, 21.0, 10.0, 14.0, 10.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.20703125, -1.1662139892578125, -1.125396728515625, -1.0845794677734375, -1.04376220703125, -1.0029449462890625, -0.962127685546875, -0.9213104248046875, -0.8804931640625, -0.8396759033203125, -0.798858642578125, -0.7580413818359375, -0.71722412109375, -0.6764068603515625, -0.635589599609375, -0.5947723388671875, -0.553955078125, -0.5131378173828125, -0.472320556640625, -0.4315032958984375, -0.39068603515625, -0.3498687744140625, -0.309051513671875, -0.2682342529296875, -0.2274169921875, -0.1865997314453125, -0.145782470703125, -0.1049652099609375, -0.06414794921875, -0.0233306884765625, 0.017486572265625, 0.0583038330078125, 0.09912109375, 0.1399383544921875, 0.180755615234375, 0.2215728759765625, 0.26239013671875, 0.3032073974609375, 0.344024658203125, 0.3848419189453125, 0.4256591796875, 0.4664764404296875, 0.507293701171875, 0.5481109619140625, 0.58892822265625, 0.6297454833984375, 0.670562744140625, 0.7113800048828125, 0.752197265625, 0.7930145263671875, 0.833831787109375, 0.8746490478515625, 0.91546630859375, 0.9562835693359375, 0.997100830078125, 1.0379180908203125, 1.0787353515625, 1.1195526123046875, 1.160369873046875, 1.2011871337890625, 1.24200439453125, 1.2828216552734375, 1.323638916015625, 1.3644561767578125, 1.4052734375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 11.0, 10.0, 13.0, 29.0, 23.0, 28.0, 38.0, 64.0, 42.0, 68.0, 79.0, 93.0, 84.0, 73.0, 70.0, 48.0, 39.0, 36.0, 26.0, 14.0, 17.0, 22.0, 12.0, 5.0, 3.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.509765625, -0.49175262451171875, -0.4737396240234375, -0.45572662353515625, -0.437713623046875, -0.41970062255859375, -0.4016876220703125, -0.38367462158203125, -0.36566162109375, -0.34764862060546875, -0.3296356201171875, -0.31162261962890625, -0.293609619140625, -0.27559661865234375, -0.2575836181640625, -0.23957061767578125, -0.2215576171875, -0.20354461669921875, -0.1855316162109375, -0.16751861572265625, -0.149505615234375, -0.13149261474609375, -0.1134796142578125, -0.09546661376953125, -0.07745361328125, -0.05944061279296875, -0.0414276123046875, -0.02341461181640625, -0.005401611328125, 0.01261138916015625, 0.0306243896484375, 0.04863739013671875, 0.066650390625, 0.08466339111328125, 0.1026763916015625, 0.12068939208984375, 0.138702392578125, 0.15671539306640625, 0.1747283935546875, 0.19274139404296875, 0.21075439453125, 0.22876739501953125, 0.2467803955078125, 0.26479339599609375, 0.282806396484375, 0.30081939697265625, 0.3188323974609375, 0.33684539794921875, 0.3548583984375, 0.37287139892578125, 0.3908843994140625, 0.40889739990234375, 0.426910400390625, 0.44492340087890625, 0.4629364013671875, 0.48094940185546875, 0.49896240234375, 0.5169754028320312, 0.5349884033203125, 0.5530014038085938, 0.571014404296875, 0.5890274047851562, 0.6070404052734375, 0.6250534057617188, 0.64306640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 22.0, 72.0, 164.0, 373.0, 216.0, 83.0, 23.0, 14.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.668895721435547, -24.96940040588379, -24.26990509033203, -23.570409774780273, -22.870914459228516, -22.171419143676758, -21.471923828125, -20.772428512573242, -20.072933197021484, -19.373437881469727, -18.67394256591797, -17.97444725036621, -17.274951934814453, -16.575456619262695, -15.875961303710938, -15.17646598815918, -14.476970672607422, -13.777475357055664, -13.077980041503906, -12.378484725952148, -11.67898941040039, -10.979494094848633, -10.279998779296875, -9.580503463745117, -8.88100814819336, -8.181512832641602, -7.482017517089844, -6.782522201538086, -6.083026885986328, -5.38353157043457, -4.6840362548828125, -3.9845409393310547, -3.2850475311279297, -2.585552215576172, -1.886056900024414, -1.1865615844726562, -0.48706626892089844, 0.21242904663085938, 0.9119243621826172, 1.611419677734375, 2.310914993286133, 3.0104103088378906, 3.7099056243896484, 4.409400939941406, 5.108896255493164, 5.808391571044922, 6.50788688659668, 7.2073822021484375, 7.906877517700195, 8.606372833251953, 9.305868148803711, 10.005363464355469, 10.704858779907227, 11.404354095458984, 12.103849411010742, 12.8033447265625, 13.502840042114258, 14.202335357666016, 14.901830673217773, 15.601325988769531, 16.30082130432129, 17.000316619873047, 17.699811935424805, 18.399307250976562, 19.09880256652832]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 4.0, 6.0, 8.0, 9.0, 8.0, 20.0, 20.0, 27.0, 29.0, 26.0, 26.0, 25.0, 23.0, 35.0, 52.0, 58.0, 71.0, 70.0, 82.0, 57.0, 46.0, 38.0, 29.0, 34.0, 29.0, 34.0, 30.0, 16.0, 13.0, 14.0, 14.0, 12.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.193066596984863, -10.83924388885498, -10.485422134399414, -10.131599426269531, -9.777776718139648, -9.423954963684082, -9.0701322555542, -8.716310501098633, -8.36248779296875, -8.008665084838867, -7.654842853546143, -7.301020622253418, -6.947198390960693, -6.593376159667969, -6.239553451538086, -5.885731220245361, -5.5319085121154785, -5.178086280822754, -4.824263572692871, -4.4704413414001465, -4.116619110107422, -3.762796640396118, -3.4089741706848145, -3.05515193939209, -2.701329469680786, -2.3475069999694824, -1.9936847686767578, -1.639862298965454, -1.28603994846344, -0.9322175979614258, -0.5783951282501221, -0.22457289695739746, 0.12924957275390625, 0.4830719530582428, 0.8368943333625793, 1.1907167434692383, 1.5445390939712524, 1.8983614444732666, 2.2521839141845703, 2.606006145477295, 2.9598286151885986, 3.3136510848999023, 3.667473316192627, 4.021295547485352, 4.375118255615234, 4.728940486907959, 5.082762718200684, 5.436585426330566, 5.790407657623291, 6.144229888916016, 6.498052597045898, 6.851874828338623, 7.205697059631348, 7.5595197677612305, 7.913341999053955, 8.26716423034668, 8.620986938476562, 8.974809646606445, 9.328631401062012, 9.682454109191895, 10.036276817321777, 10.390098571777344, 10.743921279907227, 11.09774398803711, 11.451565742492676]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 9.0, 14.0, 15.0, 17.0, 36.0, 55.0, 82.0, 177.0, 284.0, 489.0, 851.0, 1550.0, 3777.0, 12221.0, 242826.0, 3790682.0, 124452.0, 9916.0, 3361.0, 1465.0, 839.0, 428.0, 281.0, 154.0, 102.0, 59.0, 43.0, 23.0, 27.0, 13.0, 10.0, 5.0, 5.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.636322021484375, -2.55975341796875, -2.483184814453125, -2.4066162109375, -2.330047607421875, -2.25347900390625, -2.176910400390625, -2.100341796875, -2.023773193359375, -1.94720458984375, -1.870635986328125, -1.7940673828125, -1.717498779296875, -1.64093017578125, -1.564361572265625, -1.48779296875, -1.411224365234375, -1.33465576171875, -1.258087158203125, -1.1815185546875, -1.104949951171875, -1.02838134765625, -0.951812744140625, -0.875244140625, -0.798675537109375, -0.72210693359375, -0.645538330078125, -0.5689697265625, -0.492401123046875, -0.41583251953125, -0.339263916015625, -0.2626953125, -0.186126708984375, -0.10955810546875, -0.032989501953125, 0.0435791015625, 0.120147705078125, 0.19671630859375, 0.273284912109375, 0.349853515625, 0.426422119140625, 0.50299072265625, 0.579559326171875, 0.6561279296875, 0.732696533203125, 0.80926513671875, 0.885833740234375, 0.96240234375, 1.038970947265625, 1.11553955078125, 1.192108154296875, 1.2686767578125, 1.345245361328125, 1.42181396484375, 1.498382568359375, 1.574951171875, 1.651519775390625, 1.72808837890625, 1.804656982421875, 1.8812255859375, 1.957794189453125, 2.03436279296875, 2.110931396484375, 2.1875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 13.0, 20.0, 9.0, 15.0, 18.0, 27.0, 26.0, 39.0, 32.0, 27.0, 43.0, 34.0, 37.0, 60.0, 58.0, 47.0, 38.0, 39.0, 48.0, 43.0, 36.0, 44.0, 35.0, 26.0, 33.0, 20.0, 22.0, 14.0, 10.0, 16.0, 10.0, 11.0, 5.0, 11.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.72705078125, -0.7073287963867188, -0.6876068115234375, -0.6678848266601562, -0.648162841796875, -0.6284408569335938, -0.6087188720703125, -0.5889968872070312, -0.56927490234375, -0.5495529174804688, -0.5298309326171875, -0.5101089477539062, -0.490386962890625, -0.47066497802734375, -0.4509429931640625, -0.43122100830078125, -0.4114990234375, -0.39177703857421875, -0.3720550537109375, -0.35233306884765625, -0.332611083984375, -0.31288909912109375, -0.2931671142578125, -0.27344512939453125, -0.25372314453125, -0.23400115966796875, -0.2142791748046875, -0.19455718994140625, -0.174835205078125, -0.15511322021484375, -0.1353912353515625, -0.11566925048828125, -0.095947265625, -0.07622528076171875, -0.0565032958984375, -0.03678131103515625, -0.017059326171875, 0.00266265869140625, 0.0223846435546875, 0.04210662841796875, 0.06182861328125, 0.08155059814453125, 0.1012725830078125, 0.12099456787109375, 0.140716552734375, 0.16043853759765625, 0.1801605224609375, 0.19988250732421875, 0.2196044921875, 0.23932647705078125, 0.2590484619140625, 0.27877044677734375, 0.298492431640625, 0.31821441650390625, 0.3379364013671875, 0.35765838623046875, 0.37738037109375, 0.39710235595703125, 0.4168243408203125, 0.43654632568359375, 0.456268310546875, 0.47599029541015625, 0.4957122802734375, 0.5154342651367188, 0.53515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 17.0, 18.0, 35.0, 47.0, 69.0, 130.0, 228.0, 391.0, 755.0, 1471.0, 3225.0, 8243.0, 31406.0, 796423.0, 3267203.0, 63836.0, 12224.0, 4492.0, 1960.0, 933.0, 494.0, 290.0, 135.0, 96.0, 45.0, 30.0, 19.0, 14.0, 12.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.64453125, -2.5693359375, -2.494140625, -2.4189453125, -2.34375, -2.2685546875, -2.193359375, -2.1181640625, -2.04296875, -1.9677734375, -1.892578125, -1.8173828125, -1.7421875, -1.6669921875, -1.591796875, -1.5166015625, -1.44140625, -1.3662109375, -1.291015625, -1.2158203125, -1.140625, -1.0654296875, -0.990234375, -0.9150390625, -0.83984375, -0.7646484375, -0.689453125, -0.6142578125, -0.5390625, -0.4638671875, -0.388671875, -0.3134765625, -0.23828125, -0.1630859375, -0.087890625, -0.0126953125, 0.0625, 0.1376953125, 0.212890625, 0.2880859375, 0.36328125, 0.4384765625, 0.513671875, 0.5888671875, 0.6640625, 0.7392578125, 0.814453125, 0.8896484375, 0.96484375, 1.0400390625, 1.115234375, 1.1904296875, 1.265625, 1.3408203125, 1.416015625, 1.4912109375, 1.56640625, 1.6416015625, 1.716796875, 1.7919921875, 1.8671875, 1.9423828125, 2.017578125, 2.0927734375, 2.16796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 10.0, 24.0, 35.0, 62.0, 119.0, 318.0, 656.0, 1164.0, 878.0, 395.0, 169.0, 77.0, 49.0, 28.0, 18.0, 9.0, 11.0, 3.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.627197265625, -2.54931640625, -2.471435546875, -2.3935546875, -2.315673828125, -2.23779296875, -2.159912109375, -2.08203125, -2.004150390625, -1.92626953125, -1.848388671875, -1.7705078125, -1.692626953125, -1.61474609375, -1.536865234375, -1.458984375, -1.381103515625, -1.30322265625, -1.225341796875, -1.1474609375, -1.069580078125, -0.99169921875, -0.913818359375, -0.8359375, -0.758056640625, -0.68017578125, -0.602294921875, -0.5244140625, -0.446533203125, -0.36865234375, -0.290771484375, -0.212890625, -0.135009765625, -0.05712890625, 0.020751953125, 0.0986328125, 0.176513671875, 0.25439453125, 0.332275390625, 0.41015625, 0.488037109375, 0.56591796875, 0.643798828125, 0.7216796875, 0.799560546875, 0.87744140625, 0.955322265625, 1.033203125, 1.111083984375, 1.18896484375, 1.266845703125, 1.3447265625, 1.422607421875, 1.50048828125, 1.578369140625, 1.65625, 1.734130859375, 1.81201171875, 1.889892578125, 1.9677734375, 2.045654296875, 2.12353515625, 2.201416015625, 2.279296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 6.0, 13.0, 32.0, 82.0, 166.0, 246.0, 223.0, 114.0, 64.0, 34.0, 10.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.494823455810547, -29.815614700317383, -29.136404037475586, -28.457195281982422, -27.777984619140625, -27.09877586364746, -26.419567108154297, -25.7403564453125, -25.061147689819336, -24.381938934326172, -23.702728271484375, -23.02351951599121, -22.344310760498047, -21.66510009765625, -20.985891342163086, -20.306682586669922, -19.627471923828125, -18.94826316833496, -18.269052505493164, -17.58984375, -16.910633087158203, -16.23142433166504, -15.552215576171875, -14.873005867004395, -14.193796157836914, -13.514586448669434, -12.835376739501953, -12.156167984008789, -11.476958274841309, -10.797748565673828, -10.118539810180664, -9.439330101013184, -8.760120391845703, -8.080910682678223, -7.4017014503479, -6.722492218017578, -6.043282508850098, -5.364072799682617, -4.684863567352295, -4.005654335021973, -3.326444625854492, -2.647235155105591, -1.9680256843566895, -1.288816213607788, -0.6096067428588867, 0.06960272789001465, 0.748812198638916, 1.4280214309692383, 2.1072311401367188, 2.78644061088562, 3.4656500816345215, 4.144859313964844, 4.824069023132324, 5.503278732299805, 6.182487964630127, 6.861697196960449, 7.54090690612793, 8.22011661529541, 8.89932632446289, 9.578535079956055, 10.257744789123535, 10.936954498291016, 11.61616325378418, 12.29537296295166, 12.97458267211914]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 4.0, 11.0, 18.0, 13.0, 13.0, 12.0, 21.0, 16.0, 28.0, 25.0, 28.0, 27.0, 30.0, 35.0, 32.0, 42.0, 44.0, 42.0, 36.0, 40.0, 44.0, 45.0, 38.0, 40.0, 38.0, 39.0, 36.0, 19.0, 19.0, 20.0, 17.0, 9.0, 18.0, 13.0, 11.0, 8.0, 13.0, 8.0, 7.0, 6.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.378134250640869, -6.17901086807251, -5.979887008666992, -5.780763626098633, -5.581640243530273, -5.382516860961914, -5.183393478393555, -4.984269618988037, -4.785146236419678, -4.586022853851318, -4.386898994445801, -4.187775611877441, -3.988652229309082, -3.7895288467407227, -3.590405225753784, -3.3912816047668457, -3.1921582221984863, -2.993034839630127, -2.7939112186431885, -2.59478759765625, -2.3956642150878906, -2.1965408325195312, -1.9974172115325928, -1.7982937097549438, -1.599170207977295, -1.400046706199646, -1.200923204421997, -1.0017997026443481, -0.8026762008666992, -0.6035526990890503, -0.40442919731140137, -0.20530569553375244, -0.0061817169189453125, 0.1929417848587036, 0.39206528663635254, 0.5911887884140015, 0.7903122901916504, 0.9894357919692993, 1.1885592937469482, 1.3876827955245972, 1.586806297302246, 1.785929799079895, 1.985053300857544, 2.1841769218444824, 2.383300304412842, 2.582423686981201, 2.7815473079681396, 2.980670928955078, 3.1797943115234375, 3.378917694091797, 3.5780413150787354, 3.777164936065674, 3.976288318634033, 4.175411701202393, 4.37453556060791, 4.5736589431762695, 4.772782325744629, 4.971905708312988, 5.171029090881348, 5.370152950286865, 5.569276332855225, 5.768399715423584, 5.967523574829102, 6.166646957397461, 6.36577033996582]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 13.0, 8.0, 12.0, 16.0, 29.0, 42.0, 61.0, 78.0, 132.0, 227.0, 382.0, 706.0, 1662.0, 4289.0, 17114.0, 170561.0, 765037.0, 72095.0, 10255.0, 3060.0, 1319.0, 595.0, 285.0, 205.0, 122.0, 89.0, 57.0, 31.0, 29.0, 16.0, 13.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.478851318359375, -2.39715576171875, -2.315460205078125, -2.2337646484375, -2.152069091796875, -2.07037353515625, -1.988677978515625, -1.906982421875, -1.825286865234375, -1.74359130859375, -1.661895751953125, -1.5802001953125, -1.498504638671875, -1.41680908203125, -1.335113525390625, -1.25341796875, -1.171722412109375, -1.09002685546875, -1.008331298828125, -0.9266357421875, -0.844940185546875, -0.76324462890625, -0.681549072265625, -0.599853515625, -0.518157958984375, -0.43646240234375, -0.354766845703125, -0.2730712890625, -0.191375732421875, -0.10968017578125, -0.027984619140625, 0.0537109375, 0.135406494140625, 0.21710205078125, 0.298797607421875, 0.3804931640625, 0.462188720703125, 0.54388427734375, 0.625579833984375, 0.707275390625, 0.788970947265625, 0.87066650390625, 0.952362060546875, 1.0340576171875, 1.115753173828125, 1.19744873046875, 1.279144287109375, 1.36083984375, 1.442535400390625, 1.52423095703125, 1.605926513671875, 1.6876220703125, 1.769317626953125, 1.85101318359375, 1.932708740234375, 2.014404296875, 2.096099853515625, 2.17779541015625, 2.259490966796875, 2.3411865234375, 2.422882080078125, 2.50457763671875, 2.586273193359375, 2.66796875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 6.0, 13.0, 14.0, 12.0, 18.0, 21.0, 20.0, 24.0, 19.0, 29.0, 45.0, 42.0, 48.0, 44.0, 41.0, 49.0, 61.0, 51.0, 45.0, 44.0, 44.0, 43.0, 33.0, 35.0, 29.0, 33.0, 24.0, 17.0, 14.0, 18.0, 14.0, 7.0, 7.0, 14.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68212890625, -0.659210205078125, -0.63629150390625, -0.613372802734375, -0.5904541015625, -0.567535400390625, -0.54461669921875, -0.521697998046875, -0.498779296875, -0.475860595703125, -0.45294189453125, -0.430023193359375, -0.4071044921875, -0.384185791015625, -0.36126708984375, -0.338348388671875, -0.3154296875, -0.292510986328125, -0.26959228515625, -0.246673583984375, -0.2237548828125, -0.200836181640625, -0.17791748046875, -0.154998779296875, -0.132080078125, -0.109161376953125, -0.08624267578125, -0.063323974609375, -0.0404052734375, -0.017486572265625, 0.00543212890625, 0.028350830078125, 0.05126953125, 0.074188232421875, 0.09710693359375, 0.120025634765625, 0.1429443359375, 0.165863037109375, 0.18878173828125, 0.211700439453125, 0.234619140625, 0.257537841796875, 0.28045654296875, 0.303375244140625, 0.3262939453125, 0.349212646484375, 0.37213134765625, 0.395050048828125, 0.41796875, 0.440887451171875, 0.46380615234375, 0.486724853515625, 0.5096435546875, 0.532562255859375, 0.55548095703125, 0.578399658203125, 0.601318359375, 0.624237060546875, 0.64715576171875, 0.670074462890625, 0.6929931640625, 0.715911865234375, 0.73883056640625, 0.761749267578125, 0.78466796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 16.0, 18.0, 13.0, 43.0, 68.0, 74.0, 107.0, 171.0, 289.0, 521.0, 789.0, 1635.0, 3713.0, 13115.0, 113745.0, 835936.0, 62441.0, 9597.0, 2985.0, 1343.0, 707.0, 398.0, 259.0, 165.0, 120.0, 92.0, 41.0, 36.0, 26.0, 15.0, 17.0, 13.0, 5.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.50390625, -2.42413330078125, -2.3443603515625, -2.26458740234375, -2.184814453125, -2.10504150390625, -2.0252685546875, -1.94549560546875, -1.86572265625, -1.78594970703125, -1.7061767578125, -1.62640380859375, -1.546630859375, -1.46685791015625, -1.3870849609375, -1.30731201171875, -1.2275390625, -1.14776611328125, -1.0679931640625, -0.98822021484375, -0.908447265625, -0.82867431640625, -0.7489013671875, -0.66912841796875, -0.58935546875, -0.50958251953125, -0.4298095703125, -0.35003662109375, -0.270263671875, -0.19049072265625, -0.1107177734375, -0.03094482421875, 0.048828125, 0.12860107421875, 0.2083740234375, 0.28814697265625, 0.367919921875, 0.44769287109375, 0.5274658203125, 0.60723876953125, 0.68701171875, 0.76678466796875, 0.8465576171875, 0.92633056640625, 1.006103515625, 1.08587646484375, 1.1656494140625, 1.24542236328125, 1.3251953125, 1.40496826171875, 1.4847412109375, 1.56451416015625, 1.644287109375, 1.72406005859375, 1.8038330078125, 1.88360595703125, 1.96337890625, 2.04315185546875, 2.1229248046875, 2.20269775390625, 2.282470703125, 2.36224365234375, 2.4420166015625, 2.52178955078125, 2.6015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 3.0, 5.0, 9.0, 8.0, 10.0, 20.0, 14.0, 18.0, 32.0, 26.0, 27.0, 41.0, 57.0, 49.0, 63.0, 59.0, 61.0, 45.0, 58.0, 54.0, 40.0, 47.0, 45.0, 25.0, 25.0, 25.0, 38.0, 22.0, 15.0, 7.0, 6.0, 12.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.84039306640625, -2.7452392578125, -2.65008544921875, -2.554931640625, -2.45977783203125, -2.3646240234375, -2.26947021484375, -2.17431640625, -2.07916259765625, -1.9840087890625, -1.88885498046875, -1.793701171875, -1.69854736328125, -1.6033935546875, -1.50823974609375, -1.4130859375, -1.31793212890625, -1.2227783203125, -1.12762451171875, -1.032470703125, -0.93731689453125, -0.8421630859375, -0.74700927734375, -0.65185546875, -0.55670166015625, -0.4615478515625, -0.36639404296875, -0.271240234375, -0.17608642578125, -0.0809326171875, 0.01422119140625, 0.109375, 0.20452880859375, 0.2996826171875, 0.39483642578125, 0.489990234375, 0.58514404296875, 0.6802978515625, 0.77545166015625, 0.87060546875, 0.96575927734375, 1.0609130859375, 1.15606689453125, 1.251220703125, 1.34637451171875, 1.4415283203125, 1.53668212890625, 1.6318359375, 1.72698974609375, 1.8221435546875, 1.91729736328125, 2.012451171875, 2.10760498046875, 2.2027587890625, 2.29791259765625, 2.39306640625, 2.48822021484375, 2.5833740234375, 2.67852783203125, 2.773681640625, 2.86883544921875, 2.9639892578125, 3.05914306640625, 3.154296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 8.0, 10.0, 8.0, 19.0, 22.0, 35.0, 39.0, 60.0, 82.0, 100.0, 174.0, 237.0, 415.0, 690.0, 1417.0, 2974.0, 7033.0, 19073.0, 64977.0, 550092.0, 311346.0, 59398.0, 17886.0, 6606.0, 2708.0, 1252.0, 698.0, 432.0, 214.0, 167.0, 114.0, 65.0, 57.0, 32.0, 25.0, 22.0, 19.0, 7.0, 12.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4423828125, -0.42761993408203125, -0.4128570556640625, -0.39809417724609375, -0.383331298828125, -0.36856842041015625, -0.3538055419921875, -0.33904266357421875, -0.32427978515625, -0.30951690673828125, -0.2947540283203125, -0.27999114990234375, -0.265228271484375, -0.25046539306640625, -0.2357025146484375, -0.22093963623046875, -0.2061767578125, -0.19141387939453125, -0.1766510009765625, -0.16188812255859375, -0.147125244140625, -0.13236236572265625, -0.1175994873046875, -0.10283660888671875, -0.08807373046875, -0.07331085205078125, -0.0585479736328125, -0.04378509521484375, -0.029022216796875, -0.01425933837890625, 0.0005035400390625, 0.01526641845703125, 0.030029296875, 0.04479217529296875, 0.0595550537109375, 0.07431793212890625, 0.089080810546875, 0.10384368896484375, 0.1186065673828125, 0.13336944580078125, 0.14813232421875, 0.16289520263671875, 0.1776580810546875, 0.19242095947265625, 0.207183837890625, 0.22194671630859375, 0.2367095947265625, 0.25147247314453125, 0.2662353515625, 0.28099822998046875, 0.2957611083984375, 0.31052398681640625, 0.325286865234375, 0.34004974365234375, 0.3548126220703125, 0.36957550048828125, 0.38433837890625, 0.39910125732421875, 0.4138641357421875, 0.42862701416015625, 0.443389892578125, 0.45815277099609375, 0.4729156494140625, 0.48767852783203125, 0.50244140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 14.0, 9.0, 20.0, 17.0, 38.0, 75.0, 100.0, 142.0, 148.0, 144.0, 83.0, 46.0, 41.0, 19.0, 20.0, 11.0, 17.0, 11.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016379356384277344, -0.00015759654343128204, -0.00015139952301979065, -0.00014520250260829926, -0.00013900548219680786, -0.00013280846178531647, -0.00012661144137382507, -0.00012041442096233368, -0.00011421740055084229, -0.00010802038013935089, -0.0001018233597278595, -9.56263393163681e-05, -8.942931890487671e-05, -8.323229849338531e-05, -7.703527808189392e-05, -7.083825767040253e-05, -6.464123725891113e-05, -5.844421684741974e-05, -5.2247196435928345e-05, -4.605017602443695e-05, -3.985315561294556e-05, -3.365613520145416e-05, -2.745911478996277e-05, -2.1262094378471375e-05, -1.506507396697998e-05, -8.868053555488586e-06, -2.6710331439971924e-06, 3.5259872674942017e-06, 9.723007678985596e-06, 1.592002809047699e-05, 2.2117048501968384e-05, 2.8314068913459778e-05, 3.451108932495117e-05, 4.0708109736442566e-05, 4.690513014793396e-05, 5.3102150559425354e-05, 5.929917097091675e-05, 6.549619138240814e-05, 7.169321179389954e-05, 7.789023220539093e-05, 8.408725261688232e-05, 9.028427302837372e-05, 9.648129343986511e-05, 0.0001026783138513565, 0.0001088753342628479, 0.0001150723546743393, 0.00012126937508583069, 0.00012746639549732208, 0.00013366341590881348, 0.00013986043632030487, 0.00014605745673179626, 0.00015225447714328766, 0.00015845149755477905, 0.00016464851796627045, 0.00017084553837776184, 0.00017704255878925323, 0.00018323957920074463, 0.00018943659961223602, 0.00019563362002372742, 0.0002018306404352188, 0.0002080276608467102, 0.0002142246812582016, 0.000220421701669693, 0.0002266187220811844, 0.00023281574249267578]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 0.0, 6.0, 5.0, 7.0, 7.0, 17.0, 15.0, 36.0, 36.0, 50.0, 82.0, 122.0, 230.0, 327.0, 617.0, 1033.0, 2012.0, 4200.0, 10196.0, 28896.0, 111126.0, 674744.0, 154911.0, 37288.0, 12553.0, 4951.0, 2270.0, 1103.0, 655.0, 376.0, 242.0, 130.0, 100.0, 75.0, 40.0, 31.0, 16.0, 16.0, 7.0, 7.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0], "bins": [-0.5908203125, -0.5751075744628906, -0.5593948364257812, -0.5436820983886719, -0.5279693603515625, -0.5122566223144531, -0.49654388427734375, -0.4808311462402344, -0.465118408203125, -0.4494056701660156, -0.43369293212890625, -0.4179801940917969, -0.4022674560546875, -0.3865547180175781, -0.37084197998046875, -0.3551292419433594, -0.33941650390625, -0.3237037658691406, -0.30799102783203125, -0.2922782897949219, -0.2765655517578125, -0.2608528137207031, -0.24514007568359375, -0.22942733764648438, -0.213714599609375, -0.19800186157226562, -0.18228912353515625, -0.16657638549804688, -0.1508636474609375, -0.13515090942382812, -0.11943817138671875, -0.10372543334960938, -0.0880126953125, -0.07229995727539062, -0.05658721923828125, -0.040874481201171875, -0.0251617431640625, -0.009449005126953125, 0.00626373291015625, 0.021976470947265625, 0.037689208984375, 0.053401947021484375, 0.06911468505859375, 0.08482742309570312, 0.1005401611328125, 0.11625289916992188, 0.13196563720703125, 0.14767837524414062, 0.16339111328125, 0.17910385131835938, 0.19481658935546875, 0.21052932739257812, 0.2262420654296875, 0.24195480346679688, 0.25766754150390625, 0.2733802795410156, 0.289093017578125, 0.3048057556152344, 0.32051849365234375, 0.3362312316894531, 0.3519439697265625, 0.3676567077636719, 0.38336944580078125, 0.3990821838378906, 0.414794921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 17.0, 12.0, 14.0, 33.0, 42.0, 39.0, 77.0, 90.0, 104.0, 114.0, 117.0, 75.0, 48.0, 40.0, 30.0, 28.0, 27.0, 19.0, 12.0, 8.0, 5.0, 8.0, 4.0, 3.0, 5.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6403274536132812, -0.6204986572265625, -0.6006698608398438, -0.580841064453125, -0.5610122680664062, -0.5411834716796875, -0.5213546752929688, -0.50152587890625, -0.48169708251953125, -0.4618682861328125, -0.44203948974609375, -0.422210693359375, -0.40238189697265625, -0.3825531005859375, -0.36272430419921875, -0.3428955078125, -0.32306671142578125, -0.3032379150390625, -0.28340911865234375, -0.263580322265625, -0.24375152587890625, -0.2239227294921875, -0.20409393310546875, -0.18426513671875, -0.16443634033203125, -0.1446075439453125, -0.12477874755859375, -0.104949951171875, -0.08512115478515625, -0.0652923583984375, -0.04546356201171875, -0.025634765625, -0.00580596923828125, 0.0140228271484375, 0.03385162353515625, 0.053680419921875, 0.07350921630859375, 0.0933380126953125, 0.11316680908203125, 0.13299560546875, 0.15282440185546875, 0.1726531982421875, 0.19248199462890625, 0.212310791015625, 0.23213958740234375, 0.2519683837890625, 0.27179718017578125, 0.2916259765625, 0.31145477294921875, 0.3312835693359375, 0.35111236572265625, 0.370941162109375, 0.39076995849609375, 0.4105987548828125, 0.43042755126953125, 0.45025634765625, 0.47008514404296875, 0.4899139404296875, 0.5097427368164062, 0.529571533203125, 0.5494003295898438, 0.5692291259765625, 0.5890579223632812, 0.60888671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 13.0, 17.0, 21.0, 50.0, 62.0, 107.0, 249.0, 197.0, 102.0, 61.0, 41.0, 28.0, 16.0, 9.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.762823104858398, -12.3496675491333, -11.936511039733887, -11.523355484008789, -11.110198974609375, -10.697043418884277, -10.28388786315918, -9.870731353759766, -9.457575798034668, -9.04442024230957, -8.631263732910156, -8.218108177185059, -7.804952144622803, -7.391796112060547, -6.978640556335449, -6.565484523773193, -6.1523284912109375, -5.739172458648682, -5.326016426086426, -4.912860870361328, -4.499704837799072, -4.086548805236816, -3.6733930110931396, -3.260237216949463, -2.847081184387207, -2.433925151824951, -2.0207693576812744, -1.607613444328308, -1.1944575309753418, -0.7813014984130859, -0.3681457042694092, 0.04501008987426758, 0.45816612243652344, 0.8713220357894897, 1.284477949142456, 1.6976338624954224, 2.1107897758483887, 2.5239458084106445, 2.9371016025543213, 3.350257396697998, 3.763413429260254, 4.17656946182251, 4.589725494384766, 5.002881050109863, 5.416037082672119, 5.829193115234375, 6.242348670959473, 6.6555047035217285, 7.068660736083984, 7.48181676864624, 7.894972801208496, 8.308128356933594, 8.721284866333008, 9.134440422058105, 9.547595977783203, 9.960752487182617, 10.373908042907715, 10.787063598632812, 11.200220108032227, 11.613375663757324, 12.026531219482422, 12.439687728881836, 12.852843284606934, 13.265998840332031, 13.679155349731445]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 8.0, 7.0, 6.0, 2.0, 4.0, 9.0, 19.0, 9.0, 19.0, 16.0, 16.0, 24.0, 19.0, 28.0, 22.0, 28.0, 40.0, 37.0, 68.0, 108.0, 100.0, 75.0, 52.0, 41.0, 23.0, 26.0, 20.0, 20.0, 20.0, 25.0, 25.0, 10.0, 18.0, 16.0, 9.0, 11.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-11.756427764892578, -11.410192489624023, -11.063956260681152, -10.717720985412598, -10.371485710144043, -10.025249481201172, -9.679014205932617, -9.332778930664062, -8.986543655395508, -8.640308380126953, -8.294072151184082, -7.947836875915527, -7.601601600646973, -7.25536584854126, -6.909130096435547, -6.562894821166992, -6.216658592224121, -5.870422840118408, -5.5241875648498535, -5.177951812744141, -4.831716537475586, -4.485480785369873, -4.13924503326416, -3.7930095195770264, -3.4467740058898926, -3.100538492202759, -2.754302978515625, -2.408067226409912, -2.0618317127227783, -1.7155961990356445, -1.3693604469299316, -1.0231249332427979, -0.6768903732299805, -0.3306547999382019, 0.01558077335357666, 0.36181640625, 0.7080519199371338, 1.0542874336242676, 1.4005231857299805, 1.7467586994171143, 2.092994213104248, 2.439229726791382, 2.7854652404785156, 3.1317009925842285, 3.4779365062713623, 3.824172019958496, 4.170407772064209, 4.516643524169922, 4.862878799438477, 5.2091145515441895, 5.555349826812744, 5.901585578918457, 6.247820854187012, 6.594056606292725, 6.9402923583984375, 7.286527633666992, 7.632763385772705, 7.978999137878418, 8.325234413146973, 8.671470642089844, 9.017705917358398, 9.363941192626953, 9.710176467895508, 10.056412696838379, 10.402647972106934]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 9.0, 13.0, 18.0, 29.0, 43.0, 75.0, 120.0, 164.0, 258.0, 427.0, 700.0, 1108.0, 1932.0, 3800.0, 13265.0, 199949.0, 3420944.0, 518818.0, 21632.0, 5107.0, 2389.0, 1346.0, 777.0, 479.0, 269.0, 190.0, 127.0, 99.0, 61.0, 29.0, 32.0, 15.0, 18.0, 8.0, 6.0, 6.0, 8.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.73065185546875, -1.6722412109375, -1.61383056640625, -1.555419921875, -1.49700927734375, -1.4385986328125, -1.38018798828125, -1.32177734375, -1.26336669921875, -1.2049560546875, -1.14654541015625, -1.088134765625, -1.02972412109375, -0.9713134765625, -0.91290283203125, -0.8544921875, -0.79608154296875, -0.7376708984375, -0.67926025390625, -0.620849609375, -0.56243896484375, -0.5040283203125, -0.44561767578125, -0.38720703125, -0.32879638671875, -0.2703857421875, -0.21197509765625, -0.153564453125, -0.09515380859375, -0.0367431640625, 0.02166748046875, 0.080078125, 0.13848876953125, 0.1968994140625, 0.25531005859375, 0.313720703125, 0.37213134765625, 0.4305419921875, 0.48895263671875, 0.54736328125, 0.60577392578125, 0.6641845703125, 0.72259521484375, 0.781005859375, 0.83941650390625, 0.8978271484375, 0.95623779296875, 1.0146484375, 1.07305908203125, 1.1314697265625, 1.18988037109375, 1.248291015625, 1.30670166015625, 1.3651123046875, 1.42352294921875, 1.48193359375, 1.54034423828125, 1.5987548828125, 1.65716552734375, 1.715576171875, 1.77398681640625, 1.8323974609375, 1.89080810546875, 1.94921875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 5.0, 6.0, 10.0, 13.0, 11.0, 12.0, 21.0, 23.0, 21.0, 30.0, 32.0, 34.0, 27.0, 41.0, 35.0, 27.0, 39.0, 41.0, 43.0, 42.0, 47.0, 52.0, 51.0, 36.0, 50.0, 31.0, 22.0, 31.0, 23.0, 21.0, 21.0, 14.0, 20.0, 12.0, 12.0, 10.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.6253509521484375, -0.605194091796875, -0.5850372314453125, -0.56488037109375, -0.5447235107421875, -0.524566650390625, -0.5044097900390625, -0.4842529296875, -0.4640960693359375, -0.443939208984375, -0.4237823486328125, -0.40362548828125, -0.3834686279296875, -0.363311767578125, -0.3431549072265625, -0.322998046875, -0.3028411865234375, -0.282684326171875, -0.2625274658203125, -0.24237060546875, -0.2222137451171875, -0.202056884765625, -0.1819000244140625, -0.1617431640625, -0.1415863037109375, -0.121429443359375, -0.1012725830078125, -0.08111572265625, -0.0609588623046875, -0.040802001953125, -0.0206451416015625, -0.00048828125, 0.0196685791015625, 0.039825439453125, 0.0599822998046875, 0.08013916015625, 0.1002960205078125, 0.120452880859375, 0.1406097412109375, 0.1607666015625, 0.1809234619140625, 0.201080322265625, 0.2212371826171875, 0.24139404296875, 0.2615509033203125, 0.281707763671875, 0.3018646240234375, 0.322021484375, 0.3421783447265625, 0.362335205078125, 0.3824920654296875, 0.40264892578125, 0.4228057861328125, 0.442962646484375, 0.4631195068359375, 0.4832763671875, 0.5034332275390625, 0.523590087890625, 0.5437469482421875, 0.56390380859375, 0.5840606689453125, 0.604217529296875, 0.6243743896484375, 0.64453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 12.0, 9.0, 20.0, 36.0, 54.0, 105.0, 224.0, 492.0, 1322.0, 4079.0, 19936.0, 2712602.0, 1433149.0, 16507.0, 3620.0, 1200.0, 433.0, 194.0, 110.0, 70.0, 46.0, 19.0, 11.0, 12.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.90234375, -3.783935546875, -3.66552734375, -3.547119140625, -3.4287109375, -3.310302734375, -3.19189453125, -3.073486328125, -2.955078125, -2.836669921875, -2.71826171875, -2.599853515625, -2.4814453125, -2.363037109375, -2.24462890625, -2.126220703125, -2.0078125, -1.889404296875, -1.77099609375, -1.652587890625, -1.5341796875, -1.415771484375, -1.29736328125, -1.178955078125, -1.060546875, -0.942138671875, -0.82373046875, -0.705322265625, -0.5869140625, -0.468505859375, -0.35009765625, -0.231689453125, -0.11328125, 0.005126953125, 0.12353515625, 0.241943359375, 0.3603515625, 0.478759765625, 0.59716796875, 0.715576171875, 0.833984375, 0.952392578125, 1.07080078125, 1.189208984375, 1.3076171875, 1.426025390625, 1.54443359375, 1.662841796875, 1.78125, 1.899658203125, 2.01806640625, 2.136474609375, 2.2548828125, 2.373291015625, 2.49169921875, 2.610107421875, 2.728515625, 2.846923828125, 2.96533203125, 3.083740234375, 3.2021484375, 3.320556640625, 3.43896484375, 3.557373046875, 3.67578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 12.0, 11.0, 16.0, 24.0, 37.0, 82.0, 229.0, 572.0, 1186.0, 1030.0, 458.0, 194.0, 82.0, 45.0, 35.0, 12.0, 17.0, 9.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9296875, -2.840545654296875, -2.75140380859375, -2.662261962890625, -2.5731201171875, -2.483978271484375, -2.39483642578125, -2.305694580078125, -2.216552734375, -2.127410888671875, -2.03826904296875, -1.949127197265625, -1.8599853515625, -1.770843505859375, -1.68170166015625, -1.592559814453125, -1.50341796875, -1.414276123046875, -1.32513427734375, -1.235992431640625, -1.1468505859375, -1.057708740234375, -0.96856689453125, -0.879425048828125, -0.790283203125, -0.701141357421875, -0.61199951171875, -0.522857666015625, -0.4337158203125, -0.344573974609375, -0.25543212890625, -0.166290283203125, -0.0771484375, 0.011993408203125, 0.10113525390625, 0.190277099609375, 0.2794189453125, 0.368560791015625, 0.45770263671875, 0.546844482421875, 0.635986328125, 0.725128173828125, 0.81427001953125, 0.903411865234375, 0.9925537109375, 1.081695556640625, 1.17083740234375, 1.259979248046875, 1.34912109375, 1.438262939453125, 1.52740478515625, 1.616546630859375, 1.7056884765625, 1.794830322265625, 1.88397216796875, 1.973114013671875, 2.062255859375, 2.151397705078125, 2.24053955078125, 2.329681396484375, 2.4188232421875, 2.507965087890625, 2.59710693359375, 2.686248779296875, 2.775390625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 11.0, 24.0, 78.0, 175.0, 342.0, 239.0, 81.0, 31.0, 12.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.909996032714844, -16.993131637573242, -16.07626724243164, -15.159402847290039, -14.242537498474121, -13.32567310333252, -12.408808708190918, -11.491943359375, -10.575078964233398, -9.658214569091797, -8.741350173950195, -7.8244853019714355, -6.907620429992676, -5.990756034851074, -5.073891639709473, -4.157026767730713, -3.2401628494262695, -2.323298215866089, -1.4064337015151978, -0.48956918716430664, 0.427295446395874, 1.3441600799560547, 2.2610244750976562, 3.177889347076416, 4.094753742218018, 5.011618137359619, 5.928483009338379, 6.8453474044799805, 7.762211799621582, 8.6790771484375, 9.595941543579102, 10.512805938720703, 11.429670333862305, 12.346534729003906, 13.263399124145508, 14.18026351928711, 15.097128868103027, 16.013992309570312, 16.930858612060547, 17.84772300720215, 18.76458740234375, 19.68145179748535, 20.598316192626953, 21.515180587768555, 22.432044982910156, 23.34891128540039, 24.26577377319336, 25.182640075683594, 26.099502563476562, 27.016366958618164, 27.933231353759766, 28.850095748901367, 29.76696014404297, 30.683826446533203, 31.600688934326172, 32.517555236816406, 33.43442153930664, 34.351287841796875, 35.268150329589844, 36.18501663208008, 37.10187911987305, 38.01874542236328, 38.93560791015625, 39.852474212646484, 40.76933670043945]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 2.0, 11.0, 9.0, 15.0, 19.0, 12.0, 23.0, 30.0, 29.0, 39.0, 39.0, 55.0, 52.0, 53.0, 48.0, 44.0, 54.0, 53.0, 54.0, 56.0, 49.0, 45.0, 39.0, 30.0, 16.0, 25.0, 18.0, 25.0, 16.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.685941219329834, -7.404282569885254, -7.122623443603516, -6.8409647941589355, -6.559305667877197, -6.277647018432617, -5.995987892150879, -5.714329242706299, -5.432670593261719, -5.151011943817139, -4.8693528175354, -4.58769416809082, -4.306035041809082, -4.024376392364502, -3.7427175045013428, -3.4610586166381836, -3.1793994903564453, -2.897740602493286, -2.616081714630127, -2.334423065185547, -2.0527639389038086, -1.771105170249939, -1.4894464015960693, -1.2077875137329102, -0.926128625869751, -0.6444697380065918, -0.3628109097480774, -0.08115208148956299, 0.2005068063735962, 0.48216569423675537, 0.763824462890625, 1.0454833507537842, 1.3271417617797852, 1.6088006496429443, 1.8904595375061035, 2.1721181869506836, 2.453777313232422, 2.735435962677002, 3.017094850540161, 3.2987537384033203, 3.5804126262664795, 3.8620715141296387, 4.143730163574219, 4.425389289855957, 4.707047939300537, 4.988707065582275, 5.2703657150268555, 5.552024841308594, 5.833683490753174, 6.115342140197754, 6.397001266479492, 6.678659915924072, 6.9603190422058105, 7.241977691650391, 7.523636817932129, 7.805295467376709, 8.086954116821289, 8.368613243103027, 8.65027141571045, 8.931930541992188, 9.213589668273926, 9.495248794555664, 9.776906967163086, 10.058566093444824, 10.340225219726562]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 5.0, 17.0, 19.0, 26.0, 43.0, 52.0, 70.0, 102.0, 155.0, 205.0, 250.0, 415.0, 558.0, 841.0, 1276.0, 1765.0, 2864.0, 4353.0, 7880.0, 14986.0, 34817.0, 110175.0, 470647.0, 277479.0, 66550.0, 24326.0, 11421.0, 6128.0, 3708.0, 2391.0, 1533.0, 1074.0, 700.0, 494.0, 360.0, 238.0, 184.0, 123.0, 87.0, 58.0, 41.0, 33.0, 22.0, 29.0, 15.0, 6.0, 9.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.23046875, -1.190521240234375, -1.15057373046875, -1.110626220703125, -1.0706787109375, -1.030731201171875, -0.99078369140625, -0.950836181640625, -0.910888671875, -0.870941162109375, -0.83099365234375, -0.791046142578125, -0.7510986328125, -0.711151123046875, -0.67120361328125, -0.631256103515625, -0.59130859375, -0.551361083984375, -0.51141357421875, -0.471466064453125, -0.4315185546875, -0.391571044921875, -0.35162353515625, -0.311676025390625, -0.271728515625, -0.231781005859375, -0.19183349609375, -0.151885986328125, -0.1119384765625, -0.071990966796875, -0.03204345703125, 0.007904052734375, 0.0478515625, 0.087799072265625, 0.12774658203125, 0.167694091796875, 0.2076416015625, 0.247589111328125, 0.28753662109375, 0.327484130859375, 0.367431640625, 0.407379150390625, 0.44732666015625, 0.487274169921875, 0.5272216796875, 0.567169189453125, 0.60711669921875, 0.647064208984375, 0.68701171875, 0.726959228515625, 0.76690673828125, 0.806854248046875, 0.8468017578125, 0.886749267578125, 0.92669677734375, 0.966644287109375, 1.006591796875, 1.046539306640625, 1.08648681640625, 1.126434326171875, 1.1663818359375, 1.206329345703125, 1.24627685546875, 1.286224365234375, 1.326171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 7.0, 8.0, 11.0, 15.0, 14.0, 29.0, 21.0, 18.0, 38.0, 38.0, 29.0, 43.0, 43.0, 49.0, 46.0, 45.0, 49.0, 60.0, 45.0, 58.0, 47.0, 38.0, 39.0, 29.0, 29.0, 28.0, 19.0, 22.0, 18.0, 18.0, 14.0, 9.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8956375122070312, -0.8703765869140625, -0.8451156616210938, -0.819854736328125, -0.7945938110351562, -0.7693328857421875, -0.7440719604492188, -0.71881103515625, -0.6935501098632812, -0.6682891845703125, -0.6430282592773438, -0.617767333984375, -0.5925064086914062, -0.5672454833984375, -0.5419845581054688, -0.5167236328125, -0.49146270751953125, -0.4662017822265625, -0.44094085693359375, -0.415679931640625, -0.39041900634765625, -0.3651580810546875, -0.33989715576171875, -0.31463623046875, -0.28937530517578125, -0.2641143798828125, -0.23885345458984375, -0.213592529296875, -0.18833160400390625, -0.1630706787109375, -0.13780975341796875, -0.112548828125, -0.08728790283203125, -0.0620269775390625, -0.03676605224609375, -0.011505126953125, 0.01375579833984375, 0.0390167236328125, 0.06427764892578125, 0.08953857421875, 0.11479949951171875, 0.1400604248046875, 0.16532135009765625, 0.190582275390625, 0.21584320068359375, 0.2411041259765625, 0.26636505126953125, 0.2916259765625, 0.31688690185546875, 0.3421478271484375, 0.36740875244140625, 0.392669677734375, 0.41793060302734375, 0.4431915283203125, 0.46845245361328125, 0.49371337890625, 0.5189743041992188, 0.5442352294921875, 0.5694961547851562, 0.594757080078125, 0.6200180053710938, 0.6452789306640625, 0.6705398559570312, 0.69580078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 9.0, 14.0, 16.0, 31.0, 40.0, 58.0, 105.0, 180.0, 294.0, 477.0, 951.0, 2177.0, 6707.0, 44580.0, 928121.0, 52937.0, 7406.0, 2290.0, 987.0, 463.0, 228.0, 174.0, 95.0, 79.0, 49.0, 24.0, 16.0, 12.0, 10.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.962890625, -3.844696044921875, -3.72650146484375, -3.608306884765625, -3.4901123046875, -3.371917724609375, -3.25372314453125, -3.135528564453125, -3.017333984375, -2.899139404296875, -2.78094482421875, -2.662750244140625, -2.5445556640625, -2.426361083984375, -2.30816650390625, -2.189971923828125, -2.07177734375, -1.953582763671875, -1.83538818359375, -1.717193603515625, -1.5989990234375, -1.480804443359375, -1.36260986328125, -1.244415283203125, -1.126220703125, -1.008026123046875, -0.88983154296875, -0.771636962890625, -0.6534423828125, -0.535247802734375, -0.41705322265625, -0.298858642578125, -0.1806640625, -0.062469482421875, 0.05572509765625, 0.173919677734375, 0.2921142578125, 0.410308837890625, 0.52850341796875, 0.646697998046875, 0.764892578125, 0.883087158203125, 1.00128173828125, 1.119476318359375, 1.2376708984375, 1.355865478515625, 1.47406005859375, 1.592254638671875, 1.71044921875, 1.828643798828125, 1.94683837890625, 2.065032958984375, 2.1832275390625, 2.301422119140625, 2.41961669921875, 2.537811279296875, 2.656005859375, 2.774200439453125, 2.89239501953125, 3.010589599609375, 3.1287841796875, 3.246978759765625, 3.36517333984375, 3.483367919921875, 3.6015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 5.0, 1.0, 7.0, 12.0, 11.0, 14.0, 11.0, 16.0, 17.0, 25.0, 24.0, 41.0, 23.0, 38.0, 49.0, 48.0, 56.0, 59.0, 57.0, 55.0, 55.0, 48.0, 44.0, 39.0, 40.0, 25.0, 32.0, 24.0, 24.0, 21.0, 10.0, 12.0, 14.0, 10.0, 3.0, 7.0, 4.0, 8.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.68359375, -3.585052490234375, -3.48651123046875, -3.387969970703125, -3.2894287109375, -3.190887451171875, -3.09234619140625, -2.993804931640625, -2.895263671875, -2.796722412109375, -2.69818115234375, -2.599639892578125, -2.5010986328125, -2.402557373046875, -2.30401611328125, -2.205474853515625, -2.10693359375, -2.008392333984375, -1.90985107421875, -1.811309814453125, -1.7127685546875, -1.614227294921875, -1.51568603515625, -1.417144775390625, -1.318603515625, -1.220062255859375, -1.12152099609375, -1.022979736328125, -0.9244384765625, -0.825897216796875, -0.72735595703125, -0.628814697265625, -0.5302734375, -0.431732177734375, -0.33319091796875, -0.234649658203125, -0.1361083984375, -0.037567138671875, 0.06097412109375, 0.159515380859375, 0.258056640625, 0.356597900390625, 0.45513916015625, 0.553680419921875, 0.6522216796875, 0.750762939453125, 0.84930419921875, 0.947845458984375, 1.04638671875, 1.144927978515625, 1.24346923828125, 1.342010498046875, 1.4405517578125, 1.539093017578125, 1.63763427734375, 1.736175537109375, 1.834716796875, 1.933258056640625, 2.03179931640625, 2.130340576171875, 2.2288818359375, 2.327423095703125, 2.42596435546875, 2.524505615234375, 2.623046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 7.0, 11.0, 15.0, 12.0, 34.0, 37.0, 57.0, 67.0, 129.0, 225.0, 434.0, 1080.0, 3145.0, 12439.0, 93318.0, 867260.0, 56721.0, 9241.0, 2453.0, 936.0, 400.0, 147.0, 103.0, 72.0, 51.0, 37.0, 21.0, 20.0, 15.0, 14.0, 10.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.0107421875, -0.9813613891601562, -0.9519805908203125, -0.9225997924804688, -0.893218994140625, -0.8638381958007812, -0.8344573974609375, -0.8050765991210938, -0.77569580078125, -0.7463150024414062, -0.7169342041015625, -0.6875534057617188, -0.658172607421875, -0.6287918090820312, -0.5994110107421875, -0.5700302124023438, -0.5406494140625, -0.5112686157226562, -0.4818878173828125, -0.45250701904296875, -0.423126220703125, -0.39374542236328125, -0.3643646240234375, -0.33498382568359375, -0.30560302734375, -0.27622222900390625, -0.2468414306640625, -0.21746063232421875, -0.188079833984375, -0.15869903564453125, -0.1293182373046875, -0.09993743896484375, -0.070556640625, -0.04117584228515625, -0.0117950439453125, 0.01758575439453125, 0.046966552734375, 0.07634735107421875, 0.1057281494140625, 0.13510894775390625, 0.16448974609375, 0.19387054443359375, 0.2232513427734375, 0.25263214111328125, 0.282012939453125, 0.31139373779296875, 0.3407745361328125, 0.37015533447265625, 0.3995361328125, 0.42891693115234375, 0.4582977294921875, 0.48767852783203125, 0.517059326171875, 0.5464401245117188, 0.5758209228515625, 0.6052017211914062, 0.63458251953125, 0.6639633178710938, 0.6933441162109375, 0.7227249145507812, 0.752105712890625, 0.7814865112304688, 0.8108673095703125, 0.8402481079101562, 0.86962890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 3.0, 4.0, 2.0, 10.0, 4.0, 6.0, 8.0, 13.0, 23.0, 25.0, 39.0, 45.0, 72.0, 114.0, 139.0, 154.0, 94.0, 62.0, 49.0, 34.0, 15.0, 21.0, 13.0, 10.0, 12.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017523765563964844, -0.00016895122826099396, -0.00016266480088233948, -0.000156378373503685, -0.00015009194612503052, -0.00014380551874637604, -0.00013751909136772156, -0.00013123266398906708, -0.0001249462366104126, -0.00011865980923175812, -0.00011237338185310364, -0.00010608695447444916, -9.980052709579468e-05, -9.35140997171402e-05, -8.722767233848572e-05, -8.094124495983124e-05, -7.465481758117676e-05, -6.836839020252228e-05, -6.20819628238678e-05, -5.579553544521332e-05, -4.950910806655884e-05, -4.322268068790436e-05, -3.693625330924988e-05, -3.06498259305954e-05, -2.4363398551940918e-05, -1.8076971173286438e-05, -1.1790543794631958e-05, -5.504116415977478e-06, 7.82310962677002e-07, 7.068738341331482e-06, 1.3355165719985962e-05, 1.9641593098640442e-05, 2.5928020477294922e-05, 3.22144478559494e-05, 3.850087523460388e-05, 4.478730261325836e-05, 5.107372999191284e-05, 5.736015737056732e-05, 6.36465847492218e-05, 6.993301212787628e-05, 7.621943950653076e-05, 8.250586688518524e-05, 8.879229426383972e-05, 9.50787216424942e-05, 0.00010136514902114868, 0.00010765157639980316, 0.00011393800377845764, 0.00012022443115711212, 0.0001265108585357666, 0.00013279728591442108, 0.00013908371329307556, 0.00014537014067173004, 0.00015165656805038452, 0.000157942995429039, 0.00016422942280769348, 0.00017051585018634796, 0.00017680227756500244, 0.00018308870494365692, 0.0001893751323223114, 0.00019566155970096588, 0.00020194798707962036, 0.00020823441445827484, 0.00021452084183692932, 0.0002208072692155838, 0.00022709369659423828]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 10.0, 8.0, 15.0, 30.0, 49.0, 48.0, 85.0, 100.0, 156.0, 241.0, 344.0, 585.0, 1013.0, 1806.0, 3882.0, 9003.0, 26742.0, 120374.0, 736172.0, 106719.0, 24593.0, 8512.0, 3759.0, 1758.0, 958.0, 549.0, 326.0, 232.0, 146.0, 97.0, 67.0, 55.0, 28.0, 24.0, 15.0, 7.0, 9.0, 5.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5143661499023438, -0.4974822998046875, -0.48059844970703125, -0.463714599609375, -0.44683074951171875, -0.4299468994140625, -0.41306304931640625, -0.39617919921875, -0.37929534912109375, -0.3624114990234375, -0.34552764892578125, -0.328643798828125, -0.31175994873046875, -0.2948760986328125, -0.27799224853515625, -0.2611083984375, -0.24422454833984375, -0.2273406982421875, -0.21045684814453125, -0.193572998046875, -0.17668914794921875, -0.1598052978515625, -0.14292144775390625, -0.12603759765625, -0.10915374755859375, -0.0922698974609375, -0.07538604736328125, -0.058502197265625, -0.04161834716796875, -0.0247344970703125, -0.00785064697265625, 0.009033203125, 0.02591705322265625, 0.0428009033203125, 0.05968475341796875, 0.076568603515625, 0.09345245361328125, 0.1103363037109375, 0.12722015380859375, 0.14410400390625, 0.16098785400390625, 0.1778717041015625, 0.19475555419921875, 0.211639404296875, 0.22852325439453125, 0.2454071044921875, 0.26229095458984375, 0.2791748046875, 0.29605865478515625, 0.3129425048828125, 0.32982635498046875, 0.346710205078125, 0.36359405517578125, 0.3804779052734375, 0.39736175537109375, 0.41424560546875, 0.43112945556640625, 0.4480133056640625, 0.46489715576171875, 0.481781005859375, 0.49866485595703125, 0.5155487060546875, 0.5324325561523438, 0.54931640625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 10.0, 6.0, 11.0, 8.0, 15.0, 16.0, 17.0, 37.0, 33.0, 32.0, 51.0, 58.0, 85.0, 87.0, 96.0, 82.0, 64.0, 73.0, 28.0, 36.0, 20.0, 24.0, 19.0, 13.0, 18.0, 5.0, 10.0, 4.0, 8.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.46435546875, -0.44824981689453125, -0.4321441650390625, -0.41603851318359375, -0.399932861328125, -0.38382720947265625, -0.3677215576171875, -0.35161590576171875, -0.33551025390625, -0.31940460205078125, -0.3032989501953125, -0.28719329833984375, -0.271087646484375, -0.25498199462890625, -0.2388763427734375, -0.22277069091796875, -0.2066650390625, -0.19055938720703125, -0.1744537353515625, -0.15834808349609375, -0.142242431640625, -0.12613677978515625, -0.1100311279296875, -0.09392547607421875, -0.07781982421875, -0.06171417236328125, -0.0456085205078125, -0.02950286865234375, -0.013397216796875, 0.00270843505859375, 0.0188140869140625, 0.03491973876953125, 0.051025390625, 0.06713104248046875, 0.0832366943359375, 0.09934234619140625, 0.115447998046875, 0.13155364990234375, 0.1476593017578125, 0.16376495361328125, 0.17987060546875, 0.19597625732421875, 0.2120819091796875, 0.22818756103515625, 0.244293212890625, 0.26039886474609375, 0.2765045166015625, 0.29261016845703125, 0.3087158203125, 0.32482147216796875, 0.3409271240234375, 0.35703277587890625, 0.373138427734375, 0.38924407958984375, 0.4053497314453125, 0.42145538330078125, 0.43756103515625, 0.45366668701171875, 0.4697723388671875, 0.48587799072265625, 0.501983642578125, 0.5180892944335938, 0.5341949462890625, 0.5503005981445312, 0.56640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 13.0, 43.0, 147.0, 549.0, 159.0, 50.0, 19.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.531171798706055, -20.42557716369629, -19.319982528686523, -18.214385986328125, -17.10879135131836, -16.003196716308594, -14.897602081298828, -13.792007446289062, -12.68641185760498, -11.580817222595215, -10.475221633911133, -9.369626998901367, -8.264032363891602, -7.1584367752075195, -6.052842140197754, -4.94724702835083, -3.8416519165039062, -2.7360568046569824, -1.6304619312286377, -0.524867057800293, 0.5807280540466309, 1.6863231658935547, 2.7919178009033203, 3.897512912750244, 5.003108024597168, 6.108703136444092, 7.214298248291016, 8.319892883300781, 9.425487518310547, 10.531083106994629, 11.636677742004395, 12.742273330688477, 13.84786605834961, 14.953460693359375, 16.05905532836914, 17.164649963378906, 18.270246505737305, 19.37584114074707, 20.481435775756836, 21.5870304107666, 22.692626953125, 23.798221588134766, 24.90381622314453, 26.009410858154297, 27.115007400512695, 28.22060203552246, 29.326196670532227, 30.431791305541992, 31.537385940551758, 32.642982482910156, 33.74857711791992, 34.85417175292969, 35.95976638793945, 37.06536102294922, 38.170955657958984, 39.27655029296875, 40.382144927978516, 41.48773956298828, 42.59333419799805, 43.69892883300781, 44.80452346801758, 45.910118103027344, 47.015716552734375, 48.12131118774414, 49.226905822753906]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 7.0, 10.0, 11.0, 14.0, 13.0, 17.0, 19.0, 18.0, 23.0, 13.0, 23.0, 31.0, 35.0, 44.0, 74.0, 145.0, 124.0, 50.0, 41.0, 36.0, 27.0, 27.0, 25.0, 18.0, 26.0, 18.0, 19.0, 13.0, 16.0, 12.0, 9.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.020453453063965, -11.640933990478516, -11.261414527893066, -10.881895065307617, -10.502376556396484, -10.122857093811035, -9.743337631225586, -9.363818168640137, -8.984298706054688, -8.604779243469238, -8.225259780883789, -7.845740795135498, -7.466221809387207, -7.086702346801758, -6.707182884216309, -6.327663421630859, -5.948144912719727, -5.568625450134277, -5.189106464385986, -4.809587001800537, -4.430068016052246, -4.050548553466797, -3.6710290908813477, -3.2915098667144775, -2.9119906425476074, -2.5324714183807373, -2.152952194213867, -1.773432731628418, -1.3939135074615479, -1.0143942832946777, -0.6348748207092285, -0.2553555965423584, 0.12416362762451172, 0.5036829113960266, 0.8832021951675415, 1.2627215385437012, 1.6422407627105713, 2.0217599868774414, 2.4012794494628906, 2.7807986736297607, 3.160317897796631, 3.539837121963501, 3.919356346130371, 4.29887580871582, 4.6783952713012695, 5.0579142570495605, 5.43743371963501, 5.816952705383301, 6.19647216796875, 6.575991630554199, 6.95551061630249, 7.3350300788879395, 7.7145490646362305, 8.09406852722168, 8.473587989807129, 8.853107452392578, 9.232625961303711, 9.61214542388916, 9.99166488647461, 10.371183395385742, 10.750702857971191, 11.13022232055664, 11.50974178314209, 11.889261245727539, 12.268780708312988]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 11.0, 14.0, 15.0, 24.0, 25.0, 31.0, 53.0, 73.0, 96.0, 160.0, 203.0, 292.0, 417.0, 664.0, 1071.0, 1892.0, 3433.0, 7462.0, 21765.0, 128961.0, 1266178.0, 2334491.0, 357582.0, 45384.0, 12408.0, 5116.0, 2551.0, 1344.0, 860.0, 532.0, 350.0, 249.0, 176.0, 104.0, 80.0, 57.0, 40.0, 29.0, 22.0, 14.0, 7.0, 9.0, 8.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.541015625, -1.490020751953125, -1.43902587890625, -1.388031005859375, -1.3370361328125, -1.286041259765625, -1.23504638671875, -1.184051513671875, -1.133056640625, -1.082061767578125, -1.03106689453125, -0.980072021484375, -0.9290771484375, -0.878082275390625, -0.82708740234375, -0.776092529296875, -0.72509765625, -0.674102783203125, -0.62310791015625, -0.572113037109375, -0.5211181640625, -0.470123291015625, -0.41912841796875, -0.368133544921875, -0.317138671875, -0.266143798828125, -0.21514892578125, -0.164154052734375, -0.1131591796875, -0.062164306640625, -0.01116943359375, 0.039825439453125, 0.0908203125, 0.141815185546875, 0.19281005859375, 0.243804931640625, 0.2947998046875, 0.345794677734375, 0.39678955078125, 0.447784423828125, 0.498779296875, 0.549774169921875, 0.60076904296875, 0.651763916015625, 0.7027587890625, 0.753753662109375, 0.80474853515625, 0.855743408203125, 0.90673828125, 0.957733154296875, 1.00872802734375, 1.059722900390625, 1.1107177734375, 1.161712646484375, 1.21270751953125, 1.263702392578125, 1.314697265625, 1.365692138671875, 1.41668701171875, 1.467681884765625, 1.5186767578125, 1.569671630859375, 1.62066650390625, 1.671661376953125, 1.72265625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 6.0, 13.0, 20.0, 11.0, 20.0, 35.0, 25.0, 38.0, 28.0, 37.0, 37.0, 35.0, 54.0, 36.0, 44.0, 48.0, 48.0, 45.0, 44.0, 62.0, 37.0, 48.0, 41.0, 28.0, 25.0, 23.0, 18.0, 19.0, 20.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.9111328125, -0.8868637084960938, -0.8625946044921875, -0.8383255004882812, -0.814056396484375, -0.7897872924804688, -0.7655181884765625, -0.7412490844726562, -0.71697998046875, -0.6927108764648438, -0.6684417724609375, -0.6441726684570312, -0.619903564453125, -0.5956344604492188, -0.5713653564453125, -0.5470962524414062, -0.5228271484375, -0.49855804443359375, -0.4742889404296875, -0.45001983642578125, -0.425750732421875, -0.40148162841796875, -0.3772125244140625, -0.35294342041015625, -0.32867431640625, -0.30440521240234375, -0.2801361083984375, -0.25586700439453125, -0.231597900390625, -0.20732879638671875, -0.1830596923828125, -0.15879058837890625, -0.134521484375, -0.11025238037109375, -0.0859832763671875, -0.06171417236328125, -0.037445068359375, -0.01317596435546875, 0.0110931396484375, 0.03536224365234375, 0.05963134765625, 0.08390045166015625, 0.1081695556640625, 0.13243865966796875, 0.156707763671875, 0.18097686767578125, 0.2052459716796875, 0.22951507568359375, 0.2537841796875, 0.27805328369140625, 0.3023223876953125, 0.32659149169921875, 0.350860595703125, 0.37512969970703125, 0.3993988037109375, 0.42366790771484375, 0.44793701171875, 0.47220611572265625, 0.4964752197265625, 0.5207443237304688, 0.545013427734375, 0.5692825317382812, 0.5935516357421875, 0.6178207397460938, 0.64208984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 3.0, 3.0, 6.0, 11.0, 14.0, 22.0, 28.0, 37.0, 53.0, 83.0, 98.0, 220.0, 359.0, 890.0, 2379.0, 9807.0, 135672.0, 3989086.0, 46973.0, 5657.0, 1536.0, 619.0, 254.0, 158.0, 77.0, 64.0, 41.0, 33.0, 22.0, 13.0, 14.0, 12.0, 15.0, 10.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.76171875, -4.59381103515625, -4.4259033203125, -4.25799560546875, -4.090087890625, -3.92218017578125, -3.7542724609375, -3.58636474609375, -3.41845703125, -3.25054931640625, -3.0826416015625, -2.91473388671875, -2.746826171875, -2.57891845703125, -2.4110107421875, -2.24310302734375, -2.0751953125, -1.90728759765625, -1.7393798828125, -1.57147216796875, -1.403564453125, -1.23565673828125, -1.0677490234375, -0.89984130859375, -0.73193359375, -0.56402587890625, -0.3961181640625, -0.22821044921875, -0.060302734375, 0.10760498046875, 0.2755126953125, 0.44342041015625, 0.611328125, 0.77923583984375, 0.9471435546875, 1.11505126953125, 1.282958984375, 1.45086669921875, 1.6187744140625, 1.78668212890625, 1.95458984375, 2.12249755859375, 2.2904052734375, 2.45831298828125, 2.626220703125, 2.79412841796875, 2.9620361328125, 3.12994384765625, 3.2978515625, 3.46575927734375, 3.6336669921875, 3.80157470703125, 3.969482421875, 4.13739013671875, 4.3052978515625, 4.47320556640625, 4.64111328125, 4.80902099609375, 4.9769287109375, 5.14483642578125, 5.312744140625, 5.48065185546875, 5.6485595703125, 5.81646728515625, 5.984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 10.0, 10.0, 13.0, 21.0, 28.0, 26.0, 52.0, 81.0, 137.0, 220.0, 350.0, 646.0, 876.0, 653.0, 386.0, 225.0, 116.0, 82.0, 50.0, 30.0, 14.0, 19.0, 11.0, 8.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.345977783203125, -3.23687744140625, -3.127777099609375, -3.0186767578125, -2.909576416015625, -2.80047607421875, -2.691375732421875, -2.582275390625, -2.473175048828125, -2.36407470703125, -2.254974365234375, -2.1458740234375, -2.036773681640625, -1.92767333984375, -1.818572998046875, -1.70947265625, -1.600372314453125, -1.49127197265625, -1.382171630859375, -1.2730712890625, -1.163970947265625, -1.05487060546875, -0.945770263671875, -0.836669921875, -0.727569580078125, -0.61846923828125, -0.509368896484375, -0.4002685546875, -0.291168212890625, -0.18206787109375, -0.072967529296875, 0.0361328125, 0.145233154296875, 0.25433349609375, 0.363433837890625, 0.4725341796875, 0.581634521484375, 0.69073486328125, 0.799835205078125, 0.908935546875, 1.018035888671875, 1.12713623046875, 1.236236572265625, 1.3453369140625, 1.454437255859375, 1.56353759765625, 1.672637939453125, 1.78173828125, 1.890838623046875, 1.99993896484375, 2.109039306640625, 2.2181396484375, 2.327239990234375, 2.43634033203125, 2.545440673828125, 2.654541015625, 2.763641357421875, 2.87274169921875, 2.981842041015625, 3.0909423828125, 3.200042724609375, 3.30914306640625, 3.418243408203125, 3.52734375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 23.0, 39.0, 90.0, 186.0, 274.0, 197.0, 96.0, 37.0, 17.0, 8.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.7006950378418, -49.388797760009766, -48.076904296875, -46.76500701904297, -45.45310974121094, -44.14121627807617, -42.82931900024414, -41.517425537109375, -40.205528259277344, -38.89363098144531, -37.58173751831055, -36.269840240478516, -34.95794677734375, -33.64604949951172, -32.33415222167969, -31.02225685119629, -29.71036148071289, -28.398466110229492, -27.086570739746094, -25.774673461914062, -24.462778091430664, -23.150882720947266, -21.838985443115234, -20.527090072631836, -19.215194702148438, -17.90329933166504, -16.59140396118164, -15.27950668334961, -13.967611312866211, -12.655715942382812, -11.343819618225098, -10.031923294067383, -8.720024108886719, -7.408128261566162, -6.0962324142456055, -4.784336566925049, -3.472440719604492, -2.1605448722839355, -0.8486490249633789, 0.46324729919433594, 1.7751426696777344, 3.087038516998291, 4.398934364318848, 5.710830211639404, 7.022726058959961, 8.33462142944336, 9.646517753601074, 10.958414077758789, 12.270309448242188, 13.582204818725586, 14.8941011428833, 16.205997467041016, 17.517892837524414, 18.829788208007812, 20.141685485839844, 21.453580856323242, 22.76547622680664, 24.07737159729004, 25.389266967773438, 26.70116424560547, 28.013059616088867, 29.324954986572266, 30.636852264404297, 31.948747634887695, 33.260643005371094]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 3.0, 8.0, 11.0, 10.0, 10.0, 19.0, 24.0, 25.0, 39.0, 33.0, 40.0, 35.0, 48.0, 64.0, 64.0, 66.0, 48.0, 53.0, 52.0, 55.0, 42.0, 33.0, 37.0, 23.0, 37.0, 16.0, 32.0, 10.0, 10.0, 9.0, 11.0, 3.0, 8.0, 8.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.228525161743164, -16.702938079833984, -16.177352905273438, -15.651765823364258, -15.126178741455078, -14.600592613220215, -14.075006484985352, -13.549419403076172, -13.023833274841309, -12.498247146606445, -11.972660064697266, -11.447073936462402, -10.921487808227539, -10.39590072631836, -9.870314598083496, -9.344728469848633, -8.819141387939453, -8.29355525970459, -7.76796817779541, -7.242382049560547, -6.716795444488525, -6.191208839416504, -5.665622711181641, -5.140036106109619, -4.614449501037598, -4.088862895965576, -3.563276529312134, -3.0376901626586914, -2.51210355758667, -1.9865169525146484, -1.460930585861206, -0.9353442192077637, -0.409759521484375, 0.11582696437835693, 0.6414134502410889, 1.1669999361038208, 1.6925864219665527, 2.218173027038574, 2.7437593936920166, 3.269345760345459, 3.7949323654174805, 4.320518970489502, 4.846105575561523, 5.371691703796387, 5.897278308868408, 6.42286491394043, 6.948451042175293, 7.4740376472473145, 7.999624252319336, 8.5252103805542, 9.050797462463379, 9.576383590698242, 10.101970672607422, 10.627556800842285, 11.153142929077148, 11.678730010986328, 12.204316139221191, 12.729902267456055, 13.255489349365234, 13.781075477600098, 14.306661605834961, 14.83224868774414, 15.357834815979004, 15.883420944213867, 16.409008026123047]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 10.0, 10.0, 15.0, 24.0, 46.0, 66.0, 83.0, 177.0, 364.0, 802.0, 1951.0, 6153.0, 27789.0, 434704.0, 535577.0, 30654.0, 6439.0, 2006.0, 841.0, 392.0, 182.0, 101.0, 60.0, 29.0, 23.0, 12.0, 8.0, 10.0, 7.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.201171875, -2.130218505859375, -2.05926513671875, -1.988311767578125, -1.9173583984375, -1.846405029296875, -1.77545166015625, -1.704498291015625, -1.633544921875, -1.562591552734375, -1.49163818359375, -1.420684814453125, -1.3497314453125, -1.278778076171875, -1.20782470703125, -1.136871337890625, -1.06591796875, -0.994964599609375, -0.92401123046875, -0.853057861328125, -0.7821044921875, -0.711151123046875, -0.64019775390625, -0.569244384765625, -0.498291015625, -0.427337646484375, -0.35638427734375, -0.285430908203125, -0.2144775390625, -0.143524169921875, -0.07257080078125, -0.001617431640625, 0.0693359375, 0.140289306640625, 0.21124267578125, 0.282196044921875, 0.3531494140625, 0.424102783203125, 0.49505615234375, 0.566009521484375, 0.636962890625, 0.707916259765625, 0.77886962890625, 0.849822998046875, 0.9207763671875, 0.991729736328125, 1.06268310546875, 1.133636474609375, 1.20458984375, 1.275543212890625, 1.34649658203125, 1.417449951171875, 1.4884033203125, 1.559356689453125, 1.63031005859375, 1.701263427734375, 1.772216796875, 1.843170166015625, 1.91412353515625, 1.985076904296875, 2.0560302734375, 2.126983642578125, 2.19793701171875, 2.268890380859375, 2.33984375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 15.0, 27.0, 32.0, 46.0, 55.0, 74.0, 88.0, 106.0, 85.0, 106.0, 95.0, 65.0, 60.0, 45.0, 26.0, 22.0, 17.0, 11.0, 8.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.783203125, -1.7263946533203125, -1.669586181640625, -1.6127777099609375, -1.55596923828125, -1.4991607666015625, -1.442352294921875, -1.3855438232421875, -1.3287353515625, -1.2719268798828125, -1.215118408203125, -1.1583099365234375, -1.10150146484375, -1.0446929931640625, -0.987884521484375, -0.9310760498046875, -0.874267578125, -0.8174591064453125, -0.760650634765625, -0.7038421630859375, -0.64703369140625, -0.5902252197265625, -0.533416748046875, -0.4766082763671875, -0.4197998046875, -0.3629913330078125, -0.306182861328125, -0.2493743896484375, -0.19256591796875, -0.1357574462890625, -0.078948974609375, -0.0221405029296875, 0.03466796875, 0.0914764404296875, 0.148284912109375, 0.2050933837890625, 0.26190185546875, 0.3187103271484375, 0.375518798828125, 0.4323272705078125, 0.4891357421875, 0.5459442138671875, 0.602752685546875, 0.6595611572265625, 0.71636962890625, 0.7731781005859375, 0.829986572265625, 0.8867950439453125, 0.943603515625, 1.0004119873046875, 1.057220458984375, 1.1140289306640625, 1.17083740234375, 1.2276458740234375, 1.284454345703125, 1.3412628173828125, 1.3980712890625, 1.4548797607421875, 1.511688232421875, 1.5684967041015625, 1.62530517578125, 1.6821136474609375, 1.738922119140625, 1.7957305908203125, 1.8525390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 5.0, 10.0, 17.0, 12.0, 17.0, 22.0, 49.0, 59.0, 108.0, 165.0, 271.0, 616.0, 1411.0, 4898.0, 39122.0, 953376.0, 40355.0, 5212.0, 1453.0, 581.0, 273.0, 180.0, 121.0, 56.0, 52.0, 28.0, 23.0, 21.0, 9.0, 11.0, 6.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.400177001953125, -2.31597900390625, -2.231781005859375, -2.1475830078125, -2.063385009765625, -1.97918701171875, -1.894989013671875, -1.810791015625, -1.726593017578125, -1.64239501953125, -1.558197021484375, -1.4739990234375, -1.389801025390625, -1.30560302734375, -1.221405029296875, -1.13720703125, -1.053009033203125, -0.96881103515625, -0.884613037109375, -0.8004150390625, -0.716217041015625, -0.63201904296875, -0.547821044921875, -0.463623046875, -0.379425048828125, -0.29522705078125, -0.211029052734375, -0.1268310546875, -0.042633056640625, 0.04156494140625, 0.125762939453125, 0.2099609375, 0.294158935546875, 0.37835693359375, 0.462554931640625, 0.5467529296875, 0.630950927734375, 0.71514892578125, 0.799346923828125, 0.883544921875, 0.967742919921875, 1.05194091796875, 1.136138916015625, 1.2203369140625, 1.304534912109375, 1.38873291015625, 1.472930908203125, 1.55712890625, 1.641326904296875, 1.72552490234375, 1.809722900390625, 1.8939208984375, 1.978118896484375, 2.06231689453125, 2.146514892578125, 2.230712890625, 2.314910888671875, 2.39910888671875, 2.483306884765625, 2.5675048828125, 2.651702880859375, 2.73590087890625, 2.820098876953125, 2.904296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 10.0, 11.0, 7.0, 13.0, 8.0, 11.0, 23.0, 25.0, 29.0, 35.0, 44.0, 68.0, 69.0, 100.0, 95.0, 94.0, 65.0, 49.0, 31.0, 40.0, 32.0, 19.0, 22.0, 17.0, 20.0, 13.0, 10.0, 9.0, 6.0, 11.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.70703125, -4.55206298828125, -4.3970947265625, -4.24212646484375, -4.087158203125, -3.93218994140625, -3.7772216796875, -3.62225341796875, -3.46728515625, -3.31231689453125, -3.1573486328125, -3.00238037109375, -2.847412109375, -2.69244384765625, -2.5374755859375, -2.38250732421875, -2.2275390625, -2.07257080078125, -1.9176025390625, -1.76263427734375, -1.607666015625, -1.45269775390625, -1.2977294921875, -1.14276123046875, -0.98779296875, -0.83282470703125, -0.6778564453125, -0.52288818359375, -0.367919921875, -0.21295166015625, -0.0579833984375, 0.09698486328125, 0.251953125, 0.40692138671875, 0.5618896484375, 0.71685791015625, 0.871826171875, 1.02679443359375, 1.1817626953125, 1.33673095703125, 1.49169921875, 1.64666748046875, 1.8016357421875, 1.95660400390625, 2.111572265625, 2.26654052734375, 2.4215087890625, 2.57647705078125, 2.7314453125, 2.88641357421875, 3.0413818359375, 3.19635009765625, 3.351318359375, 3.50628662109375, 3.6612548828125, 3.81622314453125, 3.97119140625, 4.12615966796875, 4.2811279296875, 4.43609619140625, 4.591064453125, 4.74603271484375, 4.9010009765625, 5.05596923828125, 5.2109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 2.0, 9.0, 5.0, 10.0, 21.0, 19.0, 34.0, 41.0, 54.0, 83.0, 88.0, 116.0, 150.0, 230.0, 305.0, 448.0, 620.0, 1026.0, 1607.0, 2860.0, 5453.0, 12410.0, 41001.0, 816593.0, 125048.0, 21789.0, 8337.0, 3973.0, 2182.0, 1355.0, 767.0, 556.0, 368.0, 247.0, 176.0, 133.0, 88.0, 75.0, 53.0, 39.0, 40.0, 29.0, 24.0, 24.0, 18.0, 9.0, 6.0, 8.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.283935546875, -0.2747077941894531, -0.26548004150390625, -0.2562522888183594, -0.2470245361328125, -0.23779678344726562, -0.22856903076171875, -0.21934127807617188, -0.210113525390625, -0.20088577270507812, -0.19165802001953125, -0.18243026733398438, -0.1732025146484375, -0.16397476196289062, -0.15474700927734375, -0.14551925659179688, -0.13629150390625, -0.12706375122070312, -0.11783599853515625, -0.10860824584960938, -0.0993804931640625, -0.09015274047851562, -0.08092498779296875, -0.07169723510742188, -0.062469482421875, -0.053241729736328125, -0.04401397705078125, -0.034786224365234375, -0.0255584716796875, -0.016330718994140625, -0.00710296630859375, 0.002124786376953125, 0.0113525390625, 0.020580291748046875, 0.02980804443359375, 0.039035797119140625, 0.0482635498046875, 0.057491302490234375, 0.06671905517578125, 0.07594680786132812, 0.085174560546875, 0.09440231323242188, 0.10363006591796875, 0.11285781860351562, 0.1220855712890625, 0.13131332397460938, 0.14054107666015625, 0.14976882934570312, 0.15899658203125, 0.16822433471679688, 0.17745208740234375, 0.18667984008789062, 0.1959075927734375, 0.20513534545898438, 0.21436309814453125, 0.22359085083007812, 0.232818603515625, 0.24204635620117188, 0.25127410888671875, 0.2605018615722656, 0.2697296142578125, 0.2789573669433594, 0.28818511962890625, 0.2974128723144531, 0.306640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 2.0, 8.0, 11.0, 17.0, 21.0, 37.0, 64.0, 143.0, 324.0, 175.0, 79.0, 35.0, 24.0, 16.0, 11.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020551681518554688, -0.00019777566194534302, -0.00019003450870513916, -0.0001822933554649353, -0.00017455220222473145, -0.0001668110489845276, -0.00015906989574432373, -0.00015132874250411987, -0.00014358758926391602, -0.00013584643602371216, -0.0001281052827835083, -0.00012036412954330444, -0.00011262297630310059, -0.00010488182306289673, -9.714066982269287e-05, -8.939951658248901e-05, -8.165836334228516e-05, -7.39172101020813e-05, -6.617605686187744e-05, -5.8434903621673584e-05, -5.0693750381469727e-05, -4.295259714126587e-05, -3.521144390106201e-05, -2.7470290660858154e-05, -1.9729137420654297e-05, -1.198798418045044e-05, -4.246830940246582e-06, 3.4943222999572754e-06, 1.1235475540161133e-05, 1.897662878036499e-05, 2.6717782020568848e-05, 3.4458935260772705e-05, 4.220008850097656e-05, 4.994124174118042e-05, 5.768239498138428e-05, 6.542354822158813e-05, 7.316470146179199e-05, 8.090585470199585e-05, 8.864700794219971e-05, 9.638816118240356e-05, 0.00010412931442260742, 0.00011187046766281128, 0.00011961162090301514, 0.000127352774143219, 0.00013509392738342285, 0.0001428350806236267, 0.00015057623386383057, 0.00015831738710403442, 0.00016605854034423828, 0.00017379969358444214, 0.000181540846824646, 0.00018928200006484985, 0.0001970231533050537, 0.00020476430654525757, 0.00021250545978546143, 0.00022024661302566528, 0.00022798776626586914, 0.000235728919506073, 0.00024347007274627686, 0.0002512112259864807, 0.00025895237922668457, 0.00026669353246688843, 0.0002744346857070923, 0.00028217583894729614, 0.0002899169921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 8.0, 8.0, 13.0, 30.0, 24.0, 33.0, 43.0, 59.0, 92.0, 150.0, 215.0, 288.0, 491.0, 709.0, 1186.0, 2083.0, 4201.0, 8900.0, 24586.0, 136122.0, 796186.0, 46793.0, 13635.0, 5687.0, 2818.0, 1629.0, 866.0, 567.0, 374.0, 239.0, 153.0, 100.0, 94.0, 57.0, 24.0, 25.0, 15.0, 9.0, 8.0, 8.0, 3.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.263671875, -0.2546501159667969, -0.24562835693359375, -0.23660659790039062, -0.2275848388671875, -0.21856307983398438, -0.20954132080078125, -0.20051956176757812, -0.191497802734375, -0.18247604370117188, -0.17345428466796875, -0.16443252563476562, -0.1554107666015625, -0.14638900756835938, -0.13736724853515625, -0.12834548950195312, -0.11932373046875, -0.11030197143554688, -0.10128021240234375, -0.09225845336914062, -0.0832366943359375, -0.07421493530273438, -0.06519317626953125, -0.056171417236328125, -0.047149658203125, -0.038127899169921875, -0.02910614013671875, -0.020084381103515625, -0.0110626220703125, -0.002040863037109375, 0.00698089599609375, 0.016002655029296875, 0.0250244140625, 0.034046173095703125, 0.04306793212890625, 0.052089691162109375, 0.0611114501953125, 0.07013320922851562, 0.07915496826171875, 0.08817672729492188, 0.097198486328125, 0.10622024536132812, 0.11524200439453125, 0.12426376342773438, 0.1332855224609375, 0.14230728149414062, 0.15132904052734375, 0.16035079956054688, 0.16937255859375, 0.17839431762695312, 0.18741607666015625, 0.19643783569335938, 0.2054595947265625, 0.21448135375976562, 0.22350311279296875, 0.23252487182617188, 0.241546630859375, 0.2505683898925781, 0.25959014892578125, 0.2686119079589844, 0.2776336669921875, 0.2866554260253906, 0.29567718505859375, 0.3046989440917969, 0.313720703125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 7.0, 4.0, 8.0, 12.0, 5.0, 5.0, 5.0, 10.0, 10.0, 20.0, 26.0, 38.0, 102.0, 125.0, 203.0, 156.0, 82.0, 45.0, 18.0, 23.0, 14.0, 14.0, 11.0, 9.0, 11.0, 4.0, 4.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53564453125, -0.5181045532226562, -0.5005645751953125, -0.48302459716796875, -0.465484619140625, -0.44794464111328125, -0.4304046630859375, -0.41286468505859375, -0.39532470703125, -0.37778472900390625, -0.3602447509765625, -0.34270477294921875, -0.325164794921875, -0.30762481689453125, -0.2900848388671875, -0.27254486083984375, -0.2550048828125, -0.23746490478515625, -0.2199249267578125, -0.20238494873046875, -0.184844970703125, -0.16730499267578125, -0.1497650146484375, -0.13222503662109375, -0.11468505859375, -0.09714508056640625, -0.0796051025390625, -0.06206512451171875, -0.044525146484375, -0.02698516845703125, -0.0094451904296875, 0.00809478759765625, 0.025634765625, 0.04317474365234375, 0.0607147216796875, 0.07825469970703125, 0.095794677734375, 0.11333465576171875, 0.1308746337890625, 0.14841461181640625, 0.16595458984375, 0.18349456787109375, 0.2010345458984375, 0.21857452392578125, 0.236114501953125, 0.25365447998046875, 0.2711944580078125, 0.28873443603515625, 0.3062744140625, 0.32381439208984375, 0.3413543701171875, 0.35889434814453125, 0.376434326171875, 0.39397430419921875, 0.4115142822265625, 0.42905426025390625, 0.44659423828125, 0.46413421630859375, 0.4816741943359375, 0.49921417236328125, 0.516754150390625, 0.5342941284179688, 0.5518341064453125, 0.5693740844726562, 0.5869140625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 15.0, 27.0, 56.0, 90.0, 567.0, 127.0, 50.0, 33.0, 11.0, 13.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.343408584594727, -28.584228515625, -27.825048446655273, -27.065868377685547, -26.306690216064453, -25.547510147094727, -24.788330078125, -24.029150009155273, -23.269969940185547, -22.51078987121582, -21.751609802246094, -20.992431640625, -20.233251571655273, -19.474071502685547, -18.71489143371582, -17.955711364746094, -17.196533203125, -16.437353134155273, -15.678174018859863, -14.918993949890137, -14.159814834594727, -13.400634765625, -12.641454696655273, -11.882274627685547, -11.123095512390137, -10.36391544342041, -9.604736328125, -8.845556259155273, -8.086376190185547, -7.327197074890137, -6.56801700592041, -5.808837413787842, -5.049655914306641, -4.290476322174072, -3.531296491622925, -2.7721166610717773, -2.012937068939209, -1.2537574768066406, -0.49457740783691406, 0.2646021842956543, 1.0237817764282227, 1.7829614877700806, 2.5421411991119385, 3.301321029663086, 4.060500621795654, 4.819680213928223, 5.578860282897949, 6.338039875030518, 7.097219467163086, 7.856399059295654, 8.615578651428223, 9.37475872039795, 10.13393783569336, 10.893117904663086, 11.652297973632812, 12.411478042602539, 13.17065715789795, 13.929837226867676, 14.689016342163086, 15.448196411132812, 16.20737648010254, 16.966556549072266, 17.72573471069336, 18.484914779663086, 19.244094848632812]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 10.0, 18.0, 14.0, 18.0, 7.0, 18.0, 23.0, 21.0, 28.0, 35.0, 37.0, 56.0, 283.0, 216.0, 46.0, 27.0, 33.0, 21.0, 17.0, 10.0, 16.0, 15.0, 8.0, 7.0, 3.0, 7.0, 4.0, 6.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.077590942382812, -21.524276733398438, -20.970964431762695, -20.41765022277832, -19.864336013793945, -19.311023712158203, -18.757709503173828, -18.204395294189453, -17.651081085205078, -17.097766876220703, -16.54445457458496, -15.991140365600586, -15.437826156616211, -14.884512901306152, -14.331199645996094, -13.777885437011719, -13.224573135375977, -12.671259880065918, -12.117945671081543, -11.564632415771484, -11.01131820678711, -10.45800495147705, -9.904691696166992, -9.351377487182617, -8.798064231872559, -8.2447509765625, -7.691436767578125, -7.138123512268066, -6.58480978012085, -6.031496047973633, -5.478182792663574, -4.924869060516357, -4.371553421020508, -3.818239688873291, -3.2649261951446533, -2.7116127014160156, -2.158298969268799, -1.604985237121582, -1.0516717433929443, -0.49835824966430664, 0.054955482482910156, 0.6082690954208374, 1.1615827083587646, 1.714896321296692, 2.268209934234619, 2.821523666381836, 3.3748371601104736, 3.9281506538391113, 4.481464385986328, 5.034778118133545, 5.588091850280762, 6.14140510559082, 6.694718837738037, 7.248032569885254, 7.8013458251953125, 8.354660034179688, 8.907973289489746, 9.461286544799805, 10.01460075378418, 10.567914009094238, 11.121227264404297, 11.674541473388672, 12.22785472869873, 12.781167984008789, 13.334482192993164]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 4.0, 5.0, 7.0, 5.0, 9.0, 6.0, 11.0, 10.0, 13.0, 10.0, 18.0, 26.0, 20.0, 21.0, 27.0, 27.0, 44.0, 51.0, 80.0, 213.0, 100.0, 41.0, 46.0, 15.0, 31.0, 25.0, 16.0, 17.0, 19.0, 20.0, 15.0, 12.0, 10.0, 8.0, 5.0, 0.0, 3.0, 4.0, 1.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.9716796875, -0.9464340209960938, -0.9211883544921875, -0.8959426879882812, -0.870697021484375, -0.8454513549804688, -0.8202056884765625, -0.7949600219726562, -0.76971435546875, -0.7444686889648438, -0.7192230224609375, -0.6939773559570312, -0.668731689453125, -0.6434860229492188, -0.6182403564453125, -0.5929946899414062, -0.5677490234375, -0.5425033569335938, -0.5172576904296875, -0.49201202392578125, -0.466766357421875, -0.44152069091796875, -0.4162750244140625, -0.39102935791015625, -0.36578369140625, -0.34053802490234375, -0.3152923583984375, -0.29004669189453125, -0.264801025390625, -0.23955535888671875, -0.2143096923828125, -0.18906402587890625, -0.163818359375, -0.13857269287109375, -0.1133270263671875, -0.08808135986328125, -0.062835693359375, -0.03759002685546875, -0.0123443603515625, 0.01290130615234375, 0.03814697265625, 0.06339263916015625, 0.0886383056640625, 0.11388397216796875, 0.139129638671875, 0.16437530517578125, 0.1896209716796875, 0.21486663818359375, 0.2401123046875, 0.26535797119140625, 0.2906036376953125, 0.31584930419921875, 0.341094970703125, 0.36634063720703125, 0.3915863037109375, 0.41683197021484375, 0.44207763671875, 0.46732330322265625, 0.4925689697265625, 0.5178146362304688, 0.543060302734375, 0.5683059692382812, 0.5935516357421875, 0.6187973022460938, 0.64404296875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 1.0, 3.0, 11.0, 9.0, 7.0, 13.0, 11.0, 32.0, 37.0, 67.0, 107.0, 184.0, 363.0, 812.0, 2454.0, 10997.0, 8336661.0, 30420.0, 4010.0, 1253.0, 501.0, 239.0, 122.0, 71.0, 57.0, 40.0, 25.0, 12.0, 10.0, 9.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.116008758544922, -7.867669105529785, -7.619329929351807, -7.37099027633667, -7.122651100158691, -6.874311447143555, -6.625971794128418, -6.3776326179504395, -6.129293441772461, -5.880953788757324, -5.632614612579346, -5.384274959564209, -5.1359357833862305, -4.887596130371094, -4.639256477355957, -4.3909173011779785, -4.142577648162842, -3.894238233566284, -3.6458988189697266, -3.39755916595459, -3.1492199897766113, -2.9008803367614746, -2.652540922164917, -2.4042015075683594, -2.1558620929718018, -1.9075226783752441, -1.6591832637786865, -1.4108437299728394, -1.1625043153762817, -0.9141649007797241, -0.665825366973877, -0.41748595237731934, -0.16914606094360352, 0.07919338345527649, 0.3275328278541565, 0.5758723020553589, 0.8242117166519165, 1.0725511312484741, 1.3208906650543213, 1.569230079650879, 1.8175694942474365, 2.065908908843994, 2.3142483234405518, 2.5625877380371094, 2.810927391052246, 3.0592665672302246, 3.3076062202453613, 3.555945634841919, 3.8042850494384766, 4.052624702453613, 4.300963878631592, 4.5493035316467285, 4.797642707824707, 5.045982360839844, 5.2943220138549805, 5.542661190032959, 5.7910003662109375, 6.039340019226074, 6.287679195404053, 6.5360188484191895, 6.784358024597168, 7.032697677612305, 7.281037330627441, 7.52937650680542, 7.777716159820557]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 1.0, 3.0, 4.0, 7.0, 8.0, 3.0, 3.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.90190601348877, -13.522135734558105, -13.142365455627441, -12.762595176696777, -12.382824897766113, -12.00305461883545, -11.623283386230469, -11.243513107299805, -10.86374282836914, -10.483972549438477, -10.104202270507812, -9.724431991577148, -9.344661712646484, -8.96489143371582, -8.585121154785156, -8.205350875854492, -7.825580596923828, -7.445810317993164, -7.0660400390625, -6.686269760131836, -6.306499481201172, -5.926729202270508, -5.5469584465026855, -5.1671881675720215, -4.787417888641357, -4.407647609710693, -4.027877330780029, -3.648106813430786, -3.268336534500122, -2.888566255569458, -2.508795738220215, -2.129025459289551, -1.7492551803588867, -1.3694849014282227, -0.989714503288269, -0.6099441051483154, -0.23017382621765137, 0.1495964527130127, 0.5293669700622559, 0.9091372489929199, 1.288907527923584, 1.668677806854248, 2.048448085784912, 2.4282186031341553, 2.8079888820648193, 3.1877591609954834, 3.5675296783447266, 3.9472999572753906, 4.327070236206055, 4.706840515136719, 5.086610794067383, 5.466381072998047, 5.846151351928711, 6.225921630859375, 6.605692386627197, 6.985462665557861, 7.365232944488525, 7.7450032234191895, 8.124773979187012, 8.504544258117676, 8.88431453704834, 9.264084815979004, 9.643855094909668, 10.023625373840332, 10.403395652770996]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 8.0, 12.0, 22.0, 36.0, 45.0, 72.0, 101.0, 129.0, 148.0, 127.0, 105.0, 72.0, 41.0, 24.0, 20.0, 11.0, 15.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.529296875, -0.5066299438476562, -0.4839630126953125, -0.46129608154296875, -0.438629150390625, -0.41596221923828125, -0.3932952880859375, -0.37062835693359375, -0.34796142578125, -0.32529449462890625, -0.3026275634765625, -0.27996063232421875, -0.257293701171875, -0.23462677001953125, -0.2119598388671875, -0.18929290771484375, -0.1666259765625, -0.14395904541015625, -0.1212921142578125, -0.09862518310546875, -0.075958251953125, -0.05329132080078125, -0.0306243896484375, -0.00795745849609375, 0.01470947265625, 0.03737640380859375, 0.0600433349609375, 0.08271026611328125, 0.105377197265625, 0.12804412841796875, 0.1507110595703125, 0.17337799072265625, 0.196044921875, 0.21871185302734375, 0.2413787841796875, 0.26404571533203125, 0.286712646484375, 0.30937957763671875, 0.3320465087890625, 0.35471343994140625, 0.37738037109375, 0.40004730224609375, 0.4227142333984375, 0.44538116455078125, 0.468048095703125, 0.49071502685546875, 0.5133819580078125, 0.5360488891601562, 0.5587158203125, 0.5813827514648438, 0.6040496826171875, 0.6267166137695312, 0.649383544921875, 0.6720504760742188, 0.6947174072265625, 0.7173843383789062, 0.74005126953125, 0.7627182006835938, 0.7853851318359375, 0.8080520629882812, 0.830718994140625, 0.8533859252929688, 0.8760528564453125, 0.8987197875976562, 0.92138671875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 12.0, 15.0, 27.0, 49.0, 63.0, 116.0, 205.0, 327.0, 639.0, 1480.0, 3851.0, 13019.0, 57324.0, 248632.0, 154718.0, 31062.0, 7796.0, 2573.0, 1010.0, 556.0, 279.0, 163.0, 104.0, 72.0, 39.0, 42.0, 27.0, 15.0, 16.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.40625, -8.1143798828125, -7.822509765625, -7.5306396484375, -7.23876953125, -6.9468994140625, -6.655029296875, -6.3631591796875, -6.0712890625, -5.7794189453125, -5.487548828125, -5.1956787109375, -4.90380859375, -4.6119384765625, -4.320068359375, -4.0281982421875, -3.736328125, -3.4444580078125, -3.152587890625, -2.8607177734375, -2.56884765625, -2.2769775390625, -1.985107421875, -1.6932373046875, -1.4013671875, -1.1094970703125, -0.817626953125, -0.5257568359375, -0.23388671875, 0.0579833984375, 0.349853515625, 0.6417236328125, 0.93359375, 1.2254638671875, 1.517333984375, 1.8092041015625, 2.10107421875, 2.3929443359375, 2.684814453125, 2.9766845703125, 3.2685546875, 3.5604248046875, 3.852294921875, 4.1441650390625, 4.43603515625, 4.7279052734375, 5.019775390625, 5.3116455078125, 5.603515625, 5.8953857421875, 6.187255859375, 6.4791259765625, 6.77099609375, 7.0628662109375, 7.354736328125, 7.6466064453125, 7.9384765625, 8.2303466796875, 8.522216796875, 8.8140869140625, 9.10595703125, 9.3978271484375, 9.689697265625, 9.9815673828125, 10.2734375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 7.0, 12.0, 10.0, 14.0, 15.0, 22.0, 18.0, 46.0, 46.0, 45.0, 61.0, 66.0, 77.0, 70.0, 96.0, 78.0, 60.0, 57.0, 51.0, 38.0, 34.0, 16.0, 18.0, 10.0, 11.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.005859375, -0.9661712646484375, -0.926483154296875, -0.8867950439453125, -0.84710693359375, -0.8074188232421875, -0.767730712890625, -0.7280426025390625, -0.6883544921875, -0.6486663818359375, -0.608978271484375, -0.5692901611328125, -0.52960205078125, -0.4899139404296875, -0.450225830078125, -0.4105377197265625, -0.370849609375, -0.3311614990234375, -0.291473388671875, -0.2517852783203125, -0.21209716796875, -0.1724090576171875, -0.132720947265625, -0.0930328369140625, -0.0533447265625, -0.0136566162109375, 0.026031494140625, 0.0657196044921875, 0.10540771484375, 0.1450958251953125, 0.184783935546875, 0.2244720458984375, 0.26416015625, 0.3038482666015625, 0.343536376953125, 0.3832244873046875, 0.42291259765625, 0.4626007080078125, 0.502288818359375, 0.5419769287109375, 0.5816650390625, 0.6213531494140625, 0.661041259765625, 0.7007293701171875, 0.74041748046875, 0.7801055908203125, 0.819793701171875, 0.8594818115234375, 0.899169921875, 0.9388580322265625, 0.978546142578125, 1.0182342529296875, 1.05792236328125, 1.0976104736328125, 1.137298583984375, 1.1769866943359375, 1.2166748046875, 1.2563629150390625, 1.296051025390625, 1.3357391357421875, 1.37542724609375, 1.4151153564453125, 1.454803466796875, 1.4944915771484375, 1.5341796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 13.0, 31.0, 38.0, 72.0, 84.0, 75.0, 69.0, 25.0, 24.0, 6.0, 6.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.710701942443848, -6.456543922424316, -6.202386379241943, -5.94822883605957, -5.694070816040039, -5.439912796020508, -5.185755252838135, -4.931597709655762, -4.6774396896362305, -4.423281669616699, -4.169124126434326, -3.914966344833374, -3.660808563232422, -3.4066507816314697, -3.1524930000305176, -2.8983352184295654, -2.6441774368286133, -2.390019655227661, -2.135861873626709, -1.8817040920257568, -1.6275463104248047, -1.3733885288238525, -1.1192307472229004, -0.8650729656219482, -0.6109151840209961, -0.35675740242004395, -0.1025996208190918, 0.15155816078186035, 0.4057159423828125, 0.6598737239837646, 0.9140315055847168, 1.168189287185669, 1.4223461151123047, 1.6765038967132568, 1.930661678314209, 2.184819459915161, 2.4389772415161133, 2.6931350231170654, 2.9472928047180176, 3.2014505863189697, 3.455608367919922, 3.709766149520874, 3.963923931121826, 4.218081474304199, 4.4722394943237305, 4.726397514343262, 4.980555057525635, 5.234712600708008, 5.488870620727539, 5.74302864074707, 5.997186183929443, 6.251343727111816, 6.505501747131348, 6.759659767150879, 7.013817310333252, 7.267974853515625, 7.522132873535156, 7.7762908935546875, 8.030448913574219, 8.284605979919434, 8.538763999938965, 8.792922019958496, 9.047079086303711, 9.301237106323242, 9.555395126342773]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 14.0, 27.0, 25.0, 44.0, 51.0, 81.0, 64.0, 26.0, 30.0, 28.0, 13.0, 10.0, 5.0, 5.0, 5.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8963820934295654, -3.7414605617523193, -3.5865390300750732, -3.431617498397827, -3.27669620513916, -3.121774673461914, -2.966853141784668, -2.811931610107422, -2.657010078430176, -2.5020885467529297, -2.3471670150756836, -2.1922454833984375, -2.0373239517211914, -1.8824025392532349, -1.7274811267852783, -1.5725595951080322, -1.4176380634307861, -1.26271653175354, -1.107795000076294, -0.9528735876083374, -0.7979520559310913, -0.6430305242538452, -0.4881090521812439, -0.3331875801086426, -0.17826604843139648, -0.02334454655647278, 0.13157695531845093, 0.28649845719337463, 0.44141995906829834, 0.5963414907455444, 0.7512629628181458, 0.9061844348907471, 1.061105728149414, 1.2160272598266602, 1.3709487915039062, 1.5258702039718628, 1.6807917356491089, 1.835713267326355, 1.9906346797943115, 2.1455562114715576, 2.3004777431488037, 2.45539927482605, 2.610320806503296, 2.765242338180542, 2.920163631439209, 3.075085163116455, 3.230006694793701, 3.3849282264709473, 3.5398497581481934, 3.6947712898254395, 3.8496928215026855, 4.004614353179932, 4.159535884857178, 4.314457416534424, 4.46937894821167, 4.624300003051758, 4.779221534729004, 4.93414306640625, 5.089064598083496, 5.243986129760742, 5.398907661437988, 5.553829193115234, 5.7087507247924805, 5.863672256469727, 6.018593788146973]}, "eval/loss": 4.259941577911377, "eval/wer": 1.0190995636652123, "eval/runtime": 524.0014, "eval/samples_per_second": 5.042, "eval/steps_per_second": 0.632, "train/train_runtime": 51677.5666, "train/train_samples_per_second": 5.522, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 4.09313003856505} \ No newline at end of file