diff --git "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" --- "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" +++ "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.9251, "train/learning_rate": 3.2066153313506185e-07, "train/epoch": 3.0, "train/global_step": 9720, "_runtime": 93795, "_timestamp": 1651767884, "_step": 9739, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 41.0, 232.0, 466.0, 211.0, 43.0, 14.0, 1.0], "bins": [-22.81093406677246, -22.4266300201416, -22.042327880859375, -21.658023834228516, -21.27372169494629, -20.88941764831543, -20.505115509033203, -20.120811462402344, -19.736509323120117, -19.352205276489258, -18.96790313720703, -18.583599090576172, -18.199296951293945, -17.814992904663086, -17.43069076538086, -17.04638671875, -16.66208267211914, -16.27777862548828, -15.893476486206055, -15.509173393249512, -15.124870300292969, -14.740567207336426, -14.356264114379883, -13.971960067749023, -13.587657928466797, -13.203354835510254, -12.819051742553711, -12.434748649597168, -12.050445556640625, -11.666142463684082, -11.281839370727539, -10.89753532409668, -10.513232231140137, -10.128929138183594, -9.74462604522705, -9.360322952270508, -8.976019859313965, -8.591716766357422, -8.207412719726562, -7.823110103607178, -7.438807487487793, -7.05450439453125, -6.670201301574707, -6.285898208618164, -5.901595115661621, -5.517292022705078, -5.132988452911377, -4.748685359954834, -4.364382266998291, -3.980079174041748, -3.595776081085205, -3.211472749710083, -2.82716965675354, -2.442866563796997, -2.058563232421875, -1.674260139465332, -1.2899569272994995, -0.9056537747383118, -0.521350622177124, -0.1370474100112915, 0.24725568294525146, 0.6315587759017944, 1.0158621072769165, 1.4001652002334595, 1.7844682931900024]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 3.0, 8.0, 13.0, 11.0, 13.0, 15.0, 16.0, 22.0, 21.0, 24.0, 29.0, 26.0, 28.0, 39.0, 33.0, 41.0, 34.0, 32.0, 33.0, 47.0, 38.0, 41.0, 30.0, 35.0, 35.0, 43.0, 38.0, 31.0, 30.0, 23.0, 33.0, 16.0, 25.0, 16.0, 12.0, 19.0, 6.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 6.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.0006556510925293, -1.933129072189331, -1.8656026124954224, -1.7980761528015137, -1.7305495738983154, -1.6630229949951172, -1.5954965353012085, -1.5279700756072998, -1.4604434967041016, -1.3929169178009033, -1.3253904581069946, -1.257863998413086, -1.1903374195098877, -1.1228108406066895, -1.0552843809127808, -0.9877578616142273, -0.9202313423156738, -0.8527048230171204, -0.7851783037185669, -0.7176517844200134, -0.65012526512146, -0.5825987458229065, -0.515072226524353, -0.44754570722579956, -0.3800191879272461, -0.3124926686286926, -0.24496614933013916, -0.1774396300315857, -0.10991311073303223, -0.04238659143447876, 0.025139927864074707, 0.09266644716262817, 0.16019272804260254, 0.227719247341156, 0.2952457666397095, 0.36277228593826294, 0.4302988052368164, 0.4978253245353699, 0.5653518438339233, 0.6328783631324768, 0.7004048824310303, 0.7679314017295837, 0.8354579210281372, 0.9029844403266907, 0.9705109596252441, 1.0380375385284424, 1.105563998222351, 1.1730904579162598, 1.240617036819458, 1.3081436157226562, 1.375670075416565, 1.4431965351104736, 1.5107231140136719, 1.5782496929168701, 1.6457761526107788, 1.7133026123046875, 1.7808291912078857, 1.848355770111084, 1.9158822298049927, 1.9834086894989014, 2.0509352684020996, 2.118461847305298, 2.185988426208496, 2.2535147666931152, 2.3210413455963135]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 7.0, 8.0, 9.0, 10.0, 20.0, 21.0, 38.0, 62.0, 83.0, 124.0, 179.0, 285.0, 389.0, 552.0, 796.0, 1204.0, 1853.0, 3058.0, 5427.0, 9892.0, 19022.0, 38094.0, 82406.0, 219508.0, 868829.0, 2214707.0, 462620.0, 142770.0, 60228.0, 28659.0, 14034.0, 7695.0, 4267.0, 2619.0, 1648.0, 1032.0, 694.0, 471.0, 298.0, 220.0, 151.0, 92.0, 76.0, 41.0, 29.0, 27.0, 10.0, 8.0, 6.0, 5.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.96484375, -1.899993896484375, -1.83514404296875, -1.770294189453125, -1.7054443359375, -1.640594482421875, -1.57574462890625, -1.510894775390625, -1.446044921875, -1.381195068359375, -1.31634521484375, -1.251495361328125, -1.1866455078125, -1.121795654296875, -1.05694580078125, -0.992095947265625, -0.92724609375, -0.862396240234375, -0.79754638671875, -0.732696533203125, -0.6678466796875, -0.602996826171875, -0.53814697265625, -0.473297119140625, -0.408447265625, -0.343597412109375, -0.27874755859375, -0.213897705078125, -0.1490478515625, -0.084197998046875, -0.01934814453125, 0.045501708984375, 0.1103515625, 0.175201416015625, 0.24005126953125, 0.304901123046875, 0.3697509765625, 0.434600830078125, 0.49945068359375, 0.564300537109375, 0.629150390625, 0.694000244140625, 0.75885009765625, 0.823699951171875, 0.8885498046875, 0.953399658203125, 1.01824951171875, 1.083099365234375, 1.14794921875, 1.212799072265625, 1.27764892578125, 1.342498779296875, 1.4073486328125, 1.472198486328125, 1.53704833984375, 1.601898193359375, 1.666748046875, 1.731597900390625, 1.79644775390625, 1.861297607421875, 1.9261474609375, 1.990997314453125, 2.05584716796875, 2.120697021484375, 2.185546875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 10.0, 4.0, 9.0, 9.0, 13.0, 11.0, 14.0, 25.0, 22.0, 30.0, 15.0, 32.0, 40.0, 40.0, 37.0, 45.0, 26.0, 51.0, 47.0, 53.0, 48.0, 48.0, 44.0, 29.0, 52.0, 41.0, 29.0, 32.0, 21.0, 23.0, 21.0, 22.0, 14.0, 10.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.65625, -3.538665771484375, -3.42108154296875, -3.303497314453125, -3.1859130859375, -3.068328857421875, -2.95074462890625, -2.833160400390625, -2.715576171875, -2.597991943359375, -2.48040771484375, -2.362823486328125, -2.2452392578125, -2.127655029296875, -2.01007080078125, -1.892486572265625, -1.77490234375, -1.657318115234375, -1.53973388671875, -1.422149658203125, -1.3045654296875, -1.186981201171875, -1.06939697265625, -0.951812744140625, -0.834228515625, -0.716644287109375, -0.59906005859375, -0.481475830078125, -0.3638916015625, -0.246307373046875, -0.12872314453125, -0.011138916015625, 0.1064453125, 0.224029541015625, 0.34161376953125, 0.459197998046875, 0.5767822265625, 0.694366455078125, 0.81195068359375, 0.929534912109375, 1.047119140625, 1.164703369140625, 1.28228759765625, 1.399871826171875, 1.5174560546875, 1.635040283203125, 1.75262451171875, 1.870208740234375, 1.98779296875, 2.105377197265625, 2.22296142578125, 2.340545654296875, 2.4581298828125, 2.575714111328125, 2.69329833984375, 2.810882568359375, 2.928466796875, 3.046051025390625, 3.16363525390625, 3.281219482421875, 3.3988037109375, 3.516387939453125, 3.63397216796875, 3.751556396484375, 3.869140625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 3.0, 6.0, 7.0, 11.0, 11.0, 21.0, 35.0, 58.0, 86.0, 172.0, 1069.0, 4186925.0, 5374.0, 249.0, 95.0, 60.0, 26.0, 22.0, 30.0, 13.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-65.5625, -63.6708984375, -61.779296875, -59.8876953125, -57.99609375, -56.1044921875, -54.212890625, -52.3212890625, -50.4296875, -48.5380859375, -46.646484375, -44.7548828125, -42.86328125, -40.9716796875, -39.080078125, -37.1884765625, -35.296875, -33.4052734375, -31.513671875, -29.6220703125, -27.73046875, -25.8388671875, -23.947265625, -22.0556640625, -20.1640625, -18.2724609375, -16.380859375, -14.4892578125, -12.59765625, -10.7060546875, -8.814453125, -6.9228515625, -5.03125, -3.1396484375, -1.248046875, 0.6435546875, 2.53515625, 4.4267578125, 6.318359375, 8.2099609375, 10.1015625, 11.9931640625, 13.884765625, 15.7763671875, 17.66796875, 19.5595703125, 21.451171875, 23.3427734375, 25.234375, 27.1259765625, 29.017578125, 30.9091796875, 32.80078125, 34.6923828125, 36.583984375, 38.4755859375, 40.3671875, 42.2587890625, 44.150390625, 46.0419921875, 47.93359375, 49.8251953125, 51.716796875, 53.6083984375, 55.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 6.0, 6.0, 15.0, 18.0, 24.0, 26.0, 66.0, 92.0, 157.0, 682.0, 2059.0, 554.0, 142.0, 84.0, 49.0, 29.0, 22.0, 13.0, 13.0, 11.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.216796875, -2.14630126953125, -2.0758056640625, -2.00531005859375, -1.934814453125, -1.86431884765625, -1.7938232421875, -1.72332763671875, -1.65283203125, -1.58233642578125, -1.5118408203125, -1.44134521484375, -1.370849609375, -1.30035400390625, -1.2298583984375, -1.15936279296875, -1.0888671875, -1.01837158203125, -0.9478759765625, -0.87738037109375, -0.806884765625, -0.73638916015625, -0.6658935546875, -0.59539794921875, -0.52490234375, -0.45440673828125, -0.3839111328125, -0.31341552734375, -0.242919921875, -0.17242431640625, -0.1019287109375, -0.03143310546875, 0.0390625, 0.10955810546875, 0.1800537109375, 0.25054931640625, 0.321044921875, 0.39154052734375, 0.4620361328125, 0.53253173828125, 0.60302734375, 0.67352294921875, 0.7440185546875, 0.81451416015625, 0.885009765625, 0.95550537109375, 1.0260009765625, 1.09649658203125, 1.1669921875, 1.23748779296875, 1.3079833984375, 1.37847900390625, 1.448974609375, 1.51947021484375, 1.5899658203125, 1.66046142578125, 1.73095703125, 1.80145263671875, 1.8719482421875, 1.94244384765625, 2.012939453125, 2.08343505859375, 2.1539306640625, 2.22442626953125, 2.294921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 13.0, 26.0, 31.0, 35.0, 72.0, 82.0, 131.0, 130.0, 138.0, 111.0, 78.0, 52.0, 37.0, 24.0, 12.0, 9.0, 5.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-12.560930252075195, -12.301332473754883, -12.04173469543457, -11.782137870788574, -11.522540092468262, -11.26294231414795, -11.003345489501953, -10.74374771118164, -10.484149932861328, -10.224552154541016, -9.964954376220703, -9.705357551574707, -9.445759773254395, -9.186161994934082, -8.926565170288086, -8.666967391967773, -8.407369613647461, -8.147771835327148, -7.888174533843994, -7.62857723236084, -7.368979454040527, -7.109381675720215, -6.8497843742370605, -6.590187072753906, -6.330589294433594, -6.070991516113281, -5.811394214630127, -5.551796913146973, -5.29219913482666, -5.032601356506348, -4.773004055023193, -4.513406753540039, -4.253809928894043, -3.9942123889923096, -3.734614849090576, -3.4750173091888428, -3.2154197692871094, -2.955822229385376, -2.6962246894836426, -2.436627149581909, -2.177029609680176, -1.9174320697784424, -1.657834529876709, -1.3982369899749756, -1.1386394500732422, -0.8790419101715088, -0.6194443702697754, -0.359846830368042, -0.1002492904663086, 0.1593482494354248, 0.4189457893371582, 0.6785433292388916, 0.938140869140625, 1.1977384090423584, 1.4573359489440918, 1.7169334888458252, 1.9765310287475586, 2.236128568649292, 2.4957261085510254, 2.755323648452759, 3.014921188354492, 3.2745187282562256, 3.534116268157959, 3.7937138080596924, 4.053311347961426]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 9.0, 6.0, 10.0, 11.0, 16.0, 14.0, 16.0, 19.0, 18.0, 17.0, 29.0, 28.0, 34.0, 48.0, 40.0, 34.0, 31.0, 49.0, 33.0, 45.0, 38.0, 36.0, 44.0, 42.0, 32.0, 32.0, 29.0, 32.0, 32.0, 24.0, 27.0, 15.0, 20.0, 23.0, 11.0, 17.0, 5.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.888427495956421, -2.7885069847106934, -2.688586711883545, -2.5886662006378174, -2.488745927810669, -2.3888254165649414, -2.288905143737793, -2.1889846324920654, -2.089064121246338, -1.9891437292099, -1.889223337173462, -1.7893028259277344, -1.689382553100586, -1.5894620418548584, -1.4895416498184204, -1.3896212577819824, -1.289700984954834, -1.189780592918396, -1.089860200881958, -0.9899397492408752, -0.8900193572044373, -0.7900989651679993, -0.6901785135269165, -0.5902581214904785, -0.4903377294540405, -0.39041733741760254, -0.29049691557884216, -0.1905764937400818, -0.0906561017036438, 0.00926429033279419, 0.10918474197387695, 0.20910513401031494, 0.30902528762817383, 0.4089456796646118, 0.5088660717010498, 0.6087865233421326, 0.7087069153785706, 0.8086273074150085, 0.9085477590560913, 1.0084681510925293, 1.1083885431289673, 1.2083089351654053, 1.3082293272018433, 1.4081497192382812, 1.5080702304840088, 1.6079905033111572, 1.7079110145568848, 1.8078314065933228, 1.9077517986297607, 2.0076723098754883, 2.1075925827026367, 2.2075130939483643, 2.3074333667755127, 2.4073538780212402, 2.5072741508483887, 2.607194662094116, 2.7071151733398438, 2.8070356845855713, 2.9069559574127197, 3.0068764686584473, 3.1067967414855957, 3.2067172527313232, 3.306637763977051, 3.406558036804199, 3.5064783096313477]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 8.0, 16.0, 31.0, 47.0, 88.0, 148.0, 271.0, 435.0, 753.0, 1359.0, 2627.0, 5296.0, 11371.0, 26243.0, 65216.0, 173036.0, 349536.0, 248225.0, 96093.0, 37240.0, 15846.0, 7179.0, 3501.0, 1695.0, 932.0, 565.0, 317.0, 188.0, 131.0, 56.0, 20.0, 24.0, 13.0, 12.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.291015625, -1.24603271484375, -1.2010498046875, -1.15606689453125, -1.111083984375, -1.06610107421875, -1.0211181640625, -0.97613525390625, -0.93115234375, -0.88616943359375, -0.8411865234375, -0.79620361328125, -0.751220703125, -0.70623779296875, -0.6612548828125, -0.61627197265625, -0.5712890625, -0.52630615234375, -0.4813232421875, -0.43634033203125, -0.391357421875, -0.34637451171875, -0.3013916015625, -0.25640869140625, -0.21142578125, -0.16644287109375, -0.1214599609375, -0.07647705078125, -0.031494140625, 0.01348876953125, 0.0584716796875, 0.10345458984375, 0.1484375, 0.19342041015625, 0.2384033203125, 0.28338623046875, 0.328369140625, 0.37335205078125, 0.4183349609375, 0.46331787109375, 0.50830078125, 0.55328369140625, 0.5982666015625, 0.64324951171875, 0.688232421875, 0.73321533203125, 0.7781982421875, 0.82318115234375, 0.8681640625, 0.91314697265625, 0.9581298828125, 1.00311279296875, 1.048095703125, 1.09307861328125, 1.1380615234375, 1.18304443359375, 1.22802734375, 1.27301025390625, 1.3179931640625, 1.36297607421875, 1.407958984375, 1.45294189453125, 1.4979248046875, 1.54290771484375, 1.587890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 12.0, 9.0, 14.0, 19.0, 27.0, 19.0, 30.0, 32.0, 37.0, 41.0, 47.0, 64.0, 63.0, 50.0, 65.0, 54.0, 59.0, 55.0, 52.0, 56.0, 37.0, 42.0, 28.0, 25.0, 14.0, 9.0, 15.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.1015625, -3.98828125, -3.875, -3.76171875, -3.6484375, -3.53515625, -3.421875, -3.30859375, -3.1953125, -3.08203125, -2.96875, -2.85546875, -2.7421875, -2.62890625, -2.515625, -2.40234375, -2.2890625, -2.17578125, -2.0625, -1.94921875, -1.8359375, -1.72265625, -1.609375, -1.49609375, -1.3828125, -1.26953125, -1.15625, -1.04296875, -0.9296875, -0.81640625, -0.703125, -0.58984375, -0.4765625, -0.36328125, -0.25, -0.13671875, -0.0234375, 0.08984375, 0.203125, 0.31640625, 0.4296875, 0.54296875, 0.65625, 0.76953125, 0.8828125, 0.99609375, 1.109375, 1.22265625, 1.3359375, 1.44921875, 1.5625, 1.67578125, 1.7890625, 1.90234375, 2.015625, 2.12890625, 2.2421875, 2.35546875, 2.46875, 2.58203125, 2.6953125, 2.80859375, 2.921875, 3.03515625, 3.1484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 3.0, 11.0, 17.0, 21.0, 30.0, 42.0, 76.0, 101.0, 183.0, 418.0, 634.0, 1361.0, 3222.0, 8430.0, 25532.0, 94036.0, 378079.0, 394984.0, 99770.0, 26703.0, 8597.0, 3250.0, 1409.0, 724.0, 355.0, 188.0, 127.0, 78.0, 48.0, 36.0, 18.0, 21.0, 10.0, 9.0, 5.0, 2.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8125, -1.7607421875, -1.708984375, -1.6572265625, -1.60546875, -1.5537109375, -1.501953125, -1.4501953125, -1.3984375, -1.3466796875, -1.294921875, -1.2431640625, -1.19140625, -1.1396484375, -1.087890625, -1.0361328125, -0.984375, -0.9326171875, -0.880859375, -0.8291015625, -0.77734375, -0.7255859375, -0.673828125, -0.6220703125, -0.5703125, -0.5185546875, -0.466796875, -0.4150390625, -0.36328125, -0.3115234375, -0.259765625, -0.2080078125, -0.15625, -0.1044921875, -0.052734375, -0.0009765625, 0.05078125, 0.1025390625, 0.154296875, 0.2060546875, 0.2578125, 0.3095703125, 0.361328125, 0.4130859375, 0.46484375, 0.5166015625, 0.568359375, 0.6201171875, 0.671875, 0.7236328125, 0.775390625, 0.8271484375, 0.87890625, 0.9306640625, 0.982421875, 1.0341796875, 1.0859375, 1.1376953125, 1.189453125, 1.2412109375, 1.29296875, 1.3447265625, 1.396484375, 1.4482421875, 1.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 4.0, 7.0, 9.0, 11.0, 10.0, 15.0, 8.0, 24.0, 28.0, 30.0, 38.0, 33.0, 28.0, 38.0, 32.0, 41.0, 34.0, 45.0, 37.0, 47.0, 44.0, 54.0, 44.0, 41.0, 36.0, 25.0, 35.0, 34.0, 25.0, 17.0, 17.0, 13.0, 19.0, 13.0, 11.0, 8.0, 10.0, 12.0, 12.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.43597412109375, -5.2625732421875, -5.08917236328125, -4.915771484375, -4.74237060546875, -4.5689697265625, -4.39556884765625, -4.22216796875, -4.04876708984375, -3.8753662109375, -3.70196533203125, -3.528564453125, -3.35516357421875, -3.1817626953125, -3.00836181640625, -2.8349609375, -2.66156005859375, -2.4881591796875, -2.31475830078125, -2.141357421875, -1.96795654296875, -1.7945556640625, -1.62115478515625, -1.44775390625, -1.27435302734375, -1.1009521484375, -0.92755126953125, -0.754150390625, -0.58074951171875, -0.4073486328125, -0.23394775390625, -0.060546875, 0.11285400390625, 0.2862548828125, 0.45965576171875, 0.633056640625, 0.80645751953125, 0.9798583984375, 1.15325927734375, 1.32666015625, 1.50006103515625, 1.6734619140625, 1.84686279296875, 2.020263671875, 2.19366455078125, 2.3670654296875, 2.54046630859375, 2.7138671875, 2.88726806640625, 3.0606689453125, 3.23406982421875, 3.407470703125, 3.58087158203125, 3.7542724609375, 3.92767333984375, 4.10107421875, 4.27447509765625, 4.4478759765625, 4.62127685546875, 4.794677734375, 4.96807861328125, 5.1414794921875, 5.31488037109375, 5.48828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 2.0, 7.0, 14.0, 26.0, 37.0, 37.0, 57.0, 85.0, 121.0, 227.0, 306.0, 540.0, 838.0, 1482.0, 2504.0, 4760.0, 9445.0, 21136.0, 53814.0, 170990.0, 420848.0, 237123.0, 73071.0, 26541.0, 11585.0, 5552.0, 3031.0, 1710.0, 1020.0, 557.0, 346.0, 239.0, 154.0, 103.0, 67.0, 48.0, 45.0, 22.0, 20.0, 8.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.373779296875, -0.3619651794433594, -0.35015106201171875, -0.3383369445800781, -0.3265228271484375, -0.3147087097167969, -0.30289459228515625, -0.2910804748535156, -0.279266357421875, -0.2674522399902344, -0.25563812255859375, -0.24382400512695312, -0.2320098876953125, -0.22019577026367188, -0.20838165283203125, -0.19656753540039062, -0.18475341796875, -0.17293930053710938, -0.16112518310546875, -0.14931106567382812, -0.1374969482421875, -0.12568283081054688, -0.11386871337890625, -0.10205459594726562, -0.090240478515625, -0.07842636108398438, -0.06661224365234375, -0.054798126220703125, -0.0429840087890625, -0.031169891357421875, -0.01935577392578125, -0.007541656494140625, 0.0042724609375, 0.016086578369140625, 0.02790069580078125, 0.039714813232421875, 0.0515289306640625, 0.06334304809570312, 0.07515716552734375, 0.08697128295898438, 0.098785400390625, 0.11059951782226562, 0.12241363525390625, 0.13422775268554688, 0.1460418701171875, 0.15785598754882812, 0.16967010498046875, 0.18148422241210938, 0.19329833984375, 0.20511245727539062, 0.21692657470703125, 0.22874069213867188, 0.2405548095703125, 0.2523689270019531, 0.26418304443359375, 0.2759971618652344, 0.287811279296875, 0.2996253967285156, 0.31143951416015625, 0.3232536315917969, 0.3350677490234375, 0.3468818664550781, 0.35869598388671875, 0.3705101013183594, 0.38232421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 12.0, 14.0, 28.0, 20.0, 40.0, 66.0, 81.0, 106.0, 125.0, 142.0, 102.0, 76.0, 54.0, 28.0, 32.0, 21.0, 11.0, 10.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037741661071777344, -0.00036386027932167053, -0.0003503039479255676, -0.0003367476165294647, -0.0003231912851333618, -0.0003096349537372589, -0.000296078622341156, -0.0002825222909450531, -0.0002689659595489502, -0.0002554096281528473, -0.00024185329675674438, -0.00022829696536064148, -0.00021474063396453857, -0.00020118430256843567, -0.00018762797117233276, -0.00017407163977622986, -0.00016051530838012695, -0.00014695897698402405, -0.00013340264558792114, -0.00011984631419181824, -0.00010628998279571533, -9.273365139961243e-05, -7.917732000350952e-05, -6.562098860740662e-05, -5.206465721130371e-05, -3.8508325815200806e-05, -2.49519944190979e-05, -1.1395663022994995e-05, 2.16066837310791e-06, 1.5716999769210815e-05, 2.927333116531372e-05, 4.2829662561416626e-05, 5.638599395751953e-05, 6.994232535362244e-05, 8.349865674972534e-05, 9.705498814582825e-05, 0.00011061131954193115, 0.00012416765093803406, 0.00013772398233413696, 0.00015128031373023987, 0.00016483664512634277, 0.00017839297652244568, 0.00019194930791854858, 0.0002055056393146515, 0.0002190619707107544, 0.0002326183021068573, 0.0002461746335029602, 0.0002597309648990631, 0.000273287296295166, 0.0002868436276912689, 0.0003003999590873718, 0.00031395629048347473, 0.00032751262187957764, 0.00034106895327568054, 0.00035462528467178345, 0.00036818161606788635, 0.00038173794746398926, 0.00039529427886009216, 0.00040885061025619507, 0.000422406941652298, 0.0004359632730484009, 0.0004495196044445038, 0.0004630759358406067, 0.0004766322672367096, 0.0004901885986328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 14.0, 11.0, 11.0, 35.0, 40.0, 66.0, 108.0, 229.0, 976.0, 6056.0, 71367.0, 832968.0, 125746.0, 8947.0, 1273.0, 305.0, 124.0, 91.0, 50.0, 24.0, 19.0, 19.0, 9.0, 8.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.331939697265625, -1.28692626953125, -1.241912841796875, -1.1968994140625, -1.151885986328125, -1.10687255859375, -1.061859130859375, -1.016845703125, -0.971832275390625, -0.92681884765625, -0.881805419921875, -0.8367919921875, -0.791778564453125, -0.74676513671875, -0.701751708984375, -0.65673828125, -0.611724853515625, -0.56671142578125, -0.521697998046875, -0.4766845703125, -0.431671142578125, -0.38665771484375, -0.341644287109375, -0.296630859375, -0.251617431640625, -0.20660400390625, -0.161590576171875, -0.1165771484375, -0.071563720703125, -0.02655029296875, 0.018463134765625, 0.0634765625, 0.108489990234375, 0.15350341796875, 0.198516845703125, 0.2435302734375, 0.288543701171875, 0.33355712890625, 0.378570556640625, 0.423583984375, 0.468597412109375, 0.51361083984375, 0.558624267578125, 0.6036376953125, 0.648651123046875, 0.69366455078125, 0.738677978515625, 0.78369140625, 0.828704833984375, 0.87371826171875, 0.918731689453125, 0.9637451171875, 1.008758544921875, 1.05377197265625, 1.098785400390625, 1.143798828125, 1.188812255859375, 1.23382568359375, 1.278839111328125, 1.3238525390625, 1.368865966796875, 1.41387939453125, 1.458892822265625, 1.50390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 5.0, 1.0, 8.0, 4.0, 5.0, 17.0, 15.0, 16.0, 20.0, 29.0, 33.0, 42.0, 40.0, 50.0, 54.0, 68.0, 70.0, 59.0, 63.0, 69.0, 60.0, 46.0, 56.0, 27.0, 40.0, 30.0, 16.0, 17.0, 8.0, 12.0, 9.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1416015625, -0.1370220184326172, -0.13244247436523438, -0.12786293029785156, -0.12328338623046875, -0.11870384216308594, -0.11412429809570312, -0.10954475402832031, -0.1049652099609375, -0.10038566589355469, -0.09580612182617188, -0.09122657775878906, -0.08664703369140625, -0.08206748962402344, -0.07748794555664062, -0.07290840148925781, -0.068328857421875, -0.06374931335449219, -0.059169769287109375, -0.05459022521972656, -0.05001068115234375, -0.04543113708496094, -0.040851593017578125, -0.03627204895019531, -0.0316925048828125, -0.027112960815429688, -0.022533416748046875, -0.017953872680664062, -0.01337432861328125, -0.008794784545898438, -0.004215240478515625, 0.0003643035888671875, 0.00494384765625, 0.009523391723632812, 0.014102935791015625, 0.018682479858398438, 0.02326202392578125, 0.027841567993164062, 0.032421112060546875, 0.03700065612792969, 0.0415802001953125, 0.04615974426269531, 0.050739288330078125, 0.05531883239746094, 0.05989837646484375, 0.06447792053222656, 0.06905746459960938, 0.07363700866699219, 0.078216552734375, 0.08279609680175781, 0.08737564086914062, 0.09195518493652344, 0.09653472900390625, 0.10111427307128906, 0.10569381713867188, 0.11027336120605469, 0.1148529052734375, 0.11943244934082031, 0.12401199340820312, 0.12859153747558594, 0.13317108154296875, 0.13775062561035156, 0.14233016967773438, 0.1469097137451172, 0.1514892578125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 13.0, 33.0, 121.0, 350.0, 322.0, 110.0, 40.0, 15.0, 3.0, 1.0, 3.0], "bins": [-31.517847061157227, -30.963668823242188, -30.40949058532715, -29.855310440063477, -29.301132202148438, -28.7469539642334, -28.19277572631836, -27.63859748840332, -27.08441925048828, -26.530241012573242, -25.976062774658203, -25.42188262939453, -24.867704391479492, -24.313526153564453, -23.759347915649414, -23.205169677734375, -22.650989532470703, -22.096811294555664, -21.542633056640625, -20.988452911376953, -20.434274673461914, -19.880096435546875, -19.325918197631836, -18.771739959716797, -18.217559814453125, -17.663381576538086, -17.109203338623047, -16.555023193359375, -16.000844955444336, -15.446666717529297, -14.892488479614258, -14.338310241699219, -13.784130096435547, -13.229951858520508, -12.675772666931152, -12.121594429016113, -11.567415237426758, -11.013236999511719, -10.45905876159668, -9.90488052368164, -9.350701332092285, -8.796523094177246, -8.24234390258789, -7.688165664672852, -7.133986949920654, -6.579808235168457, -6.025629997253418, -5.471451282501221, -4.917272567749023, -4.363093852996826, -3.808915376663208, -3.25473690032959, -2.7005581855773926, -2.1463794708251953, -1.5922009944915771, -1.038022518157959, -0.4838438034057617, 0.070334792137146, 0.6245133876800537, 1.1786919832229614, 1.7328705787658691, 2.2870492935180664, 2.8412277698516846, 3.3954062461853027, 3.9495849609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 10.0, 17.0, 23.0, 28.0, 29.0, 25.0, 41.0, 35.0, 65.0, 64.0, 65.0, 64.0, 56.0, 69.0, 60.0, 52.0, 54.0, 44.0, 49.0, 42.0, 26.0, 25.0, 15.0, 9.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.441911697387695, -4.322793006896973, -4.203674793243408, -4.0845561027526855, -3.965437889099121, -3.8463194370269775, -3.727200984954834, -3.6080825328826904, -3.488964080810547, -3.3698456287384033, -3.2507271766662598, -3.131608724594116, -3.0124902725219727, -2.893371820449829, -2.7742533683776855, -2.655134916305542, -2.5360164642333984, -2.416898012161255, -2.2977795600891113, -2.1786611080169678, -2.059542655944824, -1.9404242038726807, -1.821305751800537, -1.7021872997283936, -1.583068609237671, -1.4639501571655273, -1.3448317050933838, -1.2257132530212402, -1.1065948009490967, -0.9874762892723083, -0.8683578372001648, -0.7492393851280212, -0.6301209926605225, -0.5110025405883789, -0.39188408851623535, -0.2727656066417694, -0.15364715456962585, -0.03452867269515991, 0.08458977937698364, 0.2037082314491272, 0.32282668352127075, 0.4419451355934143, 0.5610635876655579, 0.6801820993423462, 0.7993005514144897, 0.9184190034866333, 1.0375374555587769, 1.1566559076309204, 1.275774359703064, 1.3948928117752075, 1.514011263847351, 1.6331297159194946, 1.7522481679916382, 1.8713667392730713, 1.9904851913452148, 2.1096036434173584, 2.228722095489502, 2.3478405475616455, 2.466958999633789, 2.5860774517059326, 2.705195903778076, 2.8243143558502197, 2.9434328079223633, 3.062551259994507, 3.1816697120666504]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 9.0, 17.0, 26.0, 34.0, 74.0, 129.0, 257.0, 594.0, 1410.0, 3652.0, 10241.0, 35789.0, 192897.0, 631025.0, 131685.0, 27353.0, 8093.0, 2947.0, 1208.0, 529.0, 257.0, 131.0, 79.0, 47.0, 19.0, 13.0, 12.0, 11.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.263671875, -2.174560546875, -2.08544921875, -1.996337890625, -1.9072265625, -1.818115234375, -1.72900390625, -1.639892578125, -1.55078125, -1.461669921875, -1.37255859375, -1.283447265625, -1.1943359375, -1.105224609375, -1.01611328125, -0.927001953125, -0.837890625, -0.748779296875, -0.65966796875, -0.570556640625, -0.4814453125, -0.392333984375, -0.30322265625, -0.214111328125, -0.125, -0.035888671875, 0.05322265625, 0.142333984375, 0.2314453125, 0.320556640625, 0.40966796875, 0.498779296875, 0.587890625, 0.677001953125, 0.76611328125, 0.855224609375, 0.9443359375, 1.033447265625, 1.12255859375, 1.211669921875, 1.30078125, 1.389892578125, 1.47900390625, 1.568115234375, 1.6572265625, 1.746337890625, 1.83544921875, 1.924560546875, 2.013671875, 2.102783203125, 2.19189453125, 2.281005859375, 2.3701171875, 2.459228515625, 2.54833984375, 2.637451171875, 2.7265625, 2.815673828125, 2.90478515625, 2.993896484375, 3.0830078125, 3.172119140625, 3.26123046875, 3.350341796875, 3.439453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 4.0, 5.0, 9.0, 8.0, 5.0, 14.0, 24.0, 18.0, 20.0, 23.0, 24.0, 33.0, 30.0, 29.0, 42.0, 39.0, 43.0, 43.0, 46.0, 44.0, 32.0, 39.0, 42.0, 43.0, 44.0, 32.0, 31.0, 30.0, 27.0, 27.0, 21.0, 18.0, 16.0, 17.0, 17.0, 10.0, 10.0, 4.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-8.140625, -7.91253662109375, -7.6844482421875, -7.45635986328125, -7.228271484375, -7.00018310546875, -6.7720947265625, -6.54400634765625, -6.31591796875, -6.08782958984375, -5.8597412109375, -5.63165283203125, -5.403564453125, -5.17547607421875, -4.9473876953125, -4.71929931640625, -4.4912109375, -4.26312255859375, -4.0350341796875, -3.80694580078125, -3.578857421875, -3.35076904296875, -3.1226806640625, -2.89459228515625, -2.66650390625, -2.43841552734375, -2.2103271484375, -1.98223876953125, -1.754150390625, -1.52606201171875, -1.2979736328125, -1.06988525390625, -0.841796875, -0.61370849609375, -0.3856201171875, -0.15753173828125, 0.070556640625, 0.29864501953125, 0.5267333984375, 0.75482177734375, 0.98291015625, 1.21099853515625, 1.4390869140625, 1.66717529296875, 1.895263671875, 2.12335205078125, 2.3514404296875, 2.57952880859375, 2.8076171875, 3.03570556640625, 3.2637939453125, 3.49188232421875, 3.719970703125, 3.94805908203125, 4.1761474609375, 4.40423583984375, 4.63232421875, 4.86041259765625, 5.0885009765625, 5.31658935546875, 5.544677734375, 5.77276611328125, 6.0008544921875, 6.22894287109375, 6.45703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 12.0, 12.0, 12.0, 25.0, 31.0, 42.0, 56.0, 71.0, 102.0, 132.0, 222.0, 432.0, 1308.0, 10681.0, 573857.0, 449960.0, 9307.0, 1126.0, 394.0, 209.0, 144.0, 92.0, 65.0, 47.0, 44.0, 36.0, 21.0, 28.0, 8.0, 13.0, 8.0, 2.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.34765625, -7.12481689453125, -6.9019775390625, -6.67913818359375, -6.456298828125, -6.23345947265625, -6.0106201171875, -5.78778076171875, -5.56494140625, -5.34210205078125, -5.1192626953125, -4.89642333984375, -4.673583984375, -4.45074462890625, -4.2279052734375, -4.00506591796875, -3.7822265625, -3.55938720703125, -3.3365478515625, -3.11370849609375, -2.890869140625, -2.66802978515625, -2.4451904296875, -2.22235107421875, -1.99951171875, -1.77667236328125, -1.5538330078125, -1.33099365234375, -1.108154296875, -0.88531494140625, -0.6624755859375, -0.43963623046875, -0.216796875, 0.00604248046875, 0.2288818359375, 0.45172119140625, 0.674560546875, 0.89739990234375, 1.1202392578125, 1.34307861328125, 1.56591796875, 1.78875732421875, 2.0115966796875, 2.23443603515625, 2.457275390625, 2.68011474609375, 2.9029541015625, 3.12579345703125, 3.3486328125, 3.57147216796875, 3.7943115234375, 4.01715087890625, 4.239990234375, 4.46282958984375, 4.6856689453125, 4.90850830078125, 5.13134765625, 5.35418701171875, 5.5770263671875, 5.79986572265625, 6.022705078125, 6.24554443359375, 6.4683837890625, 6.69122314453125, 6.9140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 9.0, 6.0, 5.0, 11.0, 12.0, 13.0, 16.0, 18.0, 21.0, 25.0, 28.0, 19.0, 39.0, 34.0, 29.0, 38.0, 26.0, 44.0, 35.0, 41.0, 54.0, 45.0, 41.0, 27.0, 42.0, 33.0, 29.0, 31.0, 30.0, 27.0, 24.0, 17.0, 16.0, 21.0, 16.0, 17.0, 12.0, 7.0, 9.0, 1.0, 6.0, 1.0, 6.0, 5.0, 2.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.3046875, -7.06494140625, -6.8251953125, -6.58544921875, -6.345703125, -6.10595703125, -5.8662109375, -5.62646484375, -5.38671875, -5.14697265625, -4.9072265625, -4.66748046875, -4.427734375, -4.18798828125, -3.9482421875, -3.70849609375, -3.46875, -3.22900390625, -2.9892578125, -2.74951171875, -2.509765625, -2.27001953125, -2.0302734375, -1.79052734375, -1.55078125, -1.31103515625, -1.0712890625, -0.83154296875, -0.591796875, -0.35205078125, -0.1123046875, 0.12744140625, 0.3671875, 0.60693359375, 0.8466796875, 1.08642578125, 1.326171875, 1.56591796875, 1.8056640625, 2.04541015625, 2.28515625, 2.52490234375, 2.7646484375, 3.00439453125, 3.244140625, 3.48388671875, 3.7236328125, 3.96337890625, 4.203125, 4.44287109375, 4.6826171875, 4.92236328125, 5.162109375, 5.40185546875, 5.6416015625, 5.88134765625, 6.12109375, 6.36083984375, 6.6005859375, 6.84033203125, 7.080078125, 7.31982421875, 7.5595703125, 7.79931640625, 8.0390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 11.0, 29.0, 39.0, 54.0, 119.0, 214.0, 420.0, 1152.0, 3624.0, 16163.0, 129794.0, 815705.0, 66841.0, 10125.0, 2531.0, 913.0, 365.0, 178.0, 103.0, 50.0, 26.0, 27.0, 21.0, 13.0, 8.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.818359375, -0.7904891967773438, -0.7626190185546875, -0.7347488403320312, -0.706878662109375, -0.6790084838867188, -0.6511383056640625, -0.6232681274414062, -0.59539794921875, -0.5675277709960938, -0.5396575927734375, -0.5117874145507812, -0.483917236328125, -0.45604705810546875, -0.4281768798828125, -0.40030670166015625, -0.3724365234375, -0.34456634521484375, -0.3166961669921875, -0.28882598876953125, -0.260955810546875, -0.23308563232421875, -0.2052154541015625, -0.17734527587890625, -0.14947509765625, -0.12160491943359375, -0.0937347412109375, -0.06586456298828125, -0.037994384765625, -0.01012420654296875, 0.0177459716796875, 0.04561614990234375, 0.073486328125, 0.10135650634765625, 0.1292266845703125, 0.15709686279296875, 0.184967041015625, 0.21283721923828125, 0.2407073974609375, 0.26857757568359375, 0.29644775390625, 0.32431793212890625, 0.3521881103515625, 0.38005828857421875, 0.407928466796875, 0.43579864501953125, 0.4636688232421875, 0.49153900146484375, 0.5194091796875, 0.5472793579101562, 0.5751495361328125, 0.6030197143554688, 0.630889892578125, 0.6587600708007812, 0.6866302490234375, 0.7145004272460938, 0.74237060546875, 0.7702407836914062, 0.7981109619140625, 0.8259811401367188, 0.853851318359375, 0.8817214965820312, 0.9095916748046875, 0.9374618530273438, 0.96533203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 4.0, 10.0, 3.0, 6.0, 23.0, 42.0, 41.0, 66.0, 121.0, 150.0, 182.0, 101.0, 77.0, 47.0, 30.0, 21.0, 14.0, 13.0, 11.0, 7.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011426210403442383, -0.00011033471673727036, -0.00010640732944011688, -0.00010247994214296341, -9.855255484580994e-05, -9.462516754865646e-05, -9.069778025150299e-05, -8.677039295434952e-05, -8.284300565719604e-05, -7.891561836004257e-05, -7.49882310628891e-05, -7.106084376573563e-05, -6.713345646858215e-05, -6.320606917142868e-05, -5.927868187427521e-05, -5.5351294577121735e-05, -5.142390727996826e-05, -4.749651998281479e-05, -4.3569132685661316e-05, -3.964174538850784e-05, -3.571435809135437e-05, -3.17869707942009e-05, -2.7859583497047424e-05, -2.393219619989395e-05, -2.000480890274048e-05, -1.6077421605587006e-05, -1.2150034308433533e-05, -8.22264701128006e-06, -4.295259714126587e-06, -3.67872416973114e-07, 3.559514880180359e-06, 7.486902177333832e-06, 1.1414289474487305e-05, 1.5341676771640778e-05, 1.926906406879425e-05, 2.3196451365947723e-05, 2.7123838663101196e-05, 3.105122596025467e-05, 3.497861325740814e-05, 3.8906000554561615e-05, 4.283338785171509e-05, 4.676077514886856e-05, 5.0688162446022034e-05, 5.4615549743175507e-05, 5.854293704032898e-05, 6.247032433748245e-05, 6.639771163463593e-05, 7.03250989317894e-05, 7.425248622894287e-05, 7.817987352609634e-05, 8.210726082324982e-05, 8.603464812040329e-05, 8.996203541755676e-05, 9.388942271471024e-05, 9.781681001186371e-05, 0.00010174419730901718, 0.00010567158460617065, 0.00010959897190332413, 0.0001135263592004776, 0.00011745374649763107, 0.00012138113379478455, 0.00012530852109193802, 0.0001292359083890915, 0.00013316329568624496, 0.00013709068298339844]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 8.0, 7.0, 15.0, 13.0, 25.0, 46.0, 56.0, 109.0, 204.0, 300.0, 692.0, 1510.0, 4056.0, 12234.0, 49897.0, 519401.0, 394488.0, 47036.0, 11734.0, 3774.0, 1459.0, 685.0, 315.0, 194.0, 106.0, 67.0, 34.0, 21.0, 20.0, 7.0, 10.0, 9.0, 3.0, 1.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65283203125, -0.6317596435546875, -0.610687255859375, -0.5896148681640625, -0.56854248046875, -0.5474700927734375, -0.526397705078125, -0.5053253173828125, -0.4842529296875, -0.4631805419921875, -0.442108154296875, -0.4210357666015625, -0.39996337890625, -0.3788909912109375, -0.357818603515625, -0.3367462158203125, -0.315673828125, -0.2946014404296875, -0.273529052734375, -0.2524566650390625, -0.23138427734375, -0.2103118896484375, -0.189239501953125, -0.1681671142578125, -0.1470947265625, -0.1260223388671875, -0.104949951171875, -0.0838775634765625, -0.06280517578125, -0.0417327880859375, -0.020660400390625, 0.0004119873046875, 0.021484375, 0.0425567626953125, 0.063629150390625, 0.0847015380859375, 0.10577392578125, 0.1268463134765625, 0.147918701171875, 0.1689910888671875, 0.1900634765625, 0.2111358642578125, 0.232208251953125, 0.2532806396484375, 0.27435302734375, 0.2954254150390625, 0.316497802734375, 0.3375701904296875, 0.358642578125, 0.3797149658203125, 0.400787353515625, 0.4218597412109375, 0.44293212890625, 0.4640045166015625, 0.485076904296875, 0.5061492919921875, 0.5272216796875, 0.5482940673828125, 0.569366455078125, 0.5904388427734375, 0.61151123046875, 0.6325836181640625, 0.653656005859375, 0.6747283935546875, 0.69580078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 6.0, 8.0, 10.0, 10.0, 6.0, 11.0, 21.0, 35.0, 43.0, 51.0, 46.0, 105.0, 175.0, 120.0, 71.0, 49.0, 52.0, 28.0, 21.0, 18.0, 21.0, 19.0, 6.0, 5.0, 6.0, 6.0, 7.0, 4.0, 5.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.264404296875, -0.2572002410888672, -0.24999618530273438, -0.24279212951660156, -0.23558807373046875, -0.22838401794433594, -0.22117996215820312, -0.2139759063720703, -0.2067718505859375, -0.1995677947998047, -0.19236373901367188, -0.18515968322753906, -0.17795562744140625, -0.17075157165527344, -0.16354751586914062, -0.1563434600830078, -0.149139404296875, -0.1419353485107422, -0.13473129272460938, -0.12752723693847656, -0.12032318115234375, -0.11311912536621094, -0.10591506958007812, -0.09871101379394531, -0.0915069580078125, -0.08430290222167969, -0.07709884643554688, -0.06989479064941406, -0.06269073486328125, -0.05548667907714844, -0.048282623291015625, -0.04107856750488281, -0.03387451171875, -0.026670455932617188, -0.019466400146484375, -0.012262344360351562, -0.00505828857421875, 0.0021457672119140625, 0.009349822998046875, 0.016553878784179688, 0.0237579345703125, 0.030961990356445312, 0.038166046142578125, 0.04537010192871094, 0.05257415771484375, 0.05977821350097656, 0.06698226928710938, 0.07418632507324219, 0.081390380859375, 0.08859443664550781, 0.09579849243164062, 0.10300254821777344, 0.11020660400390625, 0.11741065979003906, 0.12461471557617188, 0.1318187713623047, 0.1390228271484375, 0.1462268829345703, 0.15343093872070312, 0.16063499450683594, 0.16783905029296875, 0.17504310607910156, 0.18224716186523438, 0.1894512176513672, 0.1966552734375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 61.0, 320.0, 473.0, 126.0, 25.0, 6.0, 2.0], "bins": [-75.66742706298828, -74.3896484375, -73.11187744140625, -71.8341064453125, -70.55632781982422, -69.27854919433594, -68.00077819824219, -66.72300720214844, -65.44522857666016, -64.16744995117188, -62.889678955078125, -61.61190414428711, -60.334129333496094, -59.05635452270508, -57.77857971191406, -56.50080490112305, -55.22303009033203, -53.945255279541016, -52.66748046875, -51.389705657958984, -50.11193084716797, -48.83415603637695, -47.55638122558594, -46.27860641479492, -45.000831604003906, -43.72305679321289, -42.445281982421875, -41.16750717163086, -39.889732360839844, -38.61195755004883, -37.33418273925781, -36.0564079284668, -34.77863693237305, -33.50086212158203, -32.223087310791016, -30.9453125, -29.667537689208984, -28.38976287841797, -27.111988067626953, -25.834213256835938, -24.55643653869629, -23.278661727905273, -22.000886917114258, -20.723112106323242, -19.445337295532227, -18.16756248474121, -16.889787673950195, -15.61201286315918, -14.334238052368164, -13.056463241577148, -11.778688430786133, -10.500913619995117, -9.223138809204102, -7.945363998413086, -6.66758918762207, -5.389814376831055, -4.112040042877197, -2.8342652320861816, -1.556490421295166, -0.2787156105041504, 0.9990592002868652, 2.276834011077881, 3.5546088218688965, 4.832383632659912, 6.110158443450928]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 13.0, 9.0, 9.0, 11.0, 14.0, 16.0, 19.0, 30.0, 21.0, 18.0, 34.0, 27.0, 41.0, 29.0, 23.0, 42.0, 42.0, 30.0, 41.0, 34.0, 45.0, 39.0, 37.0, 32.0, 27.0, 38.0, 27.0, 28.0, 32.0, 20.0, 24.0, 29.0, 24.0, 16.0, 11.0, 10.0, 11.0, 9.0, 7.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.042387962341309, -10.688484191894531, -10.334579467773438, -9.98067569732666, -9.626770973205566, -9.272867202758789, -8.918962478637695, -8.565058708190918, -8.21115493774414, -7.857250690460205, -7.5033464431762695, -7.149442672729492, -6.795538425445557, -6.441634178161621, -6.0877299308776855, -5.73382568359375, -5.3799214363098145, -5.026017189025879, -4.672112941741943, -4.318208694458008, -3.9643049240112305, -3.610400676727295, -3.2564964294433594, -2.902592420578003, -2.5486881732940674, -2.194783926010132, -1.8408799171447754, -1.4869756698608398, -1.1330715417861938, -0.7791674137115479, -0.4252631664276123, -0.07135915756225586, 0.2825450897216797, 0.6364492177963257, 0.9903534054756165, 1.3442575931549072, 1.6981617212295532, 2.052065849304199, 2.4059700965881348, 2.759874105453491, 3.1137783527374268, 3.4676826000213623, 3.8215866088867188, 4.175490856170654, 4.52939510345459, 4.883298873901367, 5.237203598022461, 5.591107368469238, 5.945011615753174, 6.298915863037109, 6.652820110321045, 7.0067243576049805, 7.360628128051758, 7.714532375335693, 8.068436622619629, 8.422340393066406, 8.7762451171875, 9.130148887634277, 9.484053611755371, 9.837957382202148, 10.191862106323242, 10.54576587677002, 10.899669647216797, 11.25357437133789, 11.607478141784668]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 6.0, 8.0, 25.0, 27.0, 45.0, 69.0, 119.0, 214.0, 394.0, 828.0, 1715.0, 4468.0, 12219.0, 42664.0, 295240.0, 3206520.0, 542674.0, 61423.0, 15583.0, 5547.0, 2299.0, 1073.0, 520.0, 290.0, 129.0, 80.0, 37.0, 18.0, 15.0, 9.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.4765625, -5.3309326171875, -5.185302734375, -5.0396728515625, -4.89404296875, -4.7484130859375, -4.602783203125, -4.4571533203125, -4.3115234375, -4.1658935546875, -4.020263671875, -3.8746337890625, -3.72900390625, -3.5833740234375, -3.437744140625, -3.2921142578125, -3.146484375, -3.0008544921875, -2.855224609375, -2.7095947265625, -2.56396484375, -2.4183349609375, -2.272705078125, -2.1270751953125, -1.9814453125, -1.8358154296875, -1.690185546875, -1.5445556640625, -1.39892578125, -1.2532958984375, -1.107666015625, -0.9620361328125, -0.81640625, -0.6707763671875, -0.525146484375, -0.3795166015625, -0.23388671875, -0.0882568359375, 0.057373046875, 0.2030029296875, 0.3486328125, 0.4942626953125, 0.639892578125, 0.7855224609375, 0.93115234375, 1.0767822265625, 1.222412109375, 1.3680419921875, 1.513671875, 1.6593017578125, 1.804931640625, 1.9505615234375, 2.09619140625, 2.2418212890625, 2.387451171875, 2.5330810546875, 2.6787109375, 2.8243408203125, 2.969970703125, 3.1156005859375, 3.26123046875, 3.4068603515625, 3.552490234375, 3.6981201171875, 3.84375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 10.0, 14.0, 17.0, 26.0, 57.0, 51.0, 71.0, 69.0, 84.0, 94.0, 112.0, 91.0, 79.0, 75.0, 55.0, 33.0, 29.0, 15.0, 12.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.171875, -7.9898681640625, -7.807861328125, -7.6258544921875, -7.44384765625, -7.2618408203125, -7.079833984375, -6.8978271484375, -6.7158203125, -6.5338134765625, -6.351806640625, -6.1697998046875, -5.98779296875, -5.8057861328125, -5.623779296875, -5.4417724609375, -5.259765625, -5.0777587890625, -4.895751953125, -4.7137451171875, -4.53173828125, -4.3497314453125, -4.167724609375, -3.9857177734375, -3.8037109375, -3.6217041015625, -3.439697265625, -3.2576904296875, -3.07568359375, -2.8936767578125, -2.711669921875, -2.5296630859375, -2.34765625, -2.1656494140625, -1.983642578125, -1.8016357421875, -1.61962890625, -1.4376220703125, -1.255615234375, -1.0736083984375, -0.8916015625, -0.7095947265625, -0.527587890625, -0.3455810546875, -0.16357421875, 0.0184326171875, 0.200439453125, 0.3824462890625, 0.564453125, 0.7464599609375, 0.928466796875, 1.1104736328125, 1.29248046875, 1.4744873046875, 1.656494140625, 1.8385009765625, 2.0205078125, 2.2025146484375, 2.384521484375, 2.5665283203125, 2.74853515625, 2.9305419921875, 3.112548828125, 3.2945556640625, 3.4765625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 12.0, 28.0, 57.0, 145.0, 999.0, 4190117.0, 2634.0, 185.0, 63.0, 17.0, 12.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-87.5, -85.661865234375, -83.82373046875, -81.985595703125, -80.1474609375, -78.309326171875, -76.47119140625, -74.633056640625, -72.794921875, -70.956787109375, -69.11865234375, -67.280517578125, -65.4423828125, -63.604248046875, -61.76611328125, -59.927978515625, -58.08984375, -56.251708984375, -54.41357421875, -52.575439453125, -50.7373046875, -48.899169921875, -47.06103515625, -45.222900390625, -43.384765625, -41.546630859375, -39.70849609375, -37.870361328125, -36.0322265625, -34.194091796875, -32.35595703125, -30.517822265625, -28.6796875, -26.841552734375, -25.00341796875, -23.165283203125, -21.3271484375, -19.489013671875, -17.65087890625, -15.812744140625, -13.974609375, -12.136474609375, -10.29833984375, -8.460205078125, -6.6220703125, -4.783935546875, -2.94580078125, -1.107666015625, 0.73046875, 2.568603515625, 4.40673828125, 6.244873046875, 8.0830078125, 9.921142578125, 11.75927734375, 13.597412109375, 15.435546875, 17.273681640625, 19.11181640625, 20.949951171875, 22.7880859375, 24.626220703125, 26.46435546875, 28.302490234375, 30.140625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 6.0, 2.0, 11.0, 25.0, 31.0, 35.0, 49.0, 99.0, 145.0, 307.0, 674.0, 1305.0, 684.0, 302.0, 145.0, 89.0, 67.0, 38.0, 19.0, 14.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6435546875, -1.59130859375, -1.5390625, -1.48681640625, -1.4345703125, -1.38232421875, -1.330078125, -1.27783203125, -1.2255859375, -1.17333984375, -1.12109375, -1.06884765625, -1.0166015625, -0.96435546875, -0.912109375, -0.85986328125, -0.8076171875, -0.75537109375, -0.703125, -0.65087890625, -0.5986328125, -0.54638671875, -0.494140625, -0.44189453125, -0.3896484375, -0.33740234375, -0.28515625, -0.23291015625, -0.1806640625, -0.12841796875, -0.076171875, -0.02392578125, 0.0283203125, 0.08056640625, 0.1328125, 0.18505859375, 0.2373046875, 0.28955078125, 0.341796875, 0.39404296875, 0.4462890625, 0.49853515625, 0.55078125, 0.60302734375, 0.6552734375, 0.70751953125, 0.759765625, 0.81201171875, 0.8642578125, 0.91650390625, 0.96875, 1.02099609375, 1.0732421875, 1.12548828125, 1.177734375, 1.22998046875, 1.2822265625, 1.33447265625, 1.38671875, 1.43896484375, 1.4912109375, 1.54345703125, 1.595703125, 1.64794921875, 1.7001953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 13.0, 21.0, 29.0, 68.0, 119.0, 195.0, 178.0, 178.0, 101.0, 54.0, 28.0, 9.0, 11.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.76431655883789, -15.431965827941895, -15.099614143371582, -14.767263412475586, -14.434911727905273, -14.102560997009277, -13.770210266113281, -13.437858581542969, -13.105507850646973, -12.773157119750977, -12.440805435180664, -12.108454704284668, -11.776103973388672, -11.44375228881836, -11.111401557922363, -10.779050827026367, -10.446699142456055, -10.114348411560059, -9.781996726989746, -9.44964599609375, -9.117294311523438, -8.784943580627441, -8.452592849731445, -8.120241165161133, -7.787890434265137, -7.455539226531982, -7.123188018798828, -6.790837287902832, -6.458486080169678, -6.126134872436523, -5.793784141540527, -5.461432933807373, -5.129082679748535, -4.796731472015381, -4.464380264282227, -4.1320295333862305, -3.799678325653076, -3.467327117919922, -3.1349761486053467, -2.8026251792907715, -2.470273971557617, -2.137922763824463, -1.8055717945098877, -1.473220705986023, -1.1408696174621582, -0.8085185289382935, -0.4761674404144287, -0.14381647109985352, 0.18853473663330078, 0.5208858251571655, 0.8532369136810303, 1.185588002204895, 1.5179390907287598, 1.8502901792526245, 2.1826412677764893, 2.5149922370910645, 2.8473434448242188, 3.179694652557373, 3.5120456218719482, 3.8443965911865234, 4.176747798919678, 4.509099006652832, 4.841449737548828, 5.173800945281982, 5.506152153015137]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 5.0, 5.0, 5.0, 6.0, 6.0, 18.0, 15.0, 25.0, 26.0, 47.0, 32.0, 46.0, 40.0, 59.0, 54.0, 62.0, 69.0, 60.0, 67.0, 62.0, 61.0, 53.0, 54.0, 30.0, 23.0, 18.0, 18.0, 13.0, 10.0, 4.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.992746829986572, -4.8575592041015625, -4.722371578216553, -4.587183475494385, -4.451995849609375, -4.316808223724365, -4.1816205978393555, -4.046432971954346, -3.911245107650757, -3.776057481765747, -3.640869617462158, -3.5056819915771484, -3.3704943656921387, -3.23530650138855, -3.10011887550354, -2.964931011199951, -2.8297433853149414, -2.6945557594299316, -2.5593678951263428, -2.424180269241333, -2.288992404937744, -2.1538047790527344, -2.0186171531677246, -1.8834294080734253, -1.748241662979126, -1.6130539178848267, -1.4778661727905273, -1.3426785469055176, -1.2074908018112183, -1.072303056716919, -0.9371153712272644, -0.8019276857376099, -0.6667399406433105, -0.5315521955490112, -0.3963645100593567, -0.26117679476737976, -0.12598907947540283, 0.009198665618896484, 0.14438635110855103, 0.27957403659820557, 0.4147617816925049, 0.5499495267868042, 0.6851372122764587, 0.8203248977661133, 0.9555126428604126, 1.090700387954712, 1.2258880138397217, 1.361075758934021, 1.4962635040283203, 1.6314512491226196, 1.766638994216919, 1.9018266201019287, 2.0370144844055176, 2.1722021102905273, 2.307389736175537, 2.442577362060547, 2.5777652263641357, 2.7129528522491455, 2.8481407165527344, 2.983328342437744, 3.118515968322754, 3.2537038326263428, 3.3888914585113525, 3.5240793228149414, 3.659266948699951]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 8.0, 10.0, 18.0, 25.0, 39.0, 40.0, 72.0, 108.0, 149.0, 260.0, 467.0, 679.0, 1155.0, 1990.0, 3574.0, 6718.0, 14377.0, 36318.0, 114518.0, 378253.0, 333452.0, 97491.0, 31672.0, 12803.0, 6281.0, 3305.0, 1877.0, 1102.0, 657.0, 407.0, 258.0, 171.0, 99.0, 61.0, 40.0, 28.0, 29.0, 9.0, 12.0, 2.0, 5.0, 0.0, 3.0, 5.0, 1.0, 1.0, 5.0], "bins": [-1.2734375, -1.2389602661132812, -1.2044830322265625, -1.1700057983398438, -1.135528564453125, -1.1010513305664062, -1.0665740966796875, -1.0320968627929688, -0.99761962890625, -0.9631423950195312, -0.9286651611328125, -0.8941879272460938, -0.859710693359375, -0.8252334594726562, -0.7907562255859375, -0.7562789916992188, -0.7218017578125, -0.6873245239257812, -0.6528472900390625, -0.6183700561523438, -0.583892822265625, -0.5494155883789062, -0.5149383544921875, -0.48046112060546875, -0.44598388671875, -0.41150665283203125, -0.3770294189453125, -0.34255218505859375, -0.308074951171875, -0.27359771728515625, -0.2391204833984375, -0.20464324951171875, -0.170166015625, -0.13568878173828125, -0.1012115478515625, -0.06673431396484375, -0.032257080078125, 0.00222015380859375, 0.0366973876953125, 0.07117462158203125, 0.10565185546875, 0.14012908935546875, 0.1746063232421875, 0.20908355712890625, 0.243560791015625, 0.27803802490234375, 0.3125152587890625, 0.34699249267578125, 0.3814697265625, 0.41594696044921875, 0.4504241943359375, 0.48490142822265625, 0.519378662109375, 0.5538558959960938, 0.5883331298828125, 0.6228103637695312, 0.65728759765625, 0.6917648315429688, 0.7262420654296875, 0.7607192993164062, 0.795196533203125, 0.8296737670898438, 0.8641510009765625, 0.8986282348632812, 0.93310546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 4.0, 11.0, 12.0, 18.0, 39.0, 24.0, 41.0, 55.0, 60.0, 77.0, 70.0, 82.0, 88.0, 79.0, 66.0, 82.0, 60.0, 40.0, 29.0, 21.0, 13.0, 11.0, 10.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.46484375, -4.346405029296875, -4.22796630859375, -4.109527587890625, -3.9910888671875, -3.872650146484375, -3.75421142578125, -3.635772705078125, -3.517333984375, -3.398895263671875, -3.28045654296875, -3.162017822265625, -3.0435791015625, -2.925140380859375, -2.80670166015625, -2.688262939453125, -2.56982421875, -2.451385498046875, -2.33294677734375, -2.214508056640625, -2.0960693359375, -1.977630615234375, -1.85919189453125, -1.740753173828125, -1.622314453125, -1.503875732421875, -1.38543701171875, -1.266998291015625, -1.1485595703125, -1.030120849609375, -0.91168212890625, -0.793243408203125, -0.6748046875, -0.556365966796875, -0.43792724609375, -0.319488525390625, -0.2010498046875, -0.082611083984375, 0.03582763671875, 0.154266357421875, 0.272705078125, 0.391143798828125, 0.50958251953125, 0.628021240234375, 0.7464599609375, 0.864898681640625, 0.98333740234375, 1.101776123046875, 1.22021484375, 1.338653564453125, 1.45709228515625, 1.575531005859375, 1.6939697265625, 1.812408447265625, 1.93084716796875, 2.049285888671875, 2.167724609375, 2.286163330078125, 2.40460205078125, 2.523040771484375, 2.6414794921875, 2.759918212890625, 2.87835693359375, 2.996795654296875, 3.115234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 8.0, 6.0, 6.0, 7.0, 11.0, 11.0, 20.0, 16.0, 33.0, 57.0, 65.0, 122.0, 162.0, 261.0, 454.0, 770.0, 1418.0, 2752.0, 5952.0, 13823.0, 40045.0, 147418.0, 470631.0, 260065.0, 66986.0, 21064.0, 8371.0, 3673.0, 1810.0, 991.0, 565.0, 312.0, 213.0, 134.0, 98.0, 53.0, 40.0, 38.0, 29.0, 18.0, 6.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-0.9599609375, -0.9306106567382812, -0.9012603759765625, -0.8719100952148438, -0.842559814453125, -0.8132095336914062, -0.7838592529296875, -0.7545089721679688, -0.72515869140625, -0.6958084106445312, -0.6664581298828125, -0.6371078491210938, -0.607757568359375, -0.5784072875976562, -0.5490570068359375, -0.5197067260742188, -0.4903564453125, -0.46100616455078125, -0.4316558837890625, -0.40230560302734375, -0.372955322265625, -0.34360504150390625, -0.3142547607421875, -0.28490447998046875, -0.25555419921875, -0.22620391845703125, -0.1968536376953125, -0.16750335693359375, -0.138153076171875, -0.10880279541015625, -0.0794525146484375, -0.05010223388671875, -0.020751953125, 0.00859832763671875, 0.0379486083984375, 0.06729888916015625, 0.096649169921875, 0.12599945068359375, 0.1553497314453125, 0.18470001220703125, 0.21405029296875, 0.24340057373046875, 0.2727508544921875, 0.30210113525390625, 0.331451416015625, 0.36080169677734375, 0.3901519775390625, 0.41950225830078125, 0.4488525390625, 0.47820281982421875, 0.5075531005859375, 0.5369033813476562, 0.566253662109375, 0.5956039428710938, 0.6249542236328125, 0.6543045043945312, 0.68365478515625, 0.7130050659179688, 0.7423553466796875, 0.7717056274414062, 0.801055908203125, 0.8304061889648438, 0.8597564697265625, 0.8891067504882812, 0.91845703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 8.0, 7.0, 6.0, 8.0, 12.0, 15.0, 15.0, 19.0, 20.0, 29.0, 28.0, 29.0, 35.0, 42.0, 31.0, 38.0, 45.0, 38.0, 46.0, 32.0, 46.0, 49.0, 41.0, 38.0, 40.0, 34.0, 30.0, 26.0, 23.0, 27.0, 18.0, 14.0, 10.0, 11.0, 11.0, 13.0, 13.0, 12.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.4140625, -3.30328369140625, -3.1925048828125, -3.08172607421875, -2.970947265625, -2.86016845703125, -2.7493896484375, -2.63861083984375, -2.52783203125, -2.41705322265625, -2.3062744140625, -2.19549560546875, -2.084716796875, -1.97393798828125, -1.8631591796875, -1.75238037109375, -1.6416015625, -1.53082275390625, -1.4200439453125, -1.30926513671875, -1.198486328125, -1.08770751953125, -0.9769287109375, -0.86614990234375, -0.75537109375, -0.64459228515625, -0.5338134765625, -0.42303466796875, -0.312255859375, -0.20147705078125, -0.0906982421875, 0.02008056640625, 0.130859375, 0.24163818359375, 0.3524169921875, 0.46319580078125, 0.573974609375, 0.68475341796875, 0.7955322265625, 0.90631103515625, 1.01708984375, 1.12786865234375, 1.2386474609375, 1.34942626953125, 1.460205078125, 1.57098388671875, 1.6817626953125, 1.79254150390625, 1.9033203125, 2.01409912109375, 2.1248779296875, 2.23565673828125, 2.346435546875, 2.45721435546875, 2.5679931640625, 2.67877197265625, 2.78955078125, 2.90032958984375, 3.0111083984375, 3.12188720703125, 3.232666015625, 3.34344482421875, 3.4542236328125, 3.56500244140625, 3.67578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 18.0, 14.0, 26.0, 39.0, 71.0, 136.0, 160.0, 290.0, 474.0, 831.0, 1614.0, 3300.0, 7315.0, 18005.0, 56233.0, 257369.0, 532304.0, 117515.0, 31218.0, 11637.0, 4852.0, 2283.0, 1221.0, 693.0, 347.0, 219.0, 130.0, 74.0, 50.0, 35.0, 26.0, 15.0, 7.0, 4.0, 9.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.35498046875, -0.34430694580078125, -0.3336334228515625, -0.32295989990234375, -0.312286376953125, -0.30161285400390625, -0.2909393310546875, -0.28026580810546875, -0.26959228515625, -0.25891876220703125, -0.2482452392578125, -0.23757171630859375, -0.226898193359375, -0.21622467041015625, -0.2055511474609375, -0.19487762451171875, -0.1842041015625, -0.17353057861328125, -0.1628570556640625, -0.15218353271484375, -0.141510009765625, -0.13083648681640625, -0.1201629638671875, -0.10948944091796875, -0.09881591796875, -0.08814239501953125, -0.0774688720703125, -0.06679534912109375, -0.056121826171875, -0.04544830322265625, -0.0347747802734375, -0.02410125732421875, -0.013427734375, -0.00275421142578125, 0.0079193115234375, 0.01859283447265625, 0.029266357421875, 0.03993988037109375, 0.0506134033203125, 0.06128692626953125, 0.07196044921875, 0.08263397216796875, 0.0933074951171875, 0.10398101806640625, 0.114654541015625, 0.12532806396484375, 0.1360015869140625, 0.14667510986328125, 0.1573486328125, 0.16802215576171875, 0.1786956787109375, 0.18936920166015625, 0.200042724609375, 0.21071624755859375, 0.2213897705078125, 0.23206329345703125, 0.24273681640625, 0.25341033935546875, 0.2640838623046875, 0.27475738525390625, 0.285430908203125, 0.29610443115234375, 0.3067779541015625, 0.31745147705078125, 0.328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 4.0, 7.0, 12.0, 30.0, 25.0, 51.0, 91.0, 123.0, 155.0, 153.0, 112.0, 63.0, 43.0, 38.0, 17.0, 16.0, 12.0, 7.0, 8.0, 7.0, 7.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002105236053466797, -0.00019943341612815857, -0.00018834322690963745, -0.00017725303769111633, -0.00016616284847259521, -0.0001550726592540741, -0.00014398247003555298, -0.00013289228081703186, -0.00012180209159851074, -0.00011071190237998962, -9.96217131614685e-05, -8.853152394294739e-05, -7.744133472442627e-05, -6.635114550590515e-05, -5.526095628738403e-05, -4.4170767068862915e-05, -3.30805778503418e-05, -2.199038863182068e-05, -1.090019941329956e-05, 1.8998980522155762e-07, 1.1280179023742676e-05, 2.2370368242263794e-05, 3.346055746078491e-05, 4.455074667930603e-05, 5.564093589782715e-05, 6.673112511634827e-05, 7.782131433486938e-05, 8.89115035533905e-05, 0.00010000169277191162, 0.00011109188199043274, 0.00012218207120895386, 0.00013327226042747498, 0.0001443624496459961, 0.0001554526388645172, 0.00016654282808303833, 0.00017763301730155945, 0.00018872320652008057, 0.00019981339573860168, 0.0002109035849571228, 0.00022199377417564392, 0.00023308396339416504, 0.00024417415261268616, 0.0002552643418312073, 0.0002663545310497284, 0.0002774447202682495, 0.00028853490948677063, 0.00029962509870529175, 0.00031071528792381287, 0.000321805477142334, 0.0003328956663608551, 0.0003439858555793762, 0.00035507604479789734, 0.00036616623401641846, 0.0003772564232349396, 0.0003883466124534607, 0.0003994368016719818, 0.00041052699089050293, 0.00042161718010902405, 0.00043270736932754517, 0.0004437975585460663, 0.0004548877477645874, 0.0004659779369831085, 0.00047706812620162964, 0.00048815831542015076, 0.0004992485046386719]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 7.0, 11.0, 17.0, 10.0, 22.0, 14.0, 32.0, 51.0, 62.0, 99.0, 210.0, 426.0, 978.0, 2767.0, 10401.0, 98433.0, 860371.0, 62425.0, 8180.0, 2253.0, 853.0, 413.0, 186.0, 100.0, 59.0, 38.0, 31.0, 22.0, 10.0, 10.0, 11.0, 12.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8740234375, -0.8470687866210938, -0.8201141357421875, -0.7931594848632812, -0.766204833984375, -0.7392501831054688, -0.7122955322265625, -0.6853408813476562, -0.65838623046875, -0.6314315795898438, -0.6044769287109375, -0.5775222778320312, -0.550567626953125, -0.5236129760742188, -0.4966583251953125, -0.46970367431640625, -0.4427490234375, -0.41579437255859375, -0.3888397216796875, -0.36188507080078125, -0.334930419921875, -0.30797576904296875, -0.2810211181640625, -0.25406646728515625, -0.22711181640625, -0.20015716552734375, -0.1732025146484375, -0.14624786376953125, -0.119293212890625, -0.09233856201171875, -0.0653839111328125, -0.03842926025390625, -0.011474609375, 0.01548004150390625, 0.0424346923828125, 0.06938934326171875, 0.096343994140625, 0.12329864501953125, 0.1502532958984375, 0.17720794677734375, 0.20416259765625, 0.23111724853515625, 0.2580718994140625, 0.28502655029296875, 0.311981201171875, 0.33893585205078125, 0.3658905029296875, 0.39284515380859375, 0.4197998046875, 0.44675445556640625, 0.4737091064453125, 0.5006637573242188, 0.527618408203125, 0.5545730590820312, 0.5815277099609375, 0.6084823608398438, 0.63543701171875, 0.6623916625976562, 0.6893463134765625, 0.7163009643554688, 0.743255615234375, 0.7702102661132812, 0.7971649169921875, 0.8241195678710938, 0.85107421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 7.0, 9.0, 9.0, 22.0, 12.0, 17.0, 23.0, 42.0, 40.0, 49.0, 67.0, 72.0, 70.0, 105.0, 80.0, 79.0, 56.0, 49.0, 37.0, 31.0, 28.0, 21.0, 13.0, 9.0, 9.0, 6.0, 7.0, 5.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08489990234375, -0.08214282989501953, -0.07938575744628906, -0.0766286849975586, -0.07387161254882812, -0.07111454010009766, -0.06835746765136719, -0.06560039520263672, -0.06284332275390625, -0.06008625030517578, -0.05732917785644531, -0.054572105407714844, -0.051815032958984375, -0.049057960510253906, -0.04630088806152344, -0.04354381561279297, -0.0407867431640625, -0.03802967071533203, -0.03527259826660156, -0.032515525817871094, -0.029758453369140625, -0.027001380920410156, -0.024244308471679688, -0.02148723602294922, -0.01873016357421875, -0.01597309112548828, -0.013216018676757812, -0.010458946228027344, -0.007701873779296875, -0.004944801330566406, -0.0021877288818359375, 0.0005693435668945312, 0.003326416015625, 0.006083488464355469, 0.008840560913085938, 0.011597633361816406, 0.014354705810546875, 0.017111778259277344, 0.019868850708007812, 0.02262592315673828, 0.02538299560546875, 0.02814006805419922, 0.030897140502929688, 0.033654212951660156, 0.036411285400390625, 0.039168357849121094, 0.04192543029785156, 0.04468250274658203, 0.0474395751953125, 0.05019664764404297, 0.05295372009277344, 0.055710792541503906, 0.058467864990234375, 0.061224937438964844, 0.06398200988769531, 0.06673908233642578, 0.06949615478515625, 0.07225322723388672, 0.07501029968261719, 0.07776737213134766, 0.08052444458007812, 0.0832815170288086, 0.08603858947753906, 0.08879566192626953, 0.091552734375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 32.0, 44.0, 103.0, 234.0, 246.0, 189.0, 62.0, 46.0, 22.0, 7.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.347467422485352, -12.080865859985352, -11.814263343811035, -11.547661781311035, -11.281060218811035, -11.014457702636719, -10.747856140136719, -10.481254577636719, -10.214653015136719, -9.948051452636719, -9.681448936462402, -9.414847373962402, -9.148245811462402, -8.881643295288086, -8.615041732788086, -8.348440170288086, -8.08183765411377, -7.815235614776611, -7.548634052276611, -7.282032012939453, -7.015430450439453, -6.748828411102295, -6.482226371765137, -6.215624809265137, -5.9490227699279785, -5.68242073059082, -5.41581916809082, -5.149217128753662, -4.882615089416504, -4.616013526916504, -4.349411487579346, -4.0828094482421875, -3.8162078857421875, -3.5496060848236084, -3.2830042839050293, -3.016402244567871, -2.749800443649292, -2.483198642730713, -2.2165966033935547, -1.9499948024749756, -1.6833930015563965, -1.4167912006378174, -1.1501892805099487, -0.8835874199867249, -0.616985559463501, -0.3503837585449219, -0.08378183841705322, 0.18282008171081543, 0.44942188262939453, 0.7160237431526184, 0.9826256036758423, 1.249227523803711, 1.51582932472229, 1.7824311256408691, 2.0490331649780273, 2.3156349658966064, 2.5822367668151855, 2.8488385677337646, 3.1154403686523438, 3.382042407989502, 3.648644208908081, 3.91524600982666, 4.181848049163818, 4.448450088500977, 4.715051651000977]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 5.0, 7.0, 19.0, 23.0, 29.0, 43.0, 61.0, 45.0, 60.0, 80.0, 74.0, 91.0, 91.0, 74.0, 75.0, 66.0, 47.0, 22.0, 32.0, 15.0, 13.0, 8.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.14798641204834, -4.033320426940918, -3.918654203414917, -3.803987979888916, -3.689321994781494, -3.574655771255493, -3.459989547729492, -3.3453235626220703, -3.2306575775146484, -3.1159913539886475, -3.0013253688812256, -2.8866591453552246, -2.7719931602478027, -2.6573269367218018, -2.542660713195801, -2.427994728088379, -2.313328504562378, -2.198662281036377, -2.083996295928955, -1.969330072402954, -1.8546640872955322, -1.7399978637695312, -1.6253317594528198, -1.5106656551361084, -1.395999550819397, -1.2813334465026855, -1.1666673421859741, -1.0520012378692627, -0.9373350739479065, -0.8226689696311951, -0.7080028057098389, -0.5933367013931274, -0.4786708354949951, -0.3640047311782837, -0.24933859705924988, -0.13467246294021606, -0.02000635862350464, 0.09465974569320679, 0.209325909614563, 0.3239920139312744, 0.43865811824798584, 0.5533242225646973, 0.6679903268814087, 0.7826564908027649, 0.8973225951194763, 1.011988639831543, 1.126654863357544, 1.2413209676742554, 1.3559870719909668, 1.4706531763076782, 1.5853192806243896, 1.6999855041503906, 1.8146514892578125, 1.9293177127838135, 2.0439839363098145, 2.1586499214172363, 2.273315906524658, 2.387982130050659, 2.502648115158081, 2.617314338684082, 2.731980323791504, 2.846646547317505, 2.961312770843506, 3.0759787559509277, 3.1906449794769287]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 12.0, 8.0, 19.0, 24.0, 30.0, 48.0, 94.0, 124.0, 210.0, 366.0, 604.0, 991.0, 1683.0, 3011.0, 5455.0, 10718.0, 22240.0, 60584.0, 360490.0, 459299.0, 72454.0, 24917.0, 11353.0, 5982.0, 3225.0, 1883.0, 1032.0, 636.0, 382.0, 246.0, 131.0, 111.0, 60.0, 51.0, 27.0, 18.0, 4.0, 8.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-2.4140625, -2.34521484375, -2.2763671875, -2.20751953125, -2.138671875, -2.06982421875, -2.0009765625, -1.93212890625, -1.86328125, -1.79443359375, -1.7255859375, -1.65673828125, -1.587890625, -1.51904296875, -1.4501953125, -1.38134765625, -1.3125, -1.24365234375, -1.1748046875, -1.10595703125, -1.037109375, -0.96826171875, -0.8994140625, -0.83056640625, -0.76171875, -0.69287109375, -0.6240234375, -0.55517578125, -0.486328125, -0.41748046875, -0.3486328125, -0.27978515625, -0.2109375, -0.14208984375, -0.0732421875, -0.00439453125, 0.064453125, 0.13330078125, 0.2021484375, 0.27099609375, 0.33984375, 0.40869140625, 0.4775390625, 0.54638671875, 0.615234375, 0.68408203125, 0.7529296875, 0.82177734375, 0.890625, 0.95947265625, 1.0283203125, 1.09716796875, 1.166015625, 1.23486328125, 1.3037109375, 1.37255859375, 1.44140625, 1.51025390625, 1.5791015625, 1.64794921875, 1.716796875, 1.78564453125, 1.8544921875, 1.92333984375, 1.9921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 13.0, 12.0, 16.0, 20.0, 15.0, 29.0, 23.0, 34.0, 49.0, 25.0, 46.0, 52.0, 42.0, 61.0, 40.0, 47.0, 42.0, 52.0, 46.0, 45.0, 29.0, 39.0, 23.0, 34.0, 22.0, 17.0, 18.0, 10.0, 15.0, 7.0, 13.0, 9.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.63671875, -5.4742431640625, -5.311767578125, -5.1492919921875, -4.98681640625, -4.8243408203125, -4.661865234375, -4.4993896484375, -4.3369140625, -4.1744384765625, -4.011962890625, -3.8494873046875, -3.68701171875, -3.5245361328125, -3.362060546875, -3.1995849609375, -3.037109375, -2.8746337890625, -2.712158203125, -2.5496826171875, -2.38720703125, -2.2247314453125, -2.062255859375, -1.8997802734375, -1.7373046875, -1.5748291015625, -1.412353515625, -1.2498779296875, -1.08740234375, -0.9249267578125, -0.762451171875, -0.5999755859375, -0.4375, -0.2750244140625, -0.112548828125, 0.0499267578125, 0.21240234375, 0.3748779296875, 0.537353515625, 0.6998291015625, 0.8623046875, 1.0247802734375, 1.187255859375, 1.3497314453125, 1.51220703125, 1.6746826171875, 1.837158203125, 1.9996337890625, 2.162109375, 2.3245849609375, 2.487060546875, 2.6495361328125, 2.81201171875, 2.9744873046875, 3.136962890625, 3.2994384765625, 3.4619140625, 3.6243896484375, 3.786865234375, 3.9493408203125, 4.11181640625, 4.2742919921875, 4.436767578125, 4.5992431640625, 4.76171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 1.0, 9.0, 8.0, 6.0, 15.0, 16.0, 19.0, 15.0, 27.0, 32.0, 30.0, 29.0, 47.0, 46.0, 68.0, 78.0, 331.0, 8335.0, 1032146.0, 6557.0, 277.0, 95.0, 57.0, 38.0, 38.0, 46.0, 17.0, 27.0, 25.0, 20.0, 19.0, 22.0, 10.0, 7.0, 4.0, 6.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.5625, -18.0535888671875, -17.544677734375, -17.0357666015625, -16.52685546875, -16.0179443359375, -15.509033203125, -15.0001220703125, -14.4912109375, -13.9822998046875, -13.473388671875, -12.9644775390625, -12.45556640625, -11.9466552734375, -11.437744140625, -10.9288330078125, -10.419921875, -9.9110107421875, -9.402099609375, -8.8931884765625, -8.38427734375, -7.8753662109375, -7.366455078125, -6.8575439453125, -6.3486328125, -5.8397216796875, -5.330810546875, -4.8218994140625, -4.31298828125, -3.8040771484375, -3.295166015625, -2.7862548828125, -2.27734375, -1.7684326171875, -1.259521484375, -0.7506103515625, -0.24169921875, 0.2672119140625, 0.776123046875, 1.2850341796875, 1.7939453125, 2.3028564453125, 2.811767578125, 3.3206787109375, 3.82958984375, 4.3385009765625, 4.847412109375, 5.3563232421875, 5.865234375, 6.3741455078125, 6.883056640625, 7.3919677734375, 7.90087890625, 8.4097900390625, 8.918701171875, 9.4276123046875, 9.9365234375, 10.4454345703125, 10.954345703125, 11.4632568359375, 11.97216796875, 12.4810791015625, 12.989990234375, 13.4989013671875, 14.0078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 3.0, 8.0, 14.0, 5.0, 11.0, 16.0, 19.0, 19.0, 33.0, 25.0, 33.0, 23.0, 39.0, 35.0, 51.0, 48.0, 51.0, 54.0, 37.0, 38.0, 41.0, 51.0, 36.0, 35.0, 46.0, 34.0, 18.0, 29.0, 23.0, 18.0, 22.0, 20.0, 12.0, 11.0, 5.0, 8.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.6875, -6.50421142578125, -6.3209228515625, -6.13763427734375, -5.954345703125, -5.77105712890625, -5.5877685546875, -5.40447998046875, -5.22119140625, -5.03790283203125, -4.8546142578125, -4.67132568359375, -4.488037109375, -4.30474853515625, -4.1214599609375, -3.93817138671875, -3.7548828125, -3.57159423828125, -3.3883056640625, -3.20501708984375, -3.021728515625, -2.83843994140625, -2.6551513671875, -2.47186279296875, -2.28857421875, -2.10528564453125, -1.9219970703125, -1.73870849609375, -1.555419921875, -1.37213134765625, -1.1888427734375, -1.00555419921875, -0.822265625, -0.63897705078125, -0.4556884765625, -0.27239990234375, -0.089111328125, 0.09417724609375, 0.2774658203125, 0.46075439453125, 0.64404296875, 0.82733154296875, 1.0106201171875, 1.19390869140625, 1.377197265625, 1.56048583984375, 1.7437744140625, 1.92706298828125, 2.1103515625, 2.29364013671875, 2.4769287109375, 2.66021728515625, 2.843505859375, 3.02679443359375, 3.2100830078125, 3.39337158203125, 3.57666015625, 3.75994873046875, 3.9432373046875, 4.12652587890625, 4.309814453125, 4.49310302734375, 4.6763916015625, 4.85968017578125, 5.04296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 7.0, 13.0, 8.0, 20.0, 25.0, 37.0, 59.0, 93.0, 139.0, 222.0, 365.0, 657.0, 1382.0, 3288.0, 9069.0, 32897.0, 703880.0, 254593.0, 27883.0, 8064.0, 2946.0, 1283.0, 632.0, 351.0, 217.0, 134.0, 83.0, 60.0, 40.0, 20.0, 23.0, 13.0, 6.0, 11.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2958984375, -1.256561279296875, -1.21722412109375, -1.177886962890625, -1.1385498046875, -1.099212646484375, -1.05987548828125, -1.020538330078125, -0.981201171875, -0.941864013671875, -0.90252685546875, -0.863189697265625, -0.8238525390625, -0.784515380859375, -0.74517822265625, -0.705841064453125, -0.66650390625, -0.627166748046875, -0.58782958984375, -0.548492431640625, -0.5091552734375, -0.469818115234375, -0.43048095703125, -0.391143798828125, -0.351806640625, -0.312469482421875, -0.27313232421875, -0.233795166015625, -0.1944580078125, -0.155120849609375, -0.11578369140625, -0.076446533203125, -0.037109375, 0.002227783203125, 0.04156494140625, 0.080902099609375, 0.1202392578125, 0.159576416015625, 0.19891357421875, 0.238250732421875, 0.277587890625, 0.316925048828125, 0.35626220703125, 0.395599365234375, 0.4349365234375, 0.474273681640625, 0.51361083984375, 0.552947998046875, 0.59228515625, 0.631622314453125, 0.67095947265625, 0.710296630859375, 0.7496337890625, 0.788970947265625, 0.82830810546875, 0.867645263671875, 0.906982421875, 0.946319580078125, 0.98565673828125, 1.024993896484375, 1.0643310546875, 1.103668212890625, 1.14300537109375, 1.182342529296875, 1.2216796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 2.0, 5.0, 8.0, 22.0, 16.0, 23.0, 30.0, 55.0, 114.0, 236.0, 226.0, 83.0, 65.0, 25.0, 19.0, 13.0, 5.0, 8.0, 7.0, 3.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016188621520996094, -0.0001572445034980774, -0.00015260279178619385, -0.0001479610800743103, -0.00014331936836242676, -0.0001386776566505432, -0.00013403594493865967, -0.00012939423322677612, -0.00012475252151489258, -0.00012011080980300903, -0.00011546909809112549, -0.00011082738637924194, -0.0001061856746673584, -0.00010154396295547485, -9.690225124359131e-05, -9.226053953170776e-05, -8.761882781982422e-05, -8.297711610794067e-05, -7.833540439605713e-05, -7.369369268417358e-05, -6.905198097229004e-05, -6.44102692604065e-05, -5.976855754852295e-05, -5.5126845836639404e-05, -5.048513412475586e-05, -4.5843422412872314e-05, -4.120171070098877e-05, -3.6559998989105225e-05, -3.191828727722168e-05, -2.7276575565338135e-05, -2.263486385345459e-05, -1.7993152141571045e-05, -1.33514404296875e-05, -8.709728717803955e-06, -4.06801700592041e-06, 5.736947059631348e-07, 5.21540641784668e-06, 9.857118129730225e-06, 1.449882984161377e-05, 1.9140541553497314e-05, 2.378225326538086e-05, 2.8423964977264404e-05, 3.306567668914795e-05, 3.7707388401031494e-05, 4.234910011291504e-05, 4.6990811824798584e-05, 5.163252353668213e-05, 5.6274235248565674e-05, 6.091594696044922e-05, 6.555765867233276e-05, 7.019937038421631e-05, 7.484108209609985e-05, 7.94827938079834e-05, 8.412450551986694e-05, 8.876621723175049e-05, 9.340792894363403e-05, 9.804964065551758e-05, 0.00010269135236740112, 0.00010733306407928467, 0.00011197477579116821, 0.00011661648750305176, 0.0001212581992149353, 0.00012589991092681885, 0.0001305416226387024, 0.00013518333435058594]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 1.0, 6.0, 12.0, 13.0, 12.0, 19.0, 25.0, 56.0, 56.0, 85.0, 92.0, 167.0, 301.0, 444.0, 869.0, 1661.0, 3638.0, 9532.0, 32619.0, 288354.0, 655372.0, 36902.0, 10306.0, 3903.0, 1795.0, 905.0, 555.0, 294.0, 197.0, 119.0, 82.0, 55.0, 30.0, 19.0, 17.0, 12.0, 5.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.028076171875, -0.99267578125, -0.957275390625, -0.921875, -0.886474609375, -0.85107421875, -0.815673828125, -0.7802734375, -0.744873046875, -0.70947265625, -0.674072265625, -0.638671875, -0.603271484375, -0.56787109375, -0.532470703125, -0.4970703125, -0.461669921875, -0.42626953125, -0.390869140625, -0.35546875, -0.320068359375, -0.28466796875, -0.249267578125, -0.2138671875, -0.178466796875, -0.14306640625, -0.107666015625, -0.072265625, -0.036865234375, -0.00146484375, 0.033935546875, 0.0693359375, 0.104736328125, 0.14013671875, 0.175537109375, 0.2109375, 0.246337890625, 0.28173828125, 0.317138671875, 0.3525390625, 0.387939453125, 0.42333984375, 0.458740234375, 0.494140625, 0.529541015625, 0.56494140625, 0.600341796875, 0.6357421875, 0.671142578125, 0.70654296875, 0.741943359375, 0.77734375, 0.812744140625, 0.84814453125, 0.883544921875, 0.9189453125, 0.954345703125, 0.98974609375, 1.025146484375, 1.060546875, 1.095947265625, 1.13134765625, 1.166748046875, 1.2021484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 4.0, 9.0, 16.0, 14.0, 13.0, 20.0, 30.0, 44.0, 88.0, 400.0, 142.0, 55.0, 37.0, 35.0, 21.0, 10.0, 15.0, 8.0, 6.0, 2.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5880203247070312, -0.5715484619140625, -0.5550765991210938, -0.538604736328125, -0.5221328735351562, -0.5056610107421875, -0.48918914794921875, -0.47271728515625, -0.45624542236328125, -0.4397735595703125, -0.42330169677734375, -0.406829833984375, -0.39035797119140625, -0.3738861083984375, -0.35741424560546875, -0.3409423828125, -0.32447052001953125, -0.3079986572265625, -0.29152679443359375, -0.275054931640625, -0.25858306884765625, -0.2421112060546875, -0.22563934326171875, -0.20916748046875, -0.19269561767578125, -0.1762237548828125, -0.15975189208984375, -0.143280029296875, -0.12680816650390625, -0.1103363037109375, -0.09386444091796875, -0.077392578125, -0.06092071533203125, -0.0444488525390625, -0.02797698974609375, -0.011505126953125, 0.00496673583984375, 0.0214385986328125, 0.03791046142578125, 0.05438232421875, 0.07085418701171875, 0.0873260498046875, 0.10379791259765625, 0.120269775390625, 0.13674163818359375, 0.1532135009765625, 0.16968536376953125, 0.1861572265625, 0.20262908935546875, 0.2191009521484375, 0.23557281494140625, 0.252044677734375, 0.26851654052734375, 0.2849884033203125, 0.30146026611328125, 0.31793212890625, 0.33440399169921875, 0.3508758544921875, 0.36734771728515625, 0.383819580078125, 0.40029144287109375, 0.4167633056640625, 0.43323516845703125, 0.44970703125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 9.0, 26.0, 58.0, 167.0, 315.0, 254.0, 106.0, 41.0, 15.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.3998908996582, -32.76668167114258, -32.13346862792969, -31.500259399414062, -30.867048263549805, -30.233837127685547, -29.60062599182129, -28.96741485595703, -28.334205627441406, -27.70099449157715, -27.06778335571289, -26.434574127197266, -25.801362991333008, -25.16815185546875, -24.534940719604492, -23.901729583740234, -23.26852035522461, -22.63530921936035, -22.002098083496094, -21.36888885498047, -20.73567771911621, -20.102466583251953, -19.469255447387695, -18.836044311523438, -18.20283317565918, -17.569622039794922, -16.936410903930664, -16.30320167541504, -15.669990539550781, -15.036779403686523, -14.403568267822266, -13.770358085632324, -13.1371488571167, -12.503937721252441, -11.8707275390625, -11.237516403198242, -10.6043062210083, -9.971095085144043, -9.337884902954102, -8.704673767089844, -8.071462631225586, -7.438251972198486, -6.805041313171387, -6.171830177307129, -5.5386199951171875, -4.90540885925293, -4.27219820022583, -3.6389875411987305, -3.005777359008789, -2.3725666999816895, -1.7393559217453003, -1.1061451435089111, -0.4729344844818115, 0.16027617454528809, 0.7934870719909668, 1.4266977310180664, 2.059908390045166, 2.6931190490722656, 3.3263297080993652, 3.959540605545044, 4.592751502990723, 5.225961685180664, 5.859172821044922, 6.4923834800720215, 7.125594139099121]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 11.0, 14.0, 17.0, 17.0, 14.0, 17.0, 28.0, 24.0, 31.0, 41.0, 33.0, 36.0, 45.0, 52.0, 47.0, 48.0, 43.0, 53.0, 49.0, 47.0, 31.0, 47.0, 35.0, 35.0, 27.0, 29.0, 28.0, 15.0, 12.0, 16.0, 16.0, 9.0, 9.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.205902099609375, -9.90009593963623, -9.594289779663086, -9.288483619689941, -8.982677459716797, -8.676871299743652, -8.371065139770508, -8.065258979797363, -7.759452819824219, -7.453646659851074, -7.14784049987793, -6.842034339904785, -6.536228179931641, -6.230422019958496, -5.924615859985352, -5.618809700012207, -5.3130035400390625, -5.007197380065918, -4.701391220092773, -4.395585060119629, -4.089778900146484, -3.78397274017334, -3.4781665802001953, -3.172360420227051, -2.8665542602539062, -2.5607481002807617, -2.254941940307617, -1.9491357803344727, -1.6433296203613281, -1.3375234603881836, -1.031717300415039, -0.7259111404418945, -0.42010498046875, -0.11429882049560547, 0.19150733947753906, 0.4973134994506836, 0.8031196594238281, 1.1089258193969727, 1.4147319793701172, 1.7205381393432617, 2.0263442993164062, 2.332150459289551, 2.6379566192626953, 2.94376277923584, 3.2495689392089844, 3.555375099182129, 3.8611812591552734, 4.166987419128418, 4.4727935791015625, 4.778599739074707, 5.084405899047852, 5.390212059020996, 5.696018218994141, 6.001824378967285, 6.30763053894043, 6.613436698913574, 6.919242858886719, 7.225049018859863, 7.530855178833008, 7.836661338806152, 8.142467498779297, 8.448273658752441, 8.754079818725586, 9.05988597869873, 9.365692138671875]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 6.0, 5.0, 9.0, 10.0, 17.0, 9.0, 13.0, 25.0, 38.0, 34.0, 63.0, 113.0, 199.0, 330.0, 718.0, 1531.0, 4072.0, 13613.0, 70164.0, 1661647.0, 2336200.0, 82939.0, 14835.0, 4480.0, 1664.0, 701.0, 348.0, 171.0, 103.0, 81.0, 42.0, 32.0, 21.0, 13.0, 10.0, 5.0, 6.0, 12.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.52886962890625, -5.3507080078125, -5.17254638671875, -4.994384765625, -4.81622314453125, -4.6380615234375, -4.45989990234375, -4.28173828125, -4.10357666015625, -3.9254150390625, -3.74725341796875, -3.569091796875, -3.39093017578125, -3.2127685546875, -3.03460693359375, -2.8564453125, -2.67828369140625, -2.5001220703125, -2.32196044921875, -2.143798828125, -1.96563720703125, -1.7874755859375, -1.60931396484375, -1.43115234375, -1.25299072265625, -1.0748291015625, -0.89666748046875, -0.718505859375, -0.54034423828125, -0.3621826171875, -0.18402099609375, -0.005859375, 0.17230224609375, 0.3504638671875, 0.52862548828125, 0.706787109375, 0.88494873046875, 1.0631103515625, 1.24127197265625, 1.41943359375, 1.59759521484375, 1.7757568359375, 1.95391845703125, 2.132080078125, 2.31024169921875, 2.4884033203125, 2.66656494140625, 2.8447265625, 3.02288818359375, 3.2010498046875, 3.37921142578125, 3.557373046875, 3.73553466796875, 3.9136962890625, 4.09185791015625, 4.27001953125, 4.44818115234375, 4.6263427734375, 4.80450439453125, 4.982666015625, 5.16082763671875, 5.3389892578125, 5.51715087890625, 5.6953125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 4.0, 24.0, 24.0, 30.0, 35.0, 55.0, 60.0, 72.0, 81.0, 88.0, 87.0, 77.0, 110.0, 69.0, 49.0, 41.0, 20.0, 22.0, 14.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2109375, -5.073486328125, -4.93603515625, -4.798583984375, -4.6611328125, -4.523681640625, -4.38623046875, -4.248779296875, -4.111328125, -3.973876953125, -3.83642578125, -3.698974609375, -3.5615234375, -3.424072265625, -3.28662109375, -3.149169921875, -3.01171875, -2.874267578125, -2.73681640625, -2.599365234375, -2.4619140625, -2.324462890625, -2.18701171875, -2.049560546875, -1.912109375, -1.774658203125, -1.63720703125, -1.499755859375, -1.3623046875, -1.224853515625, -1.08740234375, -0.949951171875, -0.8125, -0.675048828125, -0.53759765625, -0.400146484375, -0.2626953125, -0.125244140625, 0.01220703125, 0.149658203125, 0.287109375, 0.424560546875, 0.56201171875, 0.699462890625, 0.8369140625, 0.974365234375, 1.11181640625, 1.249267578125, 1.38671875, 1.524169921875, 1.66162109375, 1.799072265625, 1.9365234375, 2.073974609375, 2.21142578125, 2.348876953125, 2.486328125, 2.623779296875, 2.76123046875, 2.898681640625, 3.0361328125, 3.173583984375, 3.31103515625, 3.448486328125, 3.5859375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 16.0, 50.0, 280.0, 18906.0, 4173348.0, 1513.0, 128.0, 27.0, 8.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.046875, -22.967529296875, -21.88818359375, -20.808837890625, -19.7294921875, -18.650146484375, -17.57080078125, -16.491455078125, -15.412109375, -14.332763671875, -13.25341796875, -12.174072265625, -11.0947265625, -10.015380859375, -8.93603515625, -7.856689453125, -6.77734375, -5.697998046875, -4.61865234375, -3.539306640625, -2.4599609375, -1.380615234375, -0.30126953125, 0.778076171875, 1.857421875, 2.936767578125, 4.01611328125, 5.095458984375, 6.1748046875, 7.254150390625, 8.33349609375, 9.412841796875, 10.4921875, 11.571533203125, 12.65087890625, 13.730224609375, 14.8095703125, 15.888916015625, 16.96826171875, 18.047607421875, 19.126953125, 20.206298828125, 21.28564453125, 22.364990234375, 23.4443359375, 24.523681640625, 25.60302734375, 26.682373046875, 27.76171875, 28.841064453125, 29.92041015625, 30.999755859375, 32.0791015625, 33.158447265625, 34.23779296875, 35.317138671875, 36.396484375, 37.475830078125, 38.55517578125, 39.634521484375, 40.7138671875, 41.793212890625, 42.87255859375, 43.951904296875, 45.03125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 8.0, 4.0, 7.0, 11.0, 12.0, 24.0, 34.0, 33.0, 44.0, 60.0, 121.0, 172.0, 305.0, 521.0, 1050.0, 669.0, 338.0, 206.0, 138.0, 99.0, 68.0, 27.0, 30.0, 22.0, 13.0, 12.0, 9.0, 9.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.2490997314453125, -1.214019775390625, -1.1789398193359375, -1.14385986328125, -1.1087799072265625, -1.073699951171875, -1.0386199951171875, -1.0035400390625, -0.9684600830078125, -0.933380126953125, -0.8983001708984375, -0.86322021484375, -0.8281402587890625, -0.793060302734375, -0.7579803466796875, -0.722900390625, -0.6878204345703125, -0.652740478515625, -0.6176605224609375, -0.58258056640625, -0.5475006103515625, -0.512420654296875, -0.4773406982421875, -0.4422607421875, -0.4071807861328125, -0.372100830078125, -0.3370208740234375, -0.30194091796875, -0.2668609619140625, -0.231781005859375, -0.1967010498046875, -0.16162109375, -0.1265411376953125, -0.091461181640625, -0.0563812255859375, -0.02130126953125, 0.0137786865234375, 0.048858642578125, 0.0839385986328125, 0.1190185546875, 0.1540985107421875, 0.189178466796875, 0.2242584228515625, 0.25933837890625, 0.2944183349609375, 0.329498291015625, 0.3645782470703125, 0.399658203125, 0.4347381591796875, 0.469818115234375, 0.5048980712890625, 0.53997802734375, 0.5750579833984375, 0.610137939453125, 0.6452178955078125, 0.6802978515625, 0.7153778076171875, 0.750457763671875, 0.7855377197265625, 0.82061767578125, 0.8556976318359375, 0.890777587890625, 0.9258575439453125, 0.9609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 11.0, 18.0, 30.0, 33.0, 62.0, 75.0, 121.0, 146.0, 135.0, 114.0, 85.0, 52.0, 46.0, 18.0, 9.0, 11.0, 6.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.353464126586914, -7.154359817504883, -6.955255508422852, -6.75615119934082, -6.557046890258789, -6.357943058013916, -6.158838748931885, -5.9597344398498535, -5.760630130767822, -5.561525821685791, -5.36242151260376, -5.1633172035217285, -4.9642133712768555, -4.765109062194824, -4.566004753112793, -4.366900444030762, -4.1677961349487305, -3.968691825866699, -3.769587516784668, -3.570483446121216, -3.3713791370391846, -3.1722748279571533, -2.973170757293701, -2.77406644821167, -2.5749621391296387, -2.3758578300476074, -2.176753520965576, -1.977649450302124, -1.7785451412200928, -1.5794408321380615, -1.3803366422653198, -1.1812324523925781, -0.9821276664733887, -0.7830234169960022, -0.5839191675186157, -0.38481491804122925, -0.18571066856384277, 0.013393580913543701, 0.21249783039093018, 0.4116020202636719, 0.6107063293457031, 0.8098105788230896, 1.008914828300476, 1.2080190181732178, 1.407123327255249, 1.6062276363372803, 1.805331826210022, 2.0044360160827637, 2.203540325164795, 2.402644634246826, 2.6017489433288574, 2.8008530139923096, 2.999957323074341, 3.199061632156372, 3.398165702819824, 3.5972700119018555, 3.7963743209838867, 3.995478630065918, 4.194582939147949, 4.3936872482299805, 4.592791557312012, 4.791895389556885, 4.990999698638916, 5.190104007720947, 5.3892083168029785]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 0.0, 4.0, 3.0, 13.0, 10.0, 14.0, 12.0, 25.0, 27.0, 39.0, 37.0, 37.0, 45.0, 46.0, 52.0, 70.0, 69.0, 61.0, 57.0, 51.0, 54.0, 45.0, 41.0, 41.0, 26.0, 28.0, 22.0, 18.0, 19.0, 10.0, 6.0, 4.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.372010707855225, -4.262429714202881, -4.152849197387695, -4.043268203735352, -3.933687448501587, -3.8241066932678223, -3.7145259380340576, -3.604945182800293, -3.4953644275665283, -3.3857836723327637, -3.276202917098999, -3.1666221618652344, -3.0570411682128906, -2.947460412979126, -2.8378796577453613, -2.7282989025115967, -2.618718147277832, -2.5091373920440674, -2.3995566368103027, -2.289975643157959, -2.1803948879241943, -2.0708141326904297, -1.961233377456665, -1.8516526222229004, -1.7420716285705566, -1.632490873336792, -1.5229099988937378, -1.4133292436599731, -1.3037484884262085, -1.1941676139831543, -1.0845868587493896, -0.975006103515625, -0.8654253482818604, -0.7558445334434509, -0.6462637782096863, -0.5366829633712769, -0.4271021783351898, -0.3175213932991028, -0.20794057846069336, -0.09835982322692871, 0.011220991611480713, 0.12080178409814835, 0.23038257658481598, 0.3399633765220642, 0.44954416155815125, 0.5591249465942383, 0.6687057614326477, 0.7782865166664124, 0.8878673315048218, 0.9974481463432312, 1.1070289611816406, 1.2166097164154053, 1.32619047164917, 1.4357712268829346, 1.5453521013259888, 1.6549328565597534, 1.7645137310028076, 1.8740944862365723, 1.9836753606796265, 2.0932559967041016, 2.2028369903564453, 2.31241774559021, 2.4219985008239746, 2.5315792560577393, 2.641160011291504]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 7.0, 10.0, 18.0, 17.0, 29.0, 52.0, 104.0, 231.0, 540.0, 1607.0, 5843.0, 32101.0, 465609.0, 498980.0, 34519.0, 6094.0, 1707.0, 635.0, 229.0, 98.0, 52.0, 23.0, 15.0, 10.0, 5.0, 4.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.224609375, -1.182403564453125, -1.14019775390625, -1.097991943359375, -1.0557861328125, -1.013580322265625, -0.97137451171875, -0.929168701171875, -0.886962890625, -0.844757080078125, -0.80255126953125, -0.760345458984375, -0.7181396484375, -0.675933837890625, -0.63372802734375, -0.591522216796875, -0.54931640625, -0.507110595703125, -0.46490478515625, -0.422698974609375, -0.3804931640625, -0.338287353515625, -0.29608154296875, -0.253875732421875, -0.211669921875, -0.169464111328125, -0.12725830078125, -0.085052490234375, -0.0428466796875, -0.000640869140625, 0.04156494140625, 0.083770751953125, 0.1259765625, 0.168182373046875, 0.21038818359375, 0.252593994140625, 0.2947998046875, 0.337005615234375, 0.37921142578125, 0.421417236328125, 0.463623046875, 0.505828857421875, 0.54803466796875, 0.590240478515625, 0.6324462890625, 0.674652099609375, 0.71685791015625, 0.759063720703125, 0.80126953125, 0.843475341796875, 0.88568115234375, 0.927886962890625, 0.9700927734375, 1.012298583984375, 1.05450439453125, 1.096710205078125, 1.138916015625, 1.181121826171875, 1.22332763671875, 1.265533447265625, 1.3077392578125, 1.349945068359375, 1.39215087890625, 1.434356689453125, 1.4765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 9.0, 14.0, 15.0, 25.0, 42.0, 33.0, 59.0, 79.0, 69.0, 88.0, 97.0, 93.0, 87.0, 75.0, 57.0, 57.0, 24.0, 26.0, 18.0, 10.0, 6.0, 6.0, 8.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.277313232421875, -4.17181396484375, -4.066314697265625, -3.9608154296875, -3.855316162109375, -3.74981689453125, -3.644317626953125, -3.538818359375, -3.433319091796875, -3.32781982421875, -3.222320556640625, -3.1168212890625, -3.011322021484375, -2.90582275390625, -2.800323486328125, -2.69482421875, -2.589324951171875, -2.48382568359375, -2.378326416015625, -2.2728271484375, -2.167327880859375, -2.06182861328125, -1.956329345703125, -1.850830078125, -1.745330810546875, -1.63983154296875, -1.534332275390625, -1.4288330078125, -1.323333740234375, -1.21783447265625, -1.112335205078125, -1.0068359375, -0.901336669921875, -0.79583740234375, -0.690338134765625, -0.5848388671875, -0.479339599609375, -0.37384033203125, -0.268341064453125, -0.162841796875, -0.057342529296875, 0.04815673828125, 0.153656005859375, 0.2591552734375, 0.364654541015625, 0.47015380859375, 0.575653076171875, 0.68115234375, 0.786651611328125, 0.89215087890625, 0.997650146484375, 1.1031494140625, 1.208648681640625, 1.31414794921875, 1.419647216796875, 1.525146484375, 1.630645751953125, 1.73614501953125, 1.841644287109375, 1.9471435546875, 2.052642822265625, 2.15814208984375, 2.263641357421875, 2.369140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 9.0, 9.0, 23.0, 33.0, 57.0, 84.0, 127.0, 228.0, 430.0, 881.0, 2146.0, 5343.0, 15867.0, 63566.0, 343031.0, 482565.0, 99776.0, 22375.0, 6983.0, 2690.0, 1174.0, 516.0, 255.0, 148.0, 104.0, 46.0, 21.0, 20.0, 11.0, 6.0, 5.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6122970581054688, -0.5932464599609375, -0.5741958618164062, -0.555145263671875, -0.5360946655273438, -0.5170440673828125, -0.49799346923828125, -0.47894287109375, -0.45989227294921875, -0.4408416748046875, -0.42179107666015625, -0.402740478515625, -0.38368988037109375, -0.3646392822265625, -0.34558868408203125, -0.3265380859375, -0.30748748779296875, -0.2884368896484375, -0.26938629150390625, -0.250335693359375, -0.23128509521484375, -0.2122344970703125, -0.19318389892578125, -0.17413330078125, -0.15508270263671875, -0.1360321044921875, -0.11698150634765625, -0.097930908203125, -0.07888031005859375, -0.0598297119140625, -0.04077911376953125, -0.021728515625, -0.00267791748046875, 0.0163726806640625, 0.03542327880859375, 0.054473876953125, 0.07352447509765625, 0.0925750732421875, 0.11162567138671875, 0.13067626953125, 0.14972686767578125, 0.1687774658203125, 0.18782806396484375, 0.206878662109375, 0.22592926025390625, 0.2449798583984375, 0.26403045654296875, 0.2830810546875, 0.30213165283203125, 0.3211822509765625, 0.34023284912109375, 0.359283447265625, 0.37833404541015625, 0.3973846435546875, 0.41643524169921875, 0.43548583984375, 0.45453643798828125, 0.4735870361328125, 0.49263763427734375, 0.511688232421875, 0.5307388305664062, 0.5497894287109375, 0.5688400268554688, 0.587890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 9.0, 9.0, 13.0, 13.0, 15.0, 26.0, 19.0, 36.0, 33.0, 41.0, 50.0, 46.0, 59.0, 70.0, 58.0, 61.0, 56.0, 55.0, 53.0, 47.0, 43.0, 35.0, 26.0, 36.0, 16.0, 17.0, 11.0, 14.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53515625, -3.4093017578125, -3.283447265625, -3.1575927734375, -3.03173828125, -2.9058837890625, -2.780029296875, -2.6541748046875, -2.5283203125, -2.4024658203125, -2.276611328125, -2.1507568359375, -2.02490234375, -1.8990478515625, -1.773193359375, -1.6473388671875, -1.521484375, -1.3956298828125, -1.269775390625, -1.1439208984375, -1.01806640625, -0.8922119140625, -0.766357421875, -0.6405029296875, -0.5146484375, -0.3887939453125, -0.262939453125, -0.1370849609375, -0.01123046875, 0.1146240234375, 0.240478515625, 0.3663330078125, 0.4921875, 0.6180419921875, 0.743896484375, 0.8697509765625, 0.99560546875, 1.1214599609375, 1.247314453125, 1.3731689453125, 1.4990234375, 1.6248779296875, 1.750732421875, 1.8765869140625, 2.00244140625, 2.1282958984375, 2.254150390625, 2.3800048828125, 2.505859375, 2.6317138671875, 2.757568359375, 2.8834228515625, 3.00927734375, 3.1351318359375, 3.260986328125, 3.3868408203125, 3.5126953125, 3.6385498046875, 3.764404296875, 3.8902587890625, 4.01611328125, 4.1419677734375, 4.267822265625, 4.3936767578125, 4.51953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 20.0, 25.0, 37.0, 66.0, 91.0, 152.0, 271.0, 517.0, 891.0, 1761.0, 3407.0, 7594.0, 20829.0, 75326.0, 378474.0, 431378.0, 88468.0, 22913.0, 8504.0, 3674.0, 1885.0, 1026.0, 507.0, 274.0, 153.0, 104.0, 65.0, 38.0, 33.0, 19.0, 12.0, 7.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.22216796875, -0.21632957458496094, -0.21049118041992188, -0.2046527862548828, -0.19881439208984375, -0.1929759979248047, -0.18713760375976562, -0.18129920959472656, -0.1754608154296875, -0.16962242126464844, -0.16378402709960938, -0.1579456329345703, -0.15210723876953125, -0.1462688446044922, -0.14043045043945312, -0.13459205627441406, -0.128753662109375, -0.12291526794433594, -0.11707687377929688, -0.11123847961425781, -0.10540008544921875, -0.09956169128417969, -0.09372329711914062, -0.08788490295410156, -0.0820465087890625, -0.07620811462402344, -0.07036972045898438, -0.06453132629394531, -0.05869293212890625, -0.05285453796386719, -0.047016143798828125, -0.04117774963378906, -0.03533935546875, -0.029500961303710938, -0.023662567138671875, -0.017824172973632812, -0.01198577880859375, -0.0061473846435546875, -0.000308990478515625, 0.0055294036865234375, 0.0113677978515625, 0.017206192016601562, 0.023044586181640625, 0.028882980346679688, 0.03472137451171875, 0.04055976867675781, 0.046398162841796875, 0.05223655700683594, 0.058074951171875, 0.06391334533691406, 0.06975173950195312, 0.07559013366699219, 0.08142852783203125, 0.08726692199707031, 0.09310531616210938, 0.09894371032714844, 0.1047821044921875, 0.11062049865722656, 0.11645889282226562, 0.12229728698730469, 0.12813568115234375, 0.1339740753173828, 0.13981246948242188, 0.14565086364746094, 0.1514892578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 9.0, 19.0, 25.0, 33.0, 41.0, 70.0, 101.0, 102.0, 132.0, 120.0, 91.0, 70.0, 52.0, 35.0, 25.0, 19.0, 15.0, 4.0, 4.0, 9.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011783838272094727, -0.00011319946497678757, -0.00010856054723262787, -0.00010392162948846817, -9.928271174430847e-05, -9.464379400014877e-05, -9.000487625598907e-05, -8.536595851182938e-05, -8.072704076766968e-05, -7.608812302350998e-05, -7.144920527935028e-05, -6.681028753519058e-05, -6.217136979103088e-05, -5.7532452046871185e-05, -5.289353430271149e-05, -4.825461655855179e-05, -4.361569881439209e-05, -3.897678107023239e-05, -3.433786332607269e-05, -2.9698945581912994e-05, -2.5060027837753296e-05, -2.0421110093593597e-05, -1.57821923494339e-05, -1.11432746052742e-05, -6.504356861114502e-06, -1.8654391169548035e-06, 2.773478627204895e-06, 7.4123963713645935e-06, 1.2051314115524292e-05, 1.669023185968399e-05, 2.132914960384369e-05, 2.5968067348003387e-05, 3.0606985092163086e-05, 3.5245902836322784e-05, 3.988482058048248e-05, 4.452373832464218e-05, 4.916265606880188e-05, 5.380157381296158e-05, 5.844049155712128e-05, 6.307940930128098e-05, 6.771832704544067e-05, 7.235724478960037e-05, 7.699616253376007e-05, 8.163508027791977e-05, 8.627399802207947e-05, 9.091291576623917e-05, 9.555183351039886e-05, 0.00010019075125455856, 0.00010482966899871826, 0.00010946858674287796, 0.00011410750448703766, 0.00011874642223119736, 0.00012338533997535706, 0.00012802425771951675, 0.00013266317546367645, 0.00013730209320783615, 0.00014194101095199585, 0.00014657992869615555, 0.00015121884644031525, 0.00015585776418447495, 0.00016049668192863464, 0.00016513559967279434, 0.00016977451741695404, 0.00017441343516111374, 0.00017905235290527344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 13.0, 4.0, 14.0, 12.0, 15.0, 23.0, 36.0, 67.0, 66.0, 137.0, 188.0, 366.0, 647.0, 1184.0, 2266.0, 4590.0, 10643.0, 29567.0, 108000.0, 451810.0, 327216.0, 73766.0, 21596.0, 8270.0, 3830.0, 1847.0, 956.0, 546.0, 320.0, 180.0, 126.0, 74.0, 54.0, 40.0, 23.0, 10.0, 12.0, 9.0, 12.0, 7.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166259765625, -0.16049957275390625, -0.1547393798828125, -0.14897918701171875, -0.143218994140625, -0.13745880126953125, -0.1316986083984375, -0.12593841552734375, -0.12017822265625, -0.11441802978515625, -0.1086578369140625, -0.10289764404296875, -0.097137451171875, -0.09137725830078125, -0.0856170654296875, -0.07985687255859375, -0.0740966796875, -0.06833648681640625, -0.0625762939453125, -0.05681610107421875, -0.051055908203125, -0.04529571533203125, -0.0395355224609375, -0.03377532958984375, -0.02801513671875, -0.02225494384765625, -0.0164947509765625, -0.01073455810546875, -0.004974365234375, 0.00078582763671875, 0.0065460205078125, 0.01230621337890625, 0.01806640625, 0.02382659912109375, 0.0295867919921875, 0.03534698486328125, 0.041107177734375, 0.04686737060546875, 0.0526275634765625, 0.05838775634765625, 0.06414794921875, 0.06990814208984375, 0.0756683349609375, 0.08142852783203125, 0.087188720703125, 0.09294891357421875, 0.0987091064453125, 0.10446929931640625, 0.1102294921875, 0.11598968505859375, 0.1217498779296875, 0.12751007080078125, 0.133270263671875, 0.13903045654296875, 0.1447906494140625, 0.15055084228515625, 0.15631103515625, 0.16207122802734375, 0.1678314208984375, 0.17359161376953125, 0.179351806640625, 0.18511199951171875, 0.1908721923828125, 0.19663238525390625, 0.202392578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 12.0, 12.0, 22.0, 10.0, 18.0, 38.0, 42.0, 39.0, 56.0, 82.0, 86.0, 94.0, 93.0, 80.0, 69.0, 63.0, 47.0, 38.0, 22.0, 21.0, 14.0, 9.0, 9.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037109375, -0.03561687469482422, -0.03412437438964844, -0.032631874084472656, -0.031139373779296875, -0.029646873474121094, -0.028154373168945312, -0.02666187286376953, -0.02516937255859375, -0.02367687225341797, -0.022184371948242188, -0.020691871643066406, -0.019199371337890625, -0.017706871032714844, -0.016214370727539062, -0.014721870422363281, -0.0132293701171875, -0.011736869812011719, -0.010244369506835938, -0.008751869201660156, -0.007259368896484375, -0.005766868591308594, -0.0042743682861328125, -0.0027818679809570312, -0.00128936767578125, 0.00020313262939453125, 0.0016956329345703125, 0.0031881332397460938, 0.004680633544921875, 0.006173133850097656, 0.0076656341552734375, 0.009158134460449219, 0.010650634765625, 0.012143135070800781, 0.013635635375976562, 0.015128135681152344, 0.016620635986328125, 0.018113136291503906, 0.019605636596679688, 0.02109813690185547, 0.02259063720703125, 0.02408313751220703, 0.025575637817382812, 0.027068138122558594, 0.028560638427734375, 0.030053138732910156, 0.03154563903808594, 0.03303813934326172, 0.0345306396484375, 0.03602313995361328, 0.03751564025878906, 0.039008140563964844, 0.040500640869140625, 0.041993141174316406, 0.04348564147949219, 0.04497814178466797, 0.04647064208984375, 0.04796314239501953, 0.04945564270019531, 0.050948143005371094, 0.052440643310546875, 0.053933143615722656, 0.05542564392089844, 0.05691814422607422, 0.05841064453125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 10.0, 7.0, 19.0, 26.0, 39.0, 66.0, 94.0, 175.0, 165.0, 137.0, 104.0, 72.0, 31.0, 17.0, 10.0, 8.0, 7.0, 4.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.084479808807373, -4.936653137207031, -4.7888264656066895, -4.641000270843506, -4.493173599243164, -4.345346927642822, -4.1975202560424805, -4.049693584442139, -3.901867151260376, -3.754040479660034, -3.6062140464782715, -3.4583873748779297, -3.310560703277588, -3.162734270095825, -3.0149075984954834, -2.8670811653137207, -2.719254493713379, -2.571427822113037, -2.4236013889312744, -2.2757747173309326, -2.12794828414917, -1.9801216125488281, -1.8322949409484863, -1.684468388557434, -1.5366418361663818, -1.3888152837753296, -1.2409887313842773, -1.0931620597839355, -0.9453355073928833, -0.797508955001831, -0.649682343006134, -0.501855731010437, -0.35402917861938477, -0.20620259642601013, -0.0583760142326355, 0.08945056796073914, 0.23727715015411377, 0.385103702545166, 0.532930314540863, 0.6807569265365601, 0.8285834789276123, 0.9764100313186646, 1.1242365837097168, 1.2720632553100586, 1.4198898077011108, 1.567716360092163, 1.7155430316925049, 1.8633695840835571, 2.0111961364746094, 2.159022808074951, 2.306849241256714, 2.4546759128570557, 2.6025023460388184, 2.75032901763916, 2.898155689239502, 3.0459823608398438, 3.1938087940216064, 3.3416354656219482, 3.489461898803711, 3.6372885704040527, 3.7851152420043945, 3.9329416751861572, 4.08076810836792, 4.228594779968262, 4.3764214515686035]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 17.0, 13.0, 22.0, 28.0, 39.0, 51.0, 50.0, 51.0, 68.0, 85.0, 95.0, 68.0, 79.0, 62.0, 55.0, 55.0, 35.0, 33.0, 22.0, 22.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4835197925567627, -3.3976821899414062, -3.31184458732605, -3.2260069847106934, -3.140169620513916, -3.0543320178985596, -2.968494415283203, -2.8826568126678467, -2.7968192100524902, -2.710981607437134, -2.6251440048217773, -2.539306640625, -2.4534690380096436, -2.367631435394287, -2.2817938327789307, -2.195956230163574, -2.110118865966797, -2.0242812633514404, -1.9384437799453735, -1.852606177330017, -1.7667686939239502, -1.6809310913085938, -1.5950934886932373, -1.5092558860778809, -1.423418402671814, -1.3375808000564575, -1.2517433166503906, -1.1659057140350342, -1.0800681114196777, -0.9942306280136108, -0.9083930253982544, -0.8225554823875427, -0.7367181777954102, -0.6508806347846985, -0.5650430917739868, -0.47920548915863037, -0.3933679461479187, -0.30753040313720703, -0.22169280052185059, -0.13585525751113892, -0.050017714500427246, 0.03581984341144562, 0.12165740132331848, 0.20749497413635254, 0.2933325171470642, 0.3791700601577759, 0.4650076627731323, 0.550845205783844, 0.6366827487945557, 0.7225202918052673, 0.808357834815979, 0.8941954374313354, 0.9800329804420471, 1.0658705234527588, 1.1517081260681152, 1.2375457286834717, 1.3233832120895386, 1.409220814704895, 1.495058298110962, 1.5808959007263184, 1.6667335033416748, 1.7525709867477417, 1.8384085893630981, 1.924246072769165, 2.0100836753845215]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 8.0, 14.0, 22.0, 42.0, 65.0, 157.0, 244.0, 519.0, 1053.0, 2354.0, 6112.0, 19030.0, 79613.0, 644098.0, 238707.0, 38524.0, 11053.0, 3887.0, 1583.0, 687.0, 370.0, 178.0, 88.0, 51.0, 29.0, 22.0, 9.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.19921875, -3.09173583984375, -2.9842529296875, -2.87677001953125, -2.769287109375, -2.66180419921875, -2.5543212890625, -2.44683837890625, -2.33935546875, -2.23187255859375, -2.1243896484375, -2.01690673828125, -1.909423828125, -1.80194091796875, -1.6944580078125, -1.58697509765625, -1.4794921875, -1.37200927734375, -1.2645263671875, -1.15704345703125, -1.049560546875, -0.94207763671875, -0.8345947265625, -0.72711181640625, -0.61962890625, -0.51214599609375, -0.4046630859375, -0.29718017578125, -0.189697265625, -0.08221435546875, 0.0252685546875, 0.13275146484375, 0.240234375, 0.34771728515625, 0.4552001953125, 0.56268310546875, 0.670166015625, 0.77764892578125, 0.8851318359375, 0.99261474609375, 1.10009765625, 1.20758056640625, 1.3150634765625, 1.42254638671875, 1.530029296875, 1.63751220703125, 1.7449951171875, 1.85247802734375, 1.9599609375, 2.06744384765625, 2.1749267578125, 2.28240966796875, 2.389892578125, 2.49737548828125, 2.6048583984375, 2.71234130859375, 2.81982421875, 2.92730712890625, 3.0347900390625, 3.14227294921875, 3.249755859375, 3.35723876953125, 3.4647216796875, 3.57220458984375, 3.6796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 4.0, 8.0, 11.0, 11.0, 14.0, 10.0, 32.0, 23.0, 33.0, 35.0, 43.0, 70.0, 60.0, 57.0, 78.0, 56.0, 54.0, 71.0, 41.0, 49.0, 49.0, 39.0, 34.0, 21.0, 22.0, 18.0, 13.0, 7.0, 5.0, 12.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-6.9296875, -6.764923095703125, -6.60015869140625, -6.435394287109375, -6.2706298828125, -6.105865478515625, -5.94110107421875, -5.776336669921875, -5.611572265625, -5.446807861328125, -5.28204345703125, -5.117279052734375, -4.9525146484375, -4.787750244140625, -4.62298583984375, -4.458221435546875, -4.29345703125, -4.128692626953125, -3.96392822265625, -3.799163818359375, -3.6343994140625, -3.469635009765625, -3.30487060546875, -3.140106201171875, -2.975341796875, -2.810577392578125, -2.64581298828125, -2.481048583984375, -2.3162841796875, -2.151519775390625, -1.98675537109375, -1.821990966796875, -1.6572265625, -1.492462158203125, -1.32769775390625, -1.162933349609375, -0.9981689453125, -0.833404541015625, -0.66864013671875, -0.503875732421875, -0.339111328125, -0.174346923828125, -0.00958251953125, 0.155181884765625, 0.3199462890625, 0.484710693359375, 0.64947509765625, 0.814239501953125, 0.97900390625, 1.143768310546875, 1.30853271484375, 1.473297119140625, 1.6380615234375, 1.802825927734375, 1.96759033203125, 2.132354736328125, 2.297119140625, 2.461883544921875, 2.62664794921875, 2.791412353515625, 2.9561767578125, 3.120941162109375, 3.28570556640625, 3.450469970703125, 3.615234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 12.0, 12.0, 14.0, 14.0, 16.0, 22.0, 21.0, 21.0, 25.0, 26.0, 27.0, 24.0, 33.0, 41.0, 47.0, 88.0, 342.0, 5564.0, 915583.0, 123997.0, 1963.0, 218.0, 76.0, 38.0, 30.0, 25.0, 20.0, 33.0, 26.0, 16.0, 20.0, 19.0, 18.0, 15.0, 14.0, 8.0, 11.0, 9.0, 8.0, 10.0, 10.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.0078125, -9.67236328125, -9.3369140625, -9.00146484375, -8.666015625, -8.33056640625, -7.9951171875, -7.65966796875, -7.32421875, -6.98876953125, -6.6533203125, -6.31787109375, -5.982421875, -5.64697265625, -5.3115234375, -4.97607421875, -4.640625, -4.30517578125, -3.9697265625, -3.63427734375, -3.298828125, -2.96337890625, -2.6279296875, -2.29248046875, -1.95703125, -1.62158203125, -1.2861328125, -0.95068359375, -0.615234375, -0.27978515625, 0.0556640625, 0.39111328125, 0.7265625, 1.06201171875, 1.3974609375, 1.73291015625, 2.068359375, 2.40380859375, 2.7392578125, 3.07470703125, 3.41015625, 3.74560546875, 4.0810546875, 4.41650390625, 4.751953125, 5.08740234375, 5.4228515625, 5.75830078125, 6.09375, 6.42919921875, 6.7646484375, 7.10009765625, 7.435546875, 7.77099609375, 8.1064453125, 8.44189453125, 8.77734375, 9.11279296875, 9.4482421875, 9.78369140625, 10.119140625, 10.45458984375, 10.7900390625, 11.12548828125, 11.4609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 13.0, 21.0, 20.0, 17.0, 12.0, 21.0, 30.0, 23.0, 21.0, 27.0, 29.0, 27.0, 42.0, 34.0, 37.0, 43.0, 42.0, 44.0, 38.0, 31.0, 50.0, 24.0, 27.0, 24.0, 22.0, 34.0, 22.0, 22.0, 19.0, 23.0, 20.0, 17.0, 13.0, 6.0, 10.0, 14.0, 8.0, 11.0, 5.0, 10.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.630859375, -3.502593994140625, -3.37432861328125, -3.246063232421875, -3.1177978515625, -2.989532470703125, -2.86126708984375, -2.733001708984375, -2.604736328125, -2.476470947265625, -2.34820556640625, -2.219940185546875, -2.0916748046875, -1.963409423828125, -1.83514404296875, -1.706878662109375, -1.57861328125, -1.450347900390625, -1.32208251953125, -1.193817138671875, -1.0655517578125, -0.937286376953125, -0.80902099609375, -0.680755615234375, -0.552490234375, -0.424224853515625, -0.29595947265625, -0.167694091796875, -0.0394287109375, 0.088836669921875, 0.21710205078125, 0.345367431640625, 0.4736328125, 0.601898193359375, 0.73016357421875, 0.858428955078125, 0.9866943359375, 1.114959716796875, 1.24322509765625, 1.371490478515625, 1.499755859375, 1.628021240234375, 1.75628662109375, 1.884552001953125, 2.0128173828125, 2.141082763671875, 2.26934814453125, 2.397613525390625, 2.52587890625, 2.654144287109375, 2.78240966796875, 2.910675048828125, 3.0389404296875, 3.167205810546875, 3.29547119140625, 3.423736572265625, 3.552001953125, 3.680267333984375, 3.80853271484375, 3.936798095703125, 4.0650634765625, 4.193328857421875, 4.32159423828125, 4.449859619140625, 4.578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 7.0, 21.0, 24.0, 35.0, 85.0, 145.0, 298.0, 627.0, 1408.0, 4508.0, 20673.0, 259957.0, 711070.0, 39692.0, 6552.0, 1915.0, 751.0, 331.0, 154.0, 98.0, 55.0, 40.0, 23.0, 19.0, 8.0, 12.0, 2.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1396484375, -1.0904388427734375, -1.041229248046875, -0.9920196533203125, -0.94281005859375, -0.8936004638671875, -0.844390869140625, -0.7951812744140625, -0.7459716796875, -0.6967620849609375, -0.647552490234375, -0.5983428955078125, -0.54913330078125, -0.4999237060546875, -0.450714111328125, -0.4015045166015625, -0.352294921875, -0.3030853271484375, -0.253875732421875, -0.2046661376953125, -0.15545654296875, -0.1062469482421875, -0.057037353515625, -0.0078277587890625, 0.0413818359375, 0.0905914306640625, 0.139801025390625, 0.1890106201171875, 0.23822021484375, 0.2874298095703125, 0.336639404296875, 0.3858489990234375, 0.43505859375, 0.4842681884765625, 0.533477783203125, 0.5826873779296875, 0.63189697265625, 0.6811065673828125, 0.730316162109375, 0.7795257568359375, 0.8287353515625, 0.8779449462890625, 0.927154541015625, 0.9763641357421875, 1.02557373046875, 1.0747833251953125, 1.123992919921875, 1.1732025146484375, 1.222412109375, 1.2716217041015625, 1.320831298828125, 1.3700408935546875, 1.41925048828125, 1.4684600830078125, 1.517669677734375, 1.5668792724609375, 1.6160888671875, 1.6652984619140625, 1.714508056640625, 1.7637176513671875, 1.81292724609375, 1.8621368408203125, 1.911346435546875, 1.9605560302734375, 2.009765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 7.0, 15.0, 15.0, 25.0, 35.0, 47.0, 71.0, 107.0, 182.0, 142.0, 118.0, 76.0, 33.0, 31.0, 18.0, 19.0, 14.0, 12.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002149343490600586, -0.00020877830684185028, -0.00020262226462364197, -0.00019646622240543365, -0.00019031018018722534, -0.00018415413796901703, -0.00017799809575080872, -0.0001718420535326004, -0.0001656860113143921, -0.00015952996909618378, -0.00015337392687797546, -0.00014721788465976715, -0.00014106184244155884, -0.00013490580022335052, -0.0001287497580051422, -0.0001225937157869339, -0.00011643767356872559, -0.00011028163135051727, -0.00010412558913230896, -9.796954691410065e-05, -9.181350469589233e-05, -8.565746247768402e-05, -7.950142025947571e-05, -7.33453780412674e-05, -6.718933582305908e-05, -6.103329360485077e-05, -5.4877251386642456e-05, -4.872120916843414e-05, -4.256516695022583e-05, -3.640912473201752e-05, -3.0253082513809204e-05, -2.409704029560089e-05, -1.7940998077392578e-05, -1.1784955859184265e-05, -5.628913640975952e-06, 5.271285772323608e-07, 6.683170795440674e-06, 1.2839213013648987e-05, 1.89952552318573e-05, 2.5151297450065613e-05, 3.1307339668273926e-05, 3.746338188648224e-05, 4.361942410469055e-05, 4.9775466322898865e-05, 5.593150854110718e-05, 6.208755075931549e-05, 6.82435929775238e-05, 7.439963519573212e-05, 8.055567741394043e-05, 8.671171963214874e-05, 9.286776185035706e-05, 9.902380406856537e-05, 0.00010517984628677368, 0.000111335888504982, 0.00011749193072319031, 0.00012364797294139862, 0.00012980401515960693, 0.00013596005737781525, 0.00014211609959602356, 0.00014827214181423187, 0.00015442818403244019, 0.0001605842262506485, 0.0001667402684688568, 0.00017289631068706512, 0.00017905235290527344]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 11.0, 17.0, 25.0, 44.0, 47.0, 92.0, 147.0, 218.0, 359.0, 613.0, 1109.0, 2104.0, 4314.0, 10179.0, 30302.0, 145194.0, 678716.0, 128470.0, 28017.0, 9730.0, 4184.0, 2006.0, 1115.0, 565.0, 323.0, 197.0, 133.0, 104.0, 55.0, 45.0, 24.0, 26.0, 14.0, 9.0, 8.0, 3.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.033203125, -1.0040740966796875, -0.974945068359375, -0.9458160400390625, -0.91668701171875, -0.8875579833984375, -0.858428955078125, -0.8292999267578125, -0.8001708984375, -0.7710418701171875, -0.741912841796875, -0.7127838134765625, -0.68365478515625, -0.6545257568359375, -0.625396728515625, -0.5962677001953125, -0.567138671875, -0.5380096435546875, -0.508880615234375, -0.4797515869140625, -0.45062255859375, -0.4214935302734375, -0.392364501953125, -0.3632354736328125, -0.3341064453125, -0.3049774169921875, -0.275848388671875, -0.2467193603515625, -0.21759033203125, -0.1884613037109375, -0.159332275390625, -0.1302032470703125, -0.10107421875, -0.0719451904296875, -0.042816162109375, -0.0136871337890625, 0.01544189453125, 0.0445709228515625, 0.073699951171875, 0.1028289794921875, 0.1319580078125, 0.1610870361328125, 0.190216064453125, 0.2193450927734375, 0.24847412109375, 0.2776031494140625, 0.306732177734375, 0.3358612060546875, 0.364990234375, 0.3941192626953125, 0.423248291015625, 0.4523773193359375, 0.48150634765625, 0.5106353759765625, 0.539764404296875, 0.5688934326171875, 0.5980224609375, 0.6271514892578125, 0.656280517578125, 0.6854095458984375, 0.71453857421875, 0.7436676025390625, 0.772796630859375, 0.8019256591796875, 0.8310546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 9.0, 2.0, 7.0, 7.0, 12.0, 22.0, 39.0, 42.0, 53.0, 89.0, 151.0, 187.0, 146.0, 76.0, 44.0, 34.0, 22.0, 17.0, 9.0, 10.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6259765625, -0.6065673828125, -0.587158203125, -0.5677490234375, -0.54833984375, -0.5289306640625, -0.509521484375, -0.4901123046875, -0.470703125, -0.4512939453125, -0.431884765625, -0.4124755859375, -0.39306640625, -0.3736572265625, -0.354248046875, -0.3348388671875, -0.3154296875, -0.2960205078125, -0.276611328125, -0.2572021484375, -0.23779296875, -0.2183837890625, -0.198974609375, -0.1795654296875, -0.16015625, -0.1407470703125, -0.121337890625, -0.1019287109375, -0.08251953125, -0.0631103515625, -0.043701171875, -0.0242919921875, -0.0048828125, 0.0145263671875, 0.033935546875, 0.0533447265625, 0.07275390625, 0.0921630859375, 0.111572265625, 0.1309814453125, 0.150390625, 0.1697998046875, 0.189208984375, 0.2086181640625, 0.22802734375, 0.2474365234375, 0.266845703125, 0.2862548828125, 0.3056640625, 0.3250732421875, 0.344482421875, 0.3638916015625, 0.38330078125, 0.4027099609375, 0.422119140625, 0.4415283203125, 0.4609375, 0.4803466796875, 0.499755859375, 0.5191650390625, 0.53857421875, 0.5579833984375, 0.577392578125, 0.5968017578125, 0.6162109375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 12.0, 15.0, 9.0, 16.0, 42.0, 40.0, 59.0, 88.0, 129.0, 130.0, 105.0, 98.0, 78.0, 61.0, 34.0, 17.0, 13.0, 17.0, 9.0, 6.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.66705322265625, -7.446164608001709, -7.225276470184326, -7.004387855529785, -6.783499240875244, -6.562610626220703, -6.34172248840332, -6.120833873748779, -5.899945259094238, -5.679056644439697, -5.4581685066223145, -5.237279891967773, -5.016391277313232, -4.795502662658691, -4.574614524841309, -4.353725910186768, -4.132837295532227, -3.9119489192962646, -3.6910603046417236, -3.4701719284057617, -3.2492833137512207, -3.028394937515259, -2.807506561279297, -2.586617946624756, -2.365729808807373, -2.144841432571411, -1.9239528179168701, -1.7030644416809082, -1.4821758270263672, -1.2612874507904053, -1.0403989553451538, -0.8195104598999023, -0.5986218452453613, -0.37773334980010986, -0.1568448841571808, 0.06404358148574829, 0.28493207693099976, 0.5058205127716064, 0.7267090082168579, 0.9475975036621094, 1.1684859991073608, 1.3893744945526123, 1.6102629899978638, 1.8311514854431152, 2.052039861679077, 2.272928237915039, 2.49381685256958, 2.714705467224121, 2.935593843460083, 3.156482219696045, 3.377370834350586, 3.598259210586548, 3.819147825241089, 4.040036201477051, 4.260924816131592, 4.481813430786133, 4.702701568603516, 4.923590183258057, 5.1444783210754395, 5.3653669357299805, 5.5862555503845215, 5.8071441650390625, 6.028032302856445, 6.248920917510986, 6.469809532165527]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 4.0, 8.0, 7.0, 11.0, 8.0, 11.0, 12.0, 21.0, 12.0, 21.0, 24.0, 31.0, 31.0, 39.0, 41.0, 41.0, 40.0, 52.0, 33.0, 48.0, 40.0, 32.0, 37.0, 40.0, 35.0, 36.0, 34.0, 31.0, 27.0, 32.0, 25.0, 27.0, 20.0, 11.0, 14.0, 14.0, 14.0, 3.0, 5.0, 4.0, 10.0, 1.0, 3.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.317837238311768, -7.08499002456665, -6.852142810821533, -6.619295597076416, -6.386447906494141, -6.153600692749023, -5.920753479003906, -5.687906265258789, -5.455059051513672, -5.222211837768555, -4.9893646240234375, -4.75651741027832, -4.523670196533203, -4.290822982788086, -4.0579752922058105, -3.8251280784606934, -3.592280864715576, -3.359433650970459, -3.126586437225342, -2.8937389850616455, -2.6608917713165283, -2.428044557571411, -2.195197105407715, -1.9623498916625977, -1.7295026779174805, -1.4966554641723633, -1.2638081312179565, -1.0309607982635498, -0.7981135845184326, -0.5652663707733154, -0.3324190378189087, -0.09957170486450195, 0.13327550888061523, 0.3661227822303772, 0.5989700555801392, 0.8318173289299011, 1.064664602279663, 1.2975118160247803, 1.530359148979187, 1.7632064819335938, 1.996053695678711, 2.228900909423828, 2.4617481231689453, 2.6945955753326416, 2.927442789077759, 3.160290002822876, 3.3931374549865723, 3.6259846687316895, 3.8588318824768066, 4.091679096221924, 4.324526309967041, 4.557373523712158, 4.790221214294434, 5.023068428039551, 5.255915641784668, 5.488762855529785, 5.721610069274902, 5.9544572830200195, 6.187304496765137, 6.420151710510254, 6.652998924255371, 6.885846138000488, 7.118693828582764, 7.351541042327881, 7.584388256072998]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 3.0, 8.0, 8.0, 17.0, 20.0, 30.0, 26.0, 72.0, 85.0, 156.0, 293.0, 640.0, 1775.0, 6013.0, 31885.0, 641030.0, 3408779.0, 87095.0, 11616.0, 2821.0, 941.0, 414.0, 203.0, 109.0, 64.0, 48.0, 29.0, 27.0, 12.0, 10.0, 8.0, 8.0, 5.0, 8.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.1796875, -6.9698486328125, -6.760009765625, -6.5501708984375, -6.34033203125, -6.1304931640625, -5.920654296875, -5.7108154296875, -5.5009765625, -5.2911376953125, -5.081298828125, -4.8714599609375, -4.66162109375, -4.4517822265625, -4.241943359375, -4.0321044921875, -3.822265625, -3.6124267578125, -3.402587890625, -3.1927490234375, -2.98291015625, -2.7730712890625, -2.563232421875, -2.3533935546875, -2.1435546875, -1.9337158203125, -1.723876953125, -1.5140380859375, -1.30419921875, -1.0943603515625, -0.884521484375, -0.6746826171875, -0.46484375, -0.2550048828125, -0.045166015625, 0.1646728515625, 0.37451171875, 0.5843505859375, 0.794189453125, 1.0040283203125, 1.2138671875, 1.4237060546875, 1.633544921875, 1.8433837890625, 2.05322265625, 2.2630615234375, 2.472900390625, 2.6827392578125, 2.892578125, 3.1024169921875, 3.312255859375, 3.5220947265625, 3.73193359375, 3.9417724609375, 4.151611328125, 4.3614501953125, 4.5712890625, 4.7811279296875, 4.990966796875, 5.2008056640625, 5.41064453125, 5.6204833984375, 5.830322265625, 6.0401611328125, 6.25]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 7.0, 6.0, 10.0, 19.0, 25.0, 26.0, 32.0, 59.0, 56.0, 61.0, 80.0, 84.0, 82.0, 70.0, 64.0, 61.0, 52.0, 51.0, 35.0, 26.0, 17.0, 13.0, 13.0, 13.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.908203125, -3.808563232421875, -3.70892333984375, -3.609283447265625, -3.5096435546875, -3.410003662109375, -3.31036376953125, -3.210723876953125, -3.111083984375, -3.011444091796875, -2.91180419921875, -2.812164306640625, -2.7125244140625, -2.612884521484375, -2.51324462890625, -2.413604736328125, -2.31396484375, -2.214324951171875, -2.11468505859375, -2.015045166015625, -1.9154052734375, -1.815765380859375, -1.71612548828125, -1.616485595703125, -1.516845703125, -1.417205810546875, -1.31756591796875, -1.217926025390625, -1.1182861328125, -1.018646240234375, -0.91900634765625, -0.819366455078125, -0.7197265625, -0.620086669921875, -0.52044677734375, -0.420806884765625, -0.3211669921875, -0.221527099609375, -0.12188720703125, -0.022247314453125, 0.077392578125, 0.177032470703125, 0.27667236328125, 0.376312255859375, 0.4759521484375, 0.575592041015625, 0.67523193359375, 0.774871826171875, 0.87451171875, 0.974151611328125, 1.07379150390625, 1.173431396484375, 1.2730712890625, 1.372711181640625, 1.47235107421875, 1.571990966796875, 1.671630859375, 1.771270751953125, 1.87091064453125, 1.970550537109375, 2.0701904296875, 2.169830322265625, 2.26947021484375, 2.369110107421875, 2.46875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 3.0, 4.0, 12.0, 15.0, 31.0, 43.0, 113.0, 308.0, 1645.0, 53296.0, 4120618.0, 16792.0, 969.0, 219.0, 98.0, 43.0, 22.0, 21.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -9.880859375, -9.37109375, -8.861328125, -8.3515625, -7.841796875, -7.33203125, -6.822265625, -6.3125, -5.802734375, -5.29296875, -4.783203125, -4.2734375, -3.763671875, -3.25390625, -2.744140625, -2.234375, -1.724609375, -1.21484375, -0.705078125, -0.1953125, 0.314453125, 0.82421875, 1.333984375, 1.84375, 2.353515625, 2.86328125, 3.373046875, 3.8828125, 4.392578125, 4.90234375, 5.412109375, 5.921875, 6.431640625, 6.94140625, 7.451171875, 7.9609375, 8.470703125, 8.98046875, 9.490234375, 10.0, 10.509765625, 11.01953125, 11.529296875, 12.0390625, 12.548828125, 13.05859375, 13.568359375, 14.078125, 14.587890625, 15.09765625, 15.607421875, 16.1171875, 16.626953125, 17.13671875, 17.646484375, 18.15625, 18.666015625, 19.17578125, 19.685546875, 20.1953125, 20.705078125, 21.21484375, 21.724609375, 22.234375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 3.0, 9.0, 6.0, 9.0, 17.0, 26.0, 22.0, 31.0, 43.0, 75.0, 99.0, 120.0, 153.0, 226.0, 407.0, 727.0, 751.0, 420.0, 273.0, 188.0, 133.0, 65.0, 70.0, 49.0, 35.0, 18.0, 21.0, 22.0, 7.0, 13.0, 4.0, 2.0, 9.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89794921875, -0.8680801391601562, -0.8382110595703125, -0.8083419799804688, -0.778472900390625, -0.7486038208007812, -0.7187347412109375, -0.6888656616210938, -0.65899658203125, -0.6291275024414062, -0.5992584228515625, -0.5693893432617188, -0.539520263671875, -0.5096511840820312, -0.4797821044921875, -0.44991302490234375, -0.4200439453125, -0.39017486572265625, -0.3603057861328125, -0.33043670654296875, -0.300567626953125, -0.27069854736328125, -0.2408294677734375, -0.21096038818359375, -0.18109130859375, -0.15122222900390625, -0.1213531494140625, -0.09148406982421875, -0.061614990234375, -0.03174591064453125, -0.0018768310546875, 0.02799224853515625, 0.057861328125, 0.08773040771484375, 0.1175994873046875, 0.14746856689453125, 0.177337646484375, 0.20720672607421875, 0.2370758056640625, 0.26694488525390625, 0.29681396484375, 0.32668304443359375, 0.3565521240234375, 0.38642120361328125, 0.416290283203125, 0.44615936279296875, 0.4760284423828125, 0.5058975219726562, 0.5357666015625, 0.5656356811523438, 0.5955047607421875, 0.6253738403320312, 0.655242919921875, 0.6851119995117188, 0.7149810791015625, 0.7448501586914062, 0.77471923828125, 0.8045883178710938, 0.8344573974609375, 0.8643264770507812, 0.894195556640625, 0.9240646362304688, 0.9539337158203125, 0.9838027954101562, 1.013671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 16.0, 11.0, 15.0, 28.0, 28.0, 52.0, 64.0, 71.0, 100.0, 107.0, 118.0, 75.0, 69.0, 59.0, 36.0, 34.0, 21.0, 21.0, 8.0, 13.0, 14.0, 7.0, 0.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.490677356719971, -4.362713813781738, -4.234749794006348, -4.106786251068115, -3.9788224697113037, -3.850858688354492, -3.7228951454162598, -3.5949313640594482, -3.4669675827026367, -3.339003801345825, -3.2110402584075928, -3.0830764770507812, -2.9551126956939697, -2.827148914337158, -2.699185371398926, -2.5712215900421143, -2.443258047103882, -2.3152942657470703, -2.187330722808838, -2.0593669414520264, -1.9314031600952148, -1.8034394979476929, -1.675475835800171, -1.5475120544433594, -1.4195483922958374, -1.2915847301483154, -1.163620948791504, -1.035657286643982, -0.9076935648918152, -0.7797298431396484, -0.6517661809921265, -0.5238024592399597, -0.39583897590637207, -0.2678752541542053, -0.13991156220436096, -0.011947870254516602, 0.11601585149765015, 0.2439795732498169, 0.37194323539733887, 0.4999069571495056, 0.6278706789016724, 0.7558344006538391, 0.8837981224060059, 1.0117617845535278, 1.1397254467010498, 1.2676892280578613, 1.3956528902053833, 1.5236165523529053, 1.6515803337097168, 1.7795439958572388, 1.9075077772140503, 2.0354714393615723, 2.163435220718384, 2.2913990020751953, 2.4193625450134277, 2.5473263263702393, 2.675290107727051, 2.8032538890838623, 2.9312174320220947, 3.0591812133789062, 3.1871449947357178, 3.3151087760925293, 3.4430723190307617, 3.5710361003875732, 3.6989996433258057]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 12.0, 13.0, 9.0, 13.0, 23.0, 35.0, 32.0, 29.0, 41.0, 55.0, 66.0, 61.0, 53.0, 63.0, 67.0, 55.0, 41.0, 56.0, 55.0, 42.0, 27.0, 28.0, 22.0, 23.0, 17.0, 21.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.8028132915496826, -3.7039666175842285, -3.6051201820373535, -3.5062735080718994, -3.4074270725250244, -3.3085803985595703, -3.2097339630126953, -3.110887289047241, -3.012040615081787, -2.913193941116333, -2.814347505569458, -2.715500831604004, -2.616654396057129, -2.517807722091675, -2.4189610481262207, -2.3201146125793457, -2.2212681770324707, -2.1224215030670166, -2.0235750675201416, -1.9247283935546875, -1.825881838798523, -1.7270352840423584, -1.6281887292861938, -1.5293421745300293, -1.4304955005645752, -1.3316489458084106, -1.232802391052246, -1.133955717086792, -1.0351091623306274, -0.9362626075744629, -0.8374160528182983, -0.738569438457489, -0.6397228240966797, -0.5408762693405151, -0.4420296549797058, -0.34318310022354126, -0.24433651566505432, -0.14548993110656738, -0.04664337635040283, 0.052203238010406494, 0.15104979276657104, 0.24989637732505798, 0.3487429618835449, 0.4475895166397095, 0.546436071395874, 0.6452826857566833, 0.7441292405128479, 0.8429758548736572, 0.9418224096298218, 1.0406689643859863, 1.1395155191421509, 1.2383620738983154, 1.3372087478637695, 1.436055302619934, 1.5349018573760986, 1.6337485313415527, 1.7325949668884277, 1.8314415216445923, 1.9302880764007568, 2.029134750366211, 2.127981185913086, 2.22682785987854, 2.325674533843994, 2.424520969390869, 2.5233676433563232]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 7.0, 13.0, 36.0, 22.0, 42.0, 62.0, 101.0, 153.0, 290.0, 549.0, 1260.0, 3028.0, 9263.0, 40415.0, 293162.0, 577431.0, 96677.0, 17533.0, 4918.0, 1746.0, 829.0, 407.0, 206.0, 133.0, 83.0, 43.0, 36.0, 21.0, 17.0, 12.0, 10.0, 4.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7158203125, -0.692901611328125, -0.66998291015625, -0.647064208984375, -0.6241455078125, -0.601226806640625, -0.57830810546875, -0.555389404296875, -0.532470703125, -0.509552001953125, -0.48663330078125, -0.463714599609375, -0.4407958984375, -0.417877197265625, -0.39495849609375, -0.372039794921875, -0.34912109375, -0.326202392578125, -0.30328369140625, -0.280364990234375, -0.2574462890625, -0.234527587890625, -0.21160888671875, -0.188690185546875, -0.165771484375, -0.142852783203125, -0.11993408203125, -0.097015380859375, -0.0740966796875, -0.051177978515625, -0.02825927734375, -0.005340576171875, 0.017578125, 0.040496826171875, 0.06341552734375, 0.086334228515625, 0.1092529296875, 0.132171630859375, 0.15509033203125, 0.178009033203125, 0.200927734375, 0.223846435546875, 0.24676513671875, 0.269683837890625, 0.2926025390625, 0.315521240234375, 0.33843994140625, 0.361358642578125, 0.38427734375, 0.407196044921875, 0.43011474609375, 0.453033447265625, 0.4759521484375, 0.498870849609375, 0.52178955078125, 0.544708251953125, 0.567626953125, 0.590545654296875, 0.61346435546875, 0.636383056640625, 0.6593017578125, 0.682220458984375, 0.70513916015625, 0.728057861328125, 0.7509765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 7.0, 14.0, 14.0, 23.0, 24.0, 22.0, 44.0, 44.0, 51.0, 56.0, 67.0, 77.0, 59.0, 69.0, 55.0, 64.0, 57.0, 51.0, 35.0, 32.0, 31.0, 22.0, 21.0, 16.0, 14.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.24609375, -2.17523193359375, -2.1043701171875, -2.03350830078125, -1.962646484375, -1.89178466796875, -1.8209228515625, -1.75006103515625, -1.67919921875, -1.60833740234375, -1.5374755859375, -1.46661376953125, -1.395751953125, -1.32489013671875, -1.2540283203125, -1.18316650390625, -1.1123046875, -1.04144287109375, -0.9705810546875, -0.89971923828125, -0.828857421875, -0.75799560546875, -0.6871337890625, -0.61627197265625, -0.54541015625, -0.47454833984375, -0.4036865234375, -0.33282470703125, -0.261962890625, -0.19110107421875, -0.1202392578125, -0.04937744140625, 0.021484375, 0.09234619140625, 0.1632080078125, 0.23406982421875, 0.304931640625, 0.37579345703125, 0.4466552734375, 0.51751708984375, 0.58837890625, 0.65924072265625, 0.7301025390625, 0.80096435546875, 0.871826171875, 0.94268798828125, 1.0135498046875, 1.08441162109375, 1.1552734375, 1.22613525390625, 1.2969970703125, 1.36785888671875, 1.438720703125, 1.50958251953125, 1.5804443359375, 1.65130615234375, 1.72216796875, 1.79302978515625, 1.8638916015625, 1.93475341796875, 2.005615234375, 2.07647705078125, 2.1473388671875, 2.21820068359375, 2.2890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 8.0, 19.0, 19.0, 24.0, 34.0, 54.0, 91.0, 113.0, 221.0, 344.0, 637.0, 1262.0, 2637.0, 5809.0, 16577.0, 58124.0, 238949.0, 464340.0, 190392.0, 45623.0, 13358.0, 5119.0, 2238.0, 1010.0, 584.0, 347.0, 191.0, 140.0, 85.0, 57.0, 40.0, 21.0, 14.0, 19.0, 12.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.49609375, -0.4828338623046875, -0.469573974609375, -0.4563140869140625, -0.44305419921875, -0.4297943115234375, -0.416534423828125, -0.4032745361328125, -0.3900146484375, -0.3767547607421875, -0.363494873046875, -0.3502349853515625, -0.33697509765625, -0.3237152099609375, -0.310455322265625, -0.2971954345703125, -0.283935546875, -0.2706756591796875, -0.257415771484375, -0.2441558837890625, -0.23089599609375, -0.2176361083984375, -0.204376220703125, -0.1911163330078125, -0.1778564453125, -0.1645965576171875, -0.151336669921875, -0.1380767822265625, -0.12481689453125, -0.1115570068359375, -0.098297119140625, -0.0850372314453125, -0.07177734375, -0.0585174560546875, -0.045257568359375, -0.0319976806640625, -0.01873779296875, -0.0054779052734375, 0.007781982421875, 0.0210418701171875, 0.0343017578125, 0.0475616455078125, 0.060821533203125, 0.0740814208984375, 0.08734130859375, 0.1006011962890625, 0.113861083984375, 0.1271209716796875, 0.140380859375, 0.1536407470703125, 0.166900634765625, 0.1801605224609375, 0.19342041015625, 0.2066802978515625, 0.219940185546875, 0.2332000732421875, 0.2464599609375, 0.2597198486328125, 0.272979736328125, 0.2862396240234375, 0.29949951171875, 0.3127593994140625, 0.326019287109375, 0.3392791748046875, 0.3525390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 10.0, 5.0, 7.0, 12.0, 17.0, 26.0, 18.0, 20.0, 20.0, 38.0, 33.0, 41.0, 51.0, 58.0, 54.0, 61.0, 71.0, 58.0, 51.0, 50.0, 46.0, 38.0, 39.0, 37.0, 27.0, 29.0, 28.0, 14.0, 9.0, 11.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.17578125, -4.061065673828125, -3.94635009765625, -3.831634521484375, -3.7169189453125, -3.602203369140625, -3.48748779296875, -3.372772216796875, -3.258056640625, -3.143341064453125, -3.02862548828125, -2.913909912109375, -2.7991943359375, -2.684478759765625, -2.56976318359375, -2.455047607421875, -2.34033203125, -2.225616455078125, -2.11090087890625, -1.996185302734375, -1.8814697265625, -1.766754150390625, -1.65203857421875, -1.537322998046875, -1.422607421875, -1.307891845703125, -1.19317626953125, -1.078460693359375, -0.9637451171875, -0.849029541015625, -0.73431396484375, -0.619598388671875, -0.5048828125, -0.390167236328125, -0.27545166015625, -0.160736083984375, -0.0460205078125, 0.068695068359375, 0.18341064453125, 0.298126220703125, 0.412841796875, 0.527557373046875, 0.64227294921875, 0.756988525390625, 0.8717041015625, 0.986419677734375, 1.10113525390625, 1.215850830078125, 1.33056640625, 1.445281982421875, 1.55999755859375, 1.674713134765625, 1.7894287109375, 1.904144287109375, 2.01885986328125, 2.133575439453125, 2.248291015625, 2.363006591796875, 2.47772216796875, 2.592437744140625, 2.7071533203125, 2.821868896484375, 2.93658447265625, 3.051300048828125, 3.166015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 14.0, 7.0, 7.0, 15.0, 19.0, 48.0, 47.0, 88.0, 155.0, 321.0, 589.0, 1228.0, 2783.0, 7110.0, 22831.0, 104706.0, 494179.0, 329133.0, 60742.0, 15220.0, 5202.0, 2078.0, 937.0, 456.0, 224.0, 161.0, 87.0, 62.0, 28.0, 32.0, 11.0, 14.0, 4.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.20654296875, -0.20093536376953125, -0.1953277587890625, -0.18972015380859375, -0.184112548828125, -0.17850494384765625, -0.1728973388671875, -0.16728973388671875, -0.16168212890625, -0.15607452392578125, -0.1504669189453125, -0.14485931396484375, -0.139251708984375, -0.13364410400390625, -0.1280364990234375, -0.12242889404296875, -0.1168212890625, -0.11121368408203125, -0.1056060791015625, -0.09999847412109375, -0.094390869140625, -0.08878326416015625, -0.0831756591796875, -0.07756805419921875, -0.07196044921875, -0.06635284423828125, -0.0607452392578125, -0.05513763427734375, -0.049530029296875, -0.04392242431640625, -0.0383148193359375, -0.03270721435546875, -0.027099609375, -0.02149200439453125, -0.0158843994140625, -0.01027679443359375, -0.004669189453125, 0.00093841552734375, 0.0065460205078125, 0.01215362548828125, 0.01776123046875, 0.02336883544921875, 0.0289764404296875, 0.03458404541015625, 0.040191650390625, 0.04579925537109375, 0.0514068603515625, 0.05701446533203125, 0.0626220703125, 0.06822967529296875, 0.0738372802734375, 0.07944488525390625, 0.085052490234375, 0.09066009521484375, 0.0962677001953125, 0.10187530517578125, 0.10748291015625, 0.11309051513671875, 0.1186981201171875, 0.12430572509765625, 0.129913330078125, 0.13552093505859375, 0.1411285400390625, 0.14673614501953125, 0.15234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 9.0, 11.0, 13.0, 11.0, 16.0, 31.0, 26.0, 29.0, 37.0, 56.0, 61.0, 81.0, 66.0, 79.0, 74.0, 66.0, 66.0, 46.0, 42.0, 43.0, 37.0, 23.0, 18.0, 8.0, 13.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.208917617797852e-05, -8.940789848566055e-05, -8.672662079334259e-05, -8.404534310102463e-05, -8.136406540870667e-05, -7.86827877163887e-05, -7.600151002407074e-05, -7.332023233175278e-05, -7.063895463943481e-05, -6.795767694711685e-05, -6.527639925479889e-05, -6.259512156248093e-05, -5.9913843870162964e-05, -5.7232566177845e-05, -5.455128848552704e-05, -5.1870010793209076e-05, -4.918873310089111e-05, -4.650745540857315e-05, -4.382617771625519e-05, -4.1144900023937225e-05, -3.846362233161926e-05, -3.57823446393013e-05, -3.310106694698334e-05, -3.0419789254665375e-05, -2.7738511562347412e-05, -2.505723387002945e-05, -2.2375956177711487e-05, -1.9694678485393524e-05, -1.701340079307556e-05, -1.4332123100757599e-05, -1.1650845408439636e-05, -8.969567716121674e-06, -6.288290023803711e-06, -3.6070123314857483e-06, -9.257346391677856e-07, 1.755543053150177e-06, 4.43682074546814e-06, 7.118098437786102e-06, 9.799376130104065e-06, 1.2480653822422028e-05, 1.516193151473999e-05, 1.7843209207057953e-05, 2.0524486899375916e-05, 2.3205764591693878e-05, 2.588704228401184e-05, 2.8568319976329803e-05, 3.1249597668647766e-05, 3.393087536096573e-05, 3.661215305328369e-05, 3.9293430745601654e-05, 4.197470843791962e-05, 4.465598613023758e-05, 4.733726382255554e-05, 5.0018541514873505e-05, 5.269981920719147e-05, 5.538109689950943e-05, 5.806237459182739e-05, 6.0743652284145355e-05, 6.342492997646332e-05, 6.610620766878128e-05, 6.878748536109924e-05, 7.14687630534172e-05, 7.415004074573517e-05, 7.683131843805313e-05, 7.95125961303711e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 14.0, 19.0, 37.0, 44.0, 76.0, 195.0, 400.0, 777.0, 1872.0, 5334.0, 22871.0, 282742.0, 671391.0, 49536.0, 8487.0, 2671.0, 1034.0, 482.0, 253.0, 125.0, 64.0, 49.0, 22.0, 20.0, 10.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.32990264892578125, -0.3199615478515625, -0.31002044677734375, -0.300079345703125, -0.29013824462890625, -0.2801971435546875, -0.27025604248046875, -0.26031494140625, -0.25037384033203125, -0.2404327392578125, -0.23049163818359375, -0.220550537109375, -0.21060943603515625, -0.2006683349609375, -0.19072723388671875, -0.1807861328125, -0.17084503173828125, -0.1609039306640625, -0.15096282958984375, -0.141021728515625, -0.13108062744140625, -0.1211395263671875, -0.11119842529296875, -0.10125732421875, -0.09131622314453125, -0.0813751220703125, -0.07143402099609375, -0.061492919921875, -0.05155181884765625, -0.0416107177734375, -0.03166961669921875, -0.021728515625, -0.01178741455078125, -0.0018463134765625, 0.00809478759765625, 0.018035888671875, 0.02797698974609375, 0.0379180908203125, 0.04785919189453125, 0.05780029296875, 0.06774139404296875, 0.0776824951171875, 0.08762359619140625, 0.097564697265625, 0.10750579833984375, 0.1174468994140625, 0.12738800048828125, 0.1373291015625, 0.14727020263671875, 0.1572113037109375, 0.16715240478515625, 0.177093505859375, 0.18703460693359375, 0.1969757080078125, 0.20691680908203125, 0.21685791015625, 0.22679901123046875, 0.2367401123046875, 0.24668121337890625, 0.256622314453125, 0.26656341552734375, 0.2765045166015625, 0.28644561767578125, 0.29638671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 8.0, 13.0, 22.0, 27.0, 36.0, 69.0, 82.0, 152.0, 166.0, 150.0, 107.0, 51.0, 38.0, 23.0, 13.0, 6.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.0611572265625, -0.05908203125, -0.0570068359375, -0.054931640625, -0.0528564453125, -0.05078125, -0.0487060546875, -0.046630859375, -0.0445556640625, -0.04248046875, -0.0404052734375, -0.038330078125, -0.0362548828125, -0.0341796875, -0.0321044921875, -0.030029296875, -0.0279541015625, -0.02587890625, -0.0238037109375, -0.021728515625, -0.0196533203125, -0.017578125, -0.0155029296875, -0.013427734375, -0.0113525390625, -0.00927734375, -0.0072021484375, -0.005126953125, -0.0030517578125, -0.0009765625, 0.0010986328125, 0.003173828125, 0.0052490234375, 0.00732421875, 0.0093994140625, 0.011474609375, 0.0135498046875, 0.015625, 0.0177001953125, 0.019775390625, 0.0218505859375, 0.02392578125, 0.0260009765625, 0.028076171875, 0.0301513671875, 0.0322265625, 0.0343017578125, 0.036376953125, 0.0384521484375, 0.04052734375, 0.0426025390625, 0.044677734375, 0.0467529296875, 0.048828125, 0.0509033203125, 0.052978515625, 0.0550537109375, 0.05712890625, 0.0592041015625, 0.061279296875, 0.0633544921875, 0.0654296875, 0.0675048828125, 0.069580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 8.0, 8.0, 19.0, 24.0, 33.0, 31.0, 70.0, 88.0, 118.0, 107.0, 127.0, 82.0, 65.0, 55.0, 36.0, 30.0, 17.0, 18.0, 16.0, 8.0, 5.0, 6.0, 1.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.2435925006866455, -3.153115749359131, -3.062638998031616, -2.9721622467041016, -2.881685256958008, -2.791208505630493, -2.7007317543029785, -2.610255002975464, -2.519778251647949, -2.4293015003204346, -2.33882474899292, -2.2483479976654053, -2.1578712463378906, -2.067394256591797, -1.9769175052642822, -1.8864407539367676, -1.795964002609253, -1.7054872512817383, -1.6150104999542236, -1.5245336294174194, -1.4340568780899048, -1.3435801267623901, -1.253103256225586, -1.1626265048980713, -1.0721497535705566, -0.981673002243042, -0.8911961913108826, -0.8007193803787231, -0.7102426290512085, -0.6197658777236938, -0.5292890667915344, -0.438812255859375, -0.34833574295043945, -0.2578589618206024, -0.16738218069076538, -0.07690539956092834, 0.013571381568908691, 0.10404816269874573, 0.19452494382858276, 0.2850017547607422, 0.37547850608825684, 0.46595528721809387, 0.5564320683479309, 0.6469088792800903, 0.737385630607605, 0.8278623819351196, 0.918339192867279, 1.0088160037994385, 1.0992927551269531, 1.1897695064544678, 1.2802462577819824, 1.3707231283187866, 1.4611998796463013, 1.551676630973816, 1.6421535015106201, 1.7326302528381348, 1.8231070041656494, 1.913583755493164, 2.0040605068206787, 2.0945372581481934, 2.185014247894287, 2.2754909992218018, 2.3659677505493164, 2.456444501876831, 2.5469212532043457]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 12.0, 12.0, 20.0, 22.0, 35.0, 28.0, 46.0, 57.0, 59.0, 79.0, 64.0, 74.0, 91.0, 46.0, 66.0, 70.0, 45.0, 28.0, 33.0, 27.0, 20.0, 17.0, 14.0, 11.0, 5.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.759587049484253, -2.686246871948242, -2.6129066944122314, -2.5395665168762207, -2.46622633934021, -2.392886161804199, -2.3195459842681885, -2.2462058067321777, -2.172865629196167, -2.0995254516601562, -2.0261852741241455, -1.9528450965881348, -1.879504919052124, -1.8061647415161133, -1.7328245639801025, -1.6594843864440918, -1.5861440896987915, -1.5128039121627808, -1.43946373462677, -1.3661235570907593, -1.2927833795547485, -1.2194432020187378, -1.1461029052734375, -1.0727627277374268, -0.9994226098060608, -0.92608243227005, -0.8527422547340393, -0.7794020175933838, -0.706061840057373, -0.6327216625213623, -0.5593814849853516, -0.4860413074493408, -0.41270124912261963, -0.3393610715866089, -0.26602089405059814, -0.19268068671226501, -0.11934050917625427, -0.04600033164024353, 0.0273398756980896, 0.10068005323410034, 0.17402023077011108, 0.24736040830612183, 0.32070058584213257, 0.3940407931804657, 0.46738097071647644, 0.5407211780548096, 0.6140613555908203, 0.687401533126831, 0.7607417106628418, 0.8340818881988525, 0.9074220657348633, 0.980762243270874, 1.0541024208068848, 1.1274425983428955, 1.2007827758789062, 1.274122953414917, 1.3474631309509277, 1.4208033084869385, 1.4941434860229492, 1.56748366355896, 1.6408238410949707, 1.7141640186309814, 1.7875041961669922, 1.860844373703003, 1.9341846704483032]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 14.0, 20.0, 28.0, 29.0, 48.0, 65.0, 110.0, 158.0, 310.0, 509.0, 912.0, 1704.0, 3366.0, 7353.0, 18630.0, 60834.0, 296499.0, 507023.0, 103733.0, 27608.0, 10160.0, 4573.0, 2173.0, 1164.0, 631.0, 348.0, 188.0, 121.0, 83.0, 52.0, 25.0, 21.0, 19.0, 14.0, 4.0, 8.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84765625, -2.75634765625, -2.6650390625, -2.57373046875, -2.482421875, -2.39111328125, -2.2998046875, -2.20849609375, -2.1171875, -2.02587890625, -1.9345703125, -1.84326171875, -1.751953125, -1.66064453125, -1.5693359375, -1.47802734375, -1.38671875, -1.29541015625, -1.2041015625, -1.11279296875, -1.021484375, -0.93017578125, -0.8388671875, -0.74755859375, -0.65625, -0.56494140625, -0.4736328125, -0.38232421875, -0.291015625, -0.19970703125, -0.1083984375, -0.01708984375, 0.07421875, 0.16552734375, 0.2568359375, 0.34814453125, 0.439453125, 0.53076171875, 0.6220703125, 0.71337890625, 0.8046875, 0.89599609375, 0.9873046875, 1.07861328125, 1.169921875, 1.26123046875, 1.3525390625, 1.44384765625, 1.53515625, 1.62646484375, 1.7177734375, 1.80908203125, 1.900390625, 1.99169921875, 2.0830078125, 2.17431640625, 2.265625, 2.35693359375, 2.4482421875, 2.53955078125, 2.630859375, 2.72216796875, 2.8134765625, 2.90478515625, 2.99609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 5.0, 9.0, 3.0, 5.0, 16.0, 13.0, 12.0, 19.0, 27.0, 25.0, 26.0, 32.0, 37.0, 51.0, 62.0, 53.0, 65.0, 66.0, 75.0, 61.0, 46.0, 38.0, 44.0, 34.0, 28.0, 23.0, 15.0, 22.0, 20.0, 19.0, 11.0, 5.0, 12.0, 7.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.28125, -4.14056396484375, -3.9998779296875, -3.85919189453125, -3.718505859375, -3.57781982421875, -3.4371337890625, -3.29644775390625, -3.15576171875, -3.01507568359375, -2.8743896484375, -2.73370361328125, -2.593017578125, -2.45233154296875, -2.3116455078125, -2.17095947265625, -2.0302734375, -1.88958740234375, -1.7489013671875, -1.60821533203125, -1.467529296875, -1.32684326171875, -1.1861572265625, -1.04547119140625, -0.90478515625, -0.76409912109375, -0.6234130859375, -0.48272705078125, -0.342041015625, -0.20135498046875, -0.0606689453125, 0.08001708984375, 0.220703125, 0.36138916015625, 0.5020751953125, 0.64276123046875, 0.783447265625, 0.92413330078125, 1.0648193359375, 1.20550537109375, 1.34619140625, 1.48687744140625, 1.6275634765625, 1.76824951171875, 1.908935546875, 2.04962158203125, 2.1903076171875, 2.33099365234375, 2.4716796875, 2.61236572265625, 2.7530517578125, 2.89373779296875, 3.034423828125, 3.17510986328125, 3.3157958984375, 3.45648193359375, 3.59716796875, 3.73785400390625, 3.8785400390625, 4.01922607421875, 4.159912109375, 4.30059814453125, 4.4412841796875, 4.58197021484375, 4.72265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 9.0, 8.0, 14.0, 11.0, 15.0, 11.0, 17.0, 16.0, 26.0, 24.0, 23.0, 34.0, 24.0, 52.0, 45.0, 48.0, 104.0, 411.0, 5130.0, 725483.0, 312707.0, 3478.0, 354.0, 82.0, 62.0, 42.0, 33.0, 32.0, 25.0, 31.0, 27.0, 23.0, 12.0, 12.0, 22.0, 13.0, 11.0, 12.0, 13.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0], "bins": [-11.5546875, -11.19287109375, -10.8310546875, -10.46923828125, -10.107421875, -9.74560546875, -9.3837890625, -9.02197265625, -8.66015625, -8.29833984375, -7.9365234375, -7.57470703125, -7.212890625, -6.85107421875, -6.4892578125, -6.12744140625, -5.765625, -5.40380859375, -5.0419921875, -4.68017578125, -4.318359375, -3.95654296875, -3.5947265625, -3.23291015625, -2.87109375, -2.50927734375, -2.1474609375, -1.78564453125, -1.423828125, -1.06201171875, -0.7001953125, -0.33837890625, 0.0234375, 0.38525390625, 0.7470703125, 1.10888671875, 1.470703125, 1.83251953125, 2.1943359375, 2.55615234375, 2.91796875, 3.27978515625, 3.6416015625, 4.00341796875, 4.365234375, 4.72705078125, 5.0888671875, 5.45068359375, 5.8125, 6.17431640625, 6.5361328125, 6.89794921875, 7.259765625, 7.62158203125, 7.9833984375, 8.34521484375, 8.70703125, 9.06884765625, 9.4306640625, 9.79248046875, 10.154296875, 10.51611328125, 10.8779296875, 11.23974609375, 11.6015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 5.0, 7.0, 12.0, 7.0, 14.0, 17.0, 20.0, 21.0, 23.0, 15.0, 26.0, 33.0, 34.0, 38.0, 27.0, 27.0, 36.0, 45.0, 41.0, 39.0, 32.0, 40.0, 31.0, 43.0, 34.0, 28.0, 30.0, 31.0, 25.0, 23.0, 26.0, 21.0, 14.0, 22.0, 11.0, 12.0, 19.0, 8.0, 11.0, 2.0, 6.0, 5.0, 2.0, 4.0, 0.0, 6.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.77734375, -3.65057373046875, -3.5238037109375, -3.39703369140625, -3.270263671875, -3.14349365234375, -3.0167236328125, -2.88995361328125, -2.76318359375, -2.63641357421875, -2.5096435546875, -2.38287353515625, -2.256103515625, -2.12933349609375, -2.0025634765625, -1.87579345703125, -1.7490234375, -1.62225341796875, -1.4954833984375, -1.36871337890625, -1.241943359375, -1.11517333984375, -0.9884033203125, -0.86163330078125, -0.73486328125, -0.60809326171875, -0.4813232421875, -0.35455322265625, -0.227783203125, -0.10101318359375, 0.0257568359375, 0.15252685546875, 0.279296875, 0.40606689453125, 0.5328369140625, 0.65960693359375, 0.786376953125, 0.91314697265625, 1.0399169921875, 1.16668701171875, 1.29345703125, 1.42022705078125, 1.5469970703125, 1.67376708984375, 1.800537109375, 1.92730712890625, 2.0540771484375, 2.18084716796875, 2.3076171875, 2.43438720703125, 2.5611572265625, 2.68792724609375, 2.814697265625, 2.94146728515625, 3.0682373046875, 3.19500732421875, 3.32177734375, 3.44854736328125, 3.5753173828125, 3.70208740234375, 3.828857421875, 3.95562744140625, 4.0823974609375, 4.20916748046875, 4.3359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 15.0, 23.0, 19.0, 50.0, 90.0, 139.0, 247.0, 488.0, 943.0, 2012.0, 5286.0, 18294.0, 114226.0, 736898.0, 138859.0, 20778.0, 5824.0, 2265.0, 1002.0, 484.0, 243.0, 136.0, 83.0, 48.0, 34.0, 16.0, 13.0, 14.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2421875, -1.2028045654296875, -1.163421630859375, -1.1240386962890625, -1.08465576171875, -1.0452728271484375, -1.005889892578125, -0.9665069580078125, -0.9271240234375, -0.8877410888671875, -0.848358154296875, -0.8089752197265625, -0.76959228515625, -0.7302093505859375, -0.690826416015625, -0.6514434814453125, -0.612060546875, -0.5726776123046875, -0.533294677734375, -0.4939117431640625, -0.45452880859375, -0.4151458740234375, -0.375762939453125, -0.3363800048828125, -0.2969970703125, -0.2576141357421875, -0.218231201171875, -0.1788482666015625, -0.13946533203125, -0.1000823974609375, -0.060699462890625, -0.0213165283203125, 0.01806640625, 0.0574493408203125, 0.096832275390625, 0.1362152099609375, 0.17559814453125, 0.2149810791015625, 0.254364013671875, 0.2937469482421875, 0.3331298828125, 0.3725128173828125, 0.411895751953125, 0.4512786865234375, 0.49066162109375, 0.5300445556640625, 0.569427490234375, 0.6088104248046875, 0.648193359375, 0.6875762939453125, 0.726959228515625, 0.7663421630859375, 0.80572509765625, 0.8451080322265625, 0.884490966796875, 0.9238739013671875, 0.9632568359375, 1.0026397705078125, 1.042022705078125, 1.0814056396484375, 1.12078857421875, 1.1601715087890625, 1.199554443359375, 1.2389373779296875, 1.2783203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 2.0, 7.0, 8.0, 8.0, 8.0, 11.0, 16.0, 17.0, 34.0, 60.0, 65.0, 75.0, 84.0, 135.0, 90.0, 77.0, 61.0, 60.0, 44.0, 32.0, 18.0, 19.0, 11.0, 10.0, 10.0, 4.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00015783309936523438, -0.00015268847346305847, -0.00014754384756088257, -0.00014239922165870667, -0.00013725459575653076, -0.00013210996985435486, -0.00012696534395217896, -0.00012182071805000305, -0.00011667609214782715, -0.00011153146624565125, -0.00010638684034347534, -0.00010124221444129944, -9.609758853912354e-05, -9.095296263694763e-05, -8.580833673477173e-05, -8.066371083259583e-05, -7.551908493041992e-05, -7.037445902824402e-05, -6.522983312606812e-05, -6.008520722389221e-05, -5.494058132171631e-05, -4.9795955419540405e-05, -4.46513295173645e-05, -3.95067036151886e-05, -3.4362077713012695e-05, -2.9217451810836792e-05, -2.407282590866089e-05, -1.8928200006484985e-05, -1.3783574104309082e-05, -8.638948202133179e-06, -3.4943222999572754e-06, 1.650303602218628e-06, 6.794929504394531e-06, 1.1939555406570435e-05, 1.7084181308746338e-05, 2.222880721092224e-05, 2.7373433113098145e-05, 3.251805901527405e-05, 3.766268491744995e-05, 4.2807310819625854e-05, 4.795193672180176e-05, 5.309656262397766e-05, 5.8241188526153564e-05, 6.338581442832947e-05, 6.853044033050537e-05, 7.367506623268127e-05, 7.881969213485718e-05, 8.396431803703308e-05, 8.910894393920898e-05, 9.425356984138489e-05, 9.939819574356079e-05, 0.0001045428216457367, 0.0001096874475479126, 0.0001148320734500885, 0.0001199766993522644, 0.0001251213252544403, 0.0001302659511566162, 0.00013541057705879211, 0.00014055520296096802, 0.00014569982886314392, 0.00015084445476531982, 0.00015598908066749573, 0.00016113370656967163, 0.00016627833247184753, 0.00017142295837402344]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 5.0, 4.0, 8.0, 10.0, 5.0, 24.0, 29.0, 40.0, 51.0, 76.0, 132.0, 197.0, 320.0, 546.0, 1049.0, 2164.0, 5183.0, 14551.0, 58375.0, 384336.0, 480786.0, 72006.0, 17373.0, 6005.0, 2515.0, 1161.0, 603.0, 368.0, 212.0, 134.0, 90.0, 59.0, 34.0, 24.0, 24.0, 17.0, 15.0, 8.0, 9.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.96728515625, -0.9361495971679688, -0.9050140380859375, -0.8738784790039062, -0.842742919921875, -0.8116073608398438, -0.7804718017578125, -0.7493362426757812, -0.71820068359375, -0.6870651245117188, -0.6559295654296875, -0.6247940063476562, -0.593658447265625, -0.5625228881835938, -0.5313873291015625, -0.5002517700195312, -0.4691162109375, -0.43798065185546875, -0.4068450927734375, -0.37570953369140625, -0.344573974609375, -0.31343841552734375, -0.2823028564453125, -0.25116729736328125, -0.22003173828125, -0.18889617919921875, -0.1577606201171875, -0.12662506103515625, -0.095489501953125, -0.06435394287109375, -0.0332183837890625, -0.00208282470703125, 0.029052734375, 0.06018829345703125, 0.0913238525390625, 0.12245941162109375, 0.153594970703125, 0.18473052978515625, 0.2158660888671875, 0.24700164794921875, 0.27813720703125, 0.30927276611328125, 0.3404083251953125, 0.37154388427734375, 0.402679443359375, 0.43381500244140625, 0.4649505615234375, 0.49608612060546875, 0.5272216796875, 0.5583572387695312, 0.5894927978515625, 0.6206283569335938, 0.651763916015625, 0.6828994750976562, 0.7140350341796875, 0.7451705932617188, 0.77630615234375, 0.8074417114257812, 0.8385772705078125, 0.8697128295898438, 0.900848388671875, 0.9319839477539062, 0.9631195068359375, 0.9942550659179688, 1.025390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 8.0, 6.0, 8.0, 21.0, 21.0, 22.0, 29.0, 28.0, 60.0, 78.0, 87.0, 94.0, 107.0, 83.0, 76.0, 75.0, 54.0, 36.0, 30.0, 17.0, 14.0, 4.0, 6.0, 6.0, 10.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3915596008300781, -0.37662506103515625, -0.3616905212402344, -0.3467559814453125, -0.3318214416503906, -0.31688690185546875, -0.3019523620605469, -0.287017822265625, -0.2720832824707031, -0.25714874267578125, -0.24221420288085938, -0.2272796630859375, -0.21234512329101562, -0.19741058349609375, -0.18247604370117188, -0.16754150390625, -0.15260696411132812, -0.13767242431640625, -0.12273788452148438, -0.1078033447265625, -0.09286880493164062, -0.07793426513671875, -0.06299972534179688, -0.048065185546875, -0.033130645751953125, -0.01819610595703125, -0.003261566162109375, 0.0116729736328125, 0.026607513427734375, 0.04154205322265625, 0.056476593017578125, 0.0714111328125, 0.08634567260742188, 0.10128021240234375, 0.11621475219726562, 0.1311492919921875, 0.14608383178710938, 0.16101837158203125, 0.17595291137695312, 0.190887451171875, 0.20582199096679688, 0.22075653076171875, 0.23569107055664062, 0.2506256103515625, 0.2655601501464844, 0.28049468994140625, 0.2954292297363281, 0.31036376953125, 0.3252983093261719, 0.34023284912109375, 0.3551673889160156, 0.3701019287109375, 0.3850364685058594, 0.39997100830078125, 0.4149055480957031, 0.429840087890625, 0.4447746276855469, 0.45970916748046875, 0.4746437072753906, 0.4895782470703125, 0.5045127868652344, 0.5194473266601562, 0.5343818664550781, 0.54931640625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 10.0, 11.0, 20.0, 35.0, 52.0, 128.0, 207.0, 203.0, 152.0, 73.0, 52.0, 25.0, 16.0, 11.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.38946008682251, -5.03520393371582, -4.680947780609131, -4.326691627502441, -3.972435712814331, -3.6181795597076416, -3.2639236450195312, -2.909667491912842, -2.5554113388061523, -2.201155185699463, -1.846899151802063, -1.492643117904663, -1.1383869647979736, -0.7841308116912842, -0.42987489700317383, -0.07561874389648438, 0.2786374092102051, 0.6328935027122498, 0.9871495962142944, 1.3414056301116943, 1.6956617832183838, 2.0499179363250732, 2.4041738510131836, 2.758430004119873, 3.1126861572265625, 3.466942310333252, 3.8211984634399414, 4.175454139709473, 4.52971076965332, 4.883966445922852, 5.238222599029541, 5.5924787521362305, 5.946735382080078, 6.300991535186768, 6.655247688293457, 7.009503364562988, 7.363759994506836, 7.718015670776367, 8.072271347045898, 8.426527976989746, 8.780784606933594, 9.135040283203125, 9.489296913146973, 9.843552589416504, 10.197809219360352, 10.552064895629883, 10.906320571899414, 11.260577201843262, 11.614832878112793, 11.969088554382324, 12.323345184326172, 12.677600860595703, 13.03185749053955, 13.386113166809082, 13.74036979675293, 14.094625473022461, 14.448881149291992, 14.803136825561523, 15.157393455505371, 15.511649131774902, 15.86590576171875, 16.22016143798828, 16.574417114257812, 16.928672790527344, 17.282930374145508]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 2.0, 9.0, 11.0, 13.0, 12.0, 14.0, 17.0, 27.0, 18.0, 36.0, 32.0, 30.0, 34.0, 36.0, 37.0, 30.0, 38.0, 43.0, 43.0, 36.0, 54.0, 41.0, 38.0, 30.0, 37.0, 49.0, 19.0, 26.0, 24.0, 20.0, 23.0, 15.0, 18.0, 13.0, 12.0, 8.0, 8.0, 10.0, 5.0, 2.0, 5.0, 7.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1865620613098145, -6.943087577819824, -6.699612617492676, -6.4561381340026855, -6.212663650512695, -5.969188690185547, -5.725714206695557, -5.482239723205566, -5.238764762878418, -4.995290279388428, -4.751815319061279, -4.508340835571289, -4.264866352081299, -4.021391868591309, -3.77791690826416, -3.53444242477417, -3.2909679412841797, -3.0474932193756104, -2.80401873588562, -2.560544013977051, -2.3170695304870605, -2.073594808578491, -1.8301200866699219, -1.586645483970642, -1.3431708812713623, -1.0996962785720825, -0.856221616268158, -0.6127469539642334, -0.3692723512649536, -0.12579774856567383, 0.11767697334289551, 0.3611515760421753, 0.6046266555786133, 0.8481012582778931, 1.0915758609771729, 1.3350505828857422, 1.578525185585022, 1.8219997882843018, 2.065474510192871, 2.3089489936828613, 2.5524237155914307, 2.7958984375, 3.0393729209899902, 3.2828476428985596, 3.526322364807129, 3.769796848297119, 4.013271331787109, 4.256746292114258, 4.500220775604248, 4.743695259094238, 4.987170219421387, 5.230644702911377, 5.474119186401367, 5.717594146728516, 5.961068630218506, 6.204543113708496, 6.4480180740356445, 6.691492557525635, 6.934967517852783, 7.178442001342773, 7.421916484832764, 7.665390968322754, 7.908865928649902, 8.15234088897705, 8.395814895629883]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 6.0, 16.0, 25.0, 28.0, 50.0, 63.0, 115.0, 136.0, 220.0, 354.0, 657.0, 1183.0, 2451.0, 5655.0, 16456.0, 71271.0, 992198.0, 2938674.0, 127088.0, 23582.0, 7538.0, 3099.0, 1465.0, 755.0, 432.0, 262.0, 170.0, 89.0, 61.0, 42.0, 37.0, 32.0, 16.0, 19.0, 8.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.181640625, -3.059967041015625, -2.93829345703125, -2.816619873046875, -2.6949462890625, -2.573272705078125, -2.45159912109375, -2.329925537109375, -2.208251953125, -2.086578369140625, -1.96490478515625, -1.843231201171875, -1.7215576171875, -1.599884033203125, -1.47821044921875, -1.356536865234375, -1.23486328125, -1.113189697265625, -0.99151611328125, -0.869842529296875, -0.7481689453125, -0.626495361328125, -0.50482177734375, -0.383148193359375, -0.261474609375, -0.139801025390625, -0.01812744140625, 0.103546142578125, 0.2252197265625, 0.346893310546875, 0.46856689453125, 0.590240478515625, 0.7119140625, 0.833587646484375, 0.95526123046875, 1.076934814453125, 1.1986083984375, 1.320281982421875, 1.44195556640625, 1.563629150390625, 1.685302734375, 1.806976318359375, 1.92864990234375, 2.050323486328125, 2.1719970703125, 2.293670654296875, 2.41534423828125, 2.537017822265625, 2.65869140625, 2.780364990234375, 2.90203857421875, 3.023712158203125, 3.1453857421875, 3.267059326171875, 3.38873291015625, 3.510406494140625, 3.632080078125, 3.753753662109375, 3.87542724609375, 3.997100830078125, 4.1187744140625, 4.240447998046875, 4.36212158203125, 4.483795166015625, 4.60546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 6.0, 9.0, 13.0, 16.0, 36.0, 28.0, 38.0, 45.0, 59.0, 65.0, 70.0, 77.0, 58.0, 62.0, 82.0, 54.0, 62.0, 49.0, 32.0, 26.0, 22.0, 22.0, 16.0, 11.0, 13.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.802154541015625, -2.71368408203125, -2.625213623046875, -2.5367431640625, -2.448272705078125, -2.35980224609375, -2.271331787109375, -2.182861328125, -2.094390869140625, -2.00592041015625, -1.917449951171875, -1.8289794921875, -1.740509033203125, -1.65203857421875, -1.563568115234375, -1.47509765625, -1.386627197265625, -1.29815673828125, -1.209686279296875, -1.1212158203125, -1.032745361328125, -0.94427490234375, -0.855804443359375, -0.767333984375, -0.678863525390625, -0.59039306640625, -0.501922607421875, -0.4134521484375, -0.324981689453125, -0.23651123046875, -0.148040771484375, -0.0595703125, 0.028900146484375, 0.11737060546875, 0.205841064453125, 0.2943115234375, 0.382781982421875, 0.47125244140625, 0.559722900390625, 0.648193359375, 0.736663818359375, 0.82513427734375, 0.913604736328125, 1.0020751953125, 1.090545654296875, 1.17901611328125, 1.267486572265625, 1.35595703125, 1.444427490234375, 1.53289794921875, 1.621368408203125, 1.7098388671875, 1.798309326171875, 1.88677978515625, 1.975250244140625, 2.063720703125, 2.152191162109375, 2.24066162109375, 2.329132080078125, 2.4176025390625, 2.506072998046875, 2.59454345703125, 2.683013916015625, 2.771484375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 11.0, 7.0, 11.0, 21.0, 30.0, 45.0, 85.0, 127.0, 342.0, 1472.0, 27982.0, 4120721.0, 40904.0, 1743.0, 397.0, 153.0, 70.0, 54.0, 27.0, 28.0, 16.0, 7.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.2430419921875, -13.853271484375, -13.4635009765625, -13.07373046875, -12.6839599609375, -12.294189453125, -11.9044189453125, -11.5146484375, -11.1248779296875, -10.735107421875, -10.3453369140625, -9.95556640625, -9.5657958984375, -9.176025390625, -8.7862548828125, -8.396484375, -8.0067138671875, -7.616943359375, -7.2271728515625, -6.83740234375, -6.4476318359375, -6.057861328125, -5.6680908203125, -5.2783203125, -4.8885498046875, -4.498779296875, -4.1090087890625, -3.71923828125, -3.3294677734375, -2.939697265625, -2.5499267578125, -2.16015625, -1.7703857421875, -1.380615234375, -0.9908447265625, -0.60107421875, -0.2113037109375, 0.178466796875, 0.5682373046875, 0.9580078125, 1.3477783203125, 1.737548828125, 2.1273193359375, 2.51708984375, 2.9068603515625, 3.296630859375, 3.6864013671875, 4.076171875, 4.4659423828125, 4.855712890625, 5.2454833984375, 5.63525390625, 6.0250244140625, 6.414794921875, 6.8045654296875, 7.1943359375, 7.5841064453125, 7.973876953125, 8.3636474609375, 8.75341796875, 9.1431884765625, 9.532958984375, 9.9227294921875, 10.3125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 21.0, 14.0, 17.0, 29.0, 26.0, 43.0, 74.0, 96.0, 166.0, 273.0, 457.0, 1092.0, 755.0, 378.0, 195.0, 122.0, 92.0, 58.0, 48.0, 24.0, 21.0, 16.0, 17.0, 6.0, 8.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0, -0.97039794921875, -0.9407958984375, -0.91119384765625, -0.881591796875, -0.85198974609375, -0.8223876953125, -0.79278564453125, -0.76318359375, -0.73358154296875, -0.7039794921875, -0.67437744140625, -0.644775390625, -0.61517333984375, -0.5855712890625, -0.55596923828125, -0.5263671875, -0.49676513671875, -0.4671630859375, -0.43756103515625, -0.407958984375, -0.37835693359375, -0.3487548828125, -0.31915283203125, -0.28955078125, -0.25994873046875, -0.2303466796875, -0.20074462890625, -0.171142578125, -0.14154052734375, -0.1119384765625, -0.08233642578125, -0.052734375, -0.02313232421875, 0.0064697265625, 0.03607177734375, 0.065673828125, 0.09527587890625, 0.1248779296875, 0.15447998046875, 0.18408203125, 0.21368408203125, 0.2432861328125, 0.27288818359375, 0.302490234375, 0.33209228515625, 0.3616943359375, 0.39129638671875, 0.4208984375, 0.45050048828125, 0.4801025390625, 0.50970458984375, 0.539306640625, 0.56890869140625, 0.5985107421875, 0.62811279296875, 0.65771484375, 0.68731689453125, 0.7169189453125, 0.74652099609375, 0.776123046875, 0.80572509765625, 0.8353271484375, 0.86492919921875, 0.89453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 8.0, 6.0, 9.0, 18.0, 19.0, 27.0, 48.0, 72.0, 73.0, 100.0, 104.0, 111.0, 96.0, 87.0, 52.0, 37.0, 40.0, 17.0, 12.0, 8.0, 8.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.718958854675293, -3.6025497913360596, -3.486140727996826, -3.3697316646575928, -3.2533226013183594, -3.136913537979126, -3.0205044746398926, -2.9040956497192383, -2.787686347961426, -2.6712772846221924, -2.554868221282959, -2.4384591579437256, -2.322050094604492, -2.205641031265259, -2.0892319679260254, -1.9728230237960815, -1.8564140796661377, -1.7400050163269043, -1.623595952987671, -1.5071868896484375, -1.390777826309204, -1.2743687629699707, -1.1579598188400269, -1.0415507555007935, -0.9251416921615601, -0.8087326288223267, -0.6923235654830933, -0.5759145617485046, -0.45950549840927124, -0.34309643507003784, -0.22668743133544922, -0.11027836799621582, 0.0061304569244384766, 0.12253950536251068, 0.23894855380058289, 0.3553575873374939, 0.4717666506767273, 0.5881757140159607, 0.7045847177505493, 0.8209937810897827, 0.9374028444290161, 1.0538119077682495, 1.170220971107483, 1.2866299152374268, 1.4030389785766602, 1.5194480419158936, 1.635857105255127, 1.7522661685943604, 1.8686752319335938, 1.9850842952728271, 2.1014933586120605, 2.217902421951294, 2.3343114852905273, 2.4507205486297607, 2.567129611968994, 2.6835384368896484, 2.799947738647461, 2.9163568019866943, 3.0327658653259277, 3.149174928665161, 3.2655839920043945, 3.381993055343628, 3.4984021186828613, 3.6148109436035156, 3.731220006942749]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 12.0, 17.0, 20.0, 21.0, 33.0, 31.0, 35.0, 38.0, 55.0, 55.0, 64.0, 74.0, 61.0, 51.0, 67.0, 58.0, 60.0, 49.0, 41.0, 32.0, 25.0, 22.0, 15.0, 12.0, 10.0, 11.0, 7.0, 7.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.964372158050537, -2.870063543319702, -2.775754928588867, -2.6814465522766113, -2.5871379375457764, -2.4928293228149414, -2.3985207080841064, -2.3042120933532715, -2.2099037170410156, -2.1155951023101807, -2.0212864875793457, -1.9269779920578003, -1.8326694965362549, -1.73836088180542, -1.644052267074585, -1.54974365234375, -1.455435037612915, -1.36112642288208, -1.2668179273605347, -1.1725093126296997, -1.0782008171081543, -0.9838922023773193, -0.8895835876464844, -0.7952750325202942, -0.700966477394104, -0.6066579222679138, -0.5123493671417236, -0.41804075241088867, -0.3237321972846985, -0.2294236421585083, -0.13511502742767334, -0.040806472301483154, 0.05350208282470703, 0.1478106528520584, 0.2421192228794098, 0.33642780780792236, 0.43073636293411255, 0.5250449180603027, 0.6193535327911377, 0.7136620879173279, 0.8079706430435181, 0.9022791981697083, 0.9965877532958984, 1.0908963680267334, 1.1852049827575684, 1.2795134782791138, 1.3738220930099487, 1.4681305885314941, 1.562439203262329, 1.656747817993164, 1.7510563135147095, 1.8453649282455444, 1.9396734237670898, 2.033982038497925, 2.1282906532287598, 2.2225992679595947, 2.3169078826904297, 2.4112164974212646, 2.5055251121520996, 2.5998334884643555, 2.6941421031951904, 2.7884507179260254, 2.8827593326568604, 2.9770679473876953, 3.071376323699951]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 4.0, 8.0, 10.0, 15.0, 30.0, 42.0, 62.0, 98.0, 208.0, 471.0, 1231.0, 3376.0, 12123.0, 59278.0, 370261.0, 491907.0, 86372.0, 16438.0, 4167.0, 1365.0, 520.0, 245.0, 119.0, 59.0, 46.0, 27.0, 14.0, 18.0, 13.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4714012145996094, -0.45574188232421875, -0.4400825500488281, -0.4244232177734375, -0.4087638854980469, -0.39310455322265625, -0.3774452209472656, -0.361785888671875, -0.3461265563964844, -0.33046722412109375, -0.3148078918457031, -0.2991485595703125, -0.2834892272949219, -0.26782989501953125, -0.2521705627441406, -0.23651123046875, -0.22085189819335938, -0.20519256591796875, -0.18953323364257812, -0.1738739013671875, -0.15821456909179688, -0.14255523681640625, -0.12689590454101562, -0.111236572265625, -0.09557723999023438, -0.07991790771484375, -0.06425857543945312, -0.0485992431640625, -0.032939910888671875, -0.01728057861328125, -0.001621246337890625, 0.0140380859375, 0.029697418212890625, 0.04535675048828125, 0.061016082763671875, 0.0766754150390625, 0.09233474731445312, 0.10799407958984375, 0.12365341186523438, 0.139312744140625, 0.15497207641601562, 0.17063140869140625, 0.18629074096679688, 0.2019500732421875, 0.21760940551757812, 0.23326873779296875, 0.24892807006835938, 0.26458740234375, 0.2802467346191406, 0.29590606689453125, 0.3115653991699219, 0.3272247314453125, 0.3428840637207031, 0.35854339599609375, 0.3742027282714844, 0.389862060546875, 0.4055213928222656, 0.42118072509765625, 0.4368400573730469, 0.4524993896484375, 0.4681587219238281, 0.48381805419921875, 0.4994773864746094, 0.51513671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 12.0, 14.0, 16.0, 17.0, 29.0, 32.0, 45.0, 59.0, 66.0, 82.0, 90.0, 86.0, 70.0, 85.0, 68.0, 58.0, 45.0, 25.0, 24.0, 15.0, 14.0, 7.0, 10.0, 6.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.8203125, -2.74053955078125, -2.6607666015625, -2.58099365234375, -2.501220703125, -2.42144775390625, -2.3416748046875, -2.26190185546875, -2.18212890625, -2.10235595703125, -2.0225830078125, -1.94281005859375, -1.863037109375, -1.78326416015625, -1.7034912109375, -1.62371826171875, -1.5439453125, -1.46417236328125, -1.3843994140625, -1.30462646484375, -1.224853515625, -1.14508056640625, -1.0653076171875, -0.98553466796875, -0.90576171875, -0.82598876953125, -0.7462158203125, -0.66644287109375, -0.586669921875, -0.50689697265625, -0.4271240234375, -0.34735107421875, -0.267578125, -0.18780517578125, -0.1080322265625, -0.02825927734375, 0.051513671875, 0.13128662109375, 0.2110595703125, 0.29083251953125, 0.37060546875, 0.45037841796875, 0.5301513671875, 0.60992431640625, 0.689697265625, 0.76947021484375, 0.8492431640625, 0.92901611328125, 1.0087890625, 1.08856201171875, 1.1683349609375, 1.24810791015625, 1.327880859375, 1.40765380859375, 1.4874267578125, 1.56719970703125, 1.64697265625, 1.72674560546875, 1.8065185546875, 1.88629150390625, 1.966064453125, 2.04583740234375, 2.1256103515625, 2.20538330078125, 2.28515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 7.0, 18.0, 15.0, 23.0, 30.0, 46.0, 67.0, 92.0, 120.0, 181.0, 311.0, 475.0, 948.0, 1865.0, 4090.0, 11101.0, 33998.0, 118573.0, 341070.0, 352817.0, 126051.0, 36329.0, 11511.0, 4487.0, 1886.0, 955.0, 515.0, 310.0, 193.0, 153.0, 93.0, 71.0, 40.0, 34.0, 27.0, 17.0, 14.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2750968933105469, -0.26528167724609375, -0.2554664611816406, -0.2456512451171875, -0.23583602905273438, -0.22602081298828125, -0.21620559692382812, -0.206390380859375, -0.19657516479492188, -0.18675994873046875, -0.17694473266601562, -0.1671295166015625, -0.15731430053710938, -0.14749908447265625, -0.13768386840820312, -0.12786865234375, -0.11805343627929688, -0.10823822021484375, -0.09842300415039062, -0.0886077880859375, -0.07879257202148438, -0.06897735595703125, -0.059162139892578125, -0.049346923828125, -0.039531707763671875, -0.02971649169921875, -0.019901275634765625, -0.0100860595703125, -0.000270843505859375, 0.00954437255859375, 0.019359588623046875, 0.0291748046875, 0.038990020751953125, 0.04880523681640625, 0.058620452880859375, 0.0684356689453125, 0.07825088500976562, 0.08806610107421875, 0.09788131713867188, 0.107696533203125, 0.11751174926757812, 0.12732696533203125, 0.13714218139648438, 0.1469573974609375, 0.15677261352539062, 0.16658782958984375, 0.17640304565429688, 0.18621826171875, 0.19603347778320312, 0.20584869384765625, 0.21566390991210938, 0.2254791259765625, 0.23529434204101562, 0.24510955810546875, 0.2549247741699219, 0.264739990234375, 0.2745552062988281, 0.28437042236328125, 0.2941856384277344, 0.3040008544921875, 0.3138160705566406, 0.32363128662109375, 0.3334465026855469, 0.34326171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 6.0, 5.0, 14.0, 17.0, 18.0, 17.0, 31.0, 32.0, 35.0, 42.0, 52.0, 40.0, 45.0, 49.0, 44.0, 63.0, 65.0, 43.0, 64.0, 45.0, 46.0, 33.0, 33.0, 25.0, 26.0, 24.0, 10.0, 16.0, 8.0, 9.0, 7.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.02734375, -2.92083740234375, -2.8143310546875, -2.70782470703125, -2.601318359375, -2.49481201171875, -2.3883056640625, -2.28179931640625, -2.17529296875, -2.06878662109375, -1.9622802734375, -1.85577392578125, -1.749267578125, -1.64276123046875, -1.5362548828125, -1.42974853515625, -1.3232421875, -1.21673583984375, -1.1102294921875, -1.00372314453125, -0.897216796875, -0.79071044921875, -0.6842041015625, -0.57769775390625, -0.47119140625, -0.36468505859375, -0.2581787109375, -0.15167236328125, -0.045166015625, 0.06134033203125, 0.1678466796875, 0.27435302734375, 0.380859375, 0.48736572265625, 0.5938720703125, 0.70037841796875, 0.806884765625, 0.91339111328125, 1.0198974609375, 1.12640380859375, 1.23291015625, 1.33941650390625, 1.4459228515625, 1.55242919921875, 1.658935546875, 1.76544189453125, 1.8719482421875, 1.97845458984375, 2.0849609375, 2.19146728515625, 2.2979736328125, 2.40447998046875, 2.510986328125, 2.61749267578125, 2.7239990234375, 2.83050537109375, 2.93701171875, 3.04351806640625, 3.1500244140625, 3.25653076171875, 3.363037109375, 3.46954345703125, 3.5760498046875, 3.68255615234375, 3.7890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 4.0, 12.0, 15.0, 29.0, 52.0, 67.0, 137.0, 303.0, 659.0, 1832.0, 7820.0, 101507.0, 886482.0, 42041.0, 5123.0, 1415.0, 540.0, 216.0, 125.0, 65.0, 36.0, 22.0, 15.0, 12.0, 1.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43505859375, -0.42240142822265625, -0.4097442626953125, -0.39708709716796875, -0.384429931640625, -0.37177276611328125, -0.3591156005859375, -0.34645843505859375, -0.33380126953125, -0.32114410400390625, -0.3084869384765625, -0.29582977294921875, -0.283172607421875, -0.27051544189453125, -0.2578582763671875, -0.24520111083984375, -0.2325439453125, -0.21988677978515625, -0.2072296142578125, -0.19457244873046875, -0.181915283203125, -0.16925811767578125, -0.1566009521484375, -0.14394378662109375, -0.13128662109375, -0.11862945556640625, -0.1059722900390625, -0.09331512451171875, -0.080657958984375, -0.06800079345703125, -0.0553436279296875, -0.04268646240234375, -0.030029296875, -0.01737213134765625, -0.0047149658203125, 0.00794219970703125, 0.020599365234375, 0.03325653076171875, 0.0459136962890625, 0.05857086181640625, 0.07122802734375, 0.08388519287109375, 0.0965423583984375, 0.10919952392578125, 0.121856689453125, 0.13451385498046875, 0.1471710205078125, 0.15982818603515625, 0.1724853515625, 0.18514251708984375, 0.1977996826171875, 0.21045684814453125, 0.223114013671875, 0.23577117919921875, 0.2484283447265625, 0.26108551025390625, 0.27374267578125, 0.28639984130859375, 0.2990570068359375, 0.31171417236328125, 0.324371337890625, 0.33702850341796875, 0.3496856689453125, 0.36234283447265625, 0.375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 6.0, 10.0, 14.0, 16.0, 35.0, 52.0, 78.0, 95.0, 94.0, 116.0, 123.0, 87.0, 88.0, 56.0, 33.0, 31.0, 14.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010162591934204102, -9.807851165533066e-05, -9.45311039686203e-05, -9.098369628190994e-05, -8.743628859519958e-05, -8.388888090848923e-05, -8.034147322177887e-05, -7.679406553506851e-05, -7.324665784835815e-05, -6.96992501616478e-05, -6.615184247493744e-05, -6.260443478822708e-05, -5.9057027101516724e-05, -5.5509619414806366e-05, -5.196221172809601e-05, -4.841480404138565e-05, -4.486739635467529e-05, -4.1319988667964935e-05, -3.777258098125458e-05, -3.422517329454422e-05, -3.067776560783386e-05, -2.7130357921123505e-05, -2.3582950234413147e-05, -2.003554254770279e-05, -1.648813486099243e-05, -1.2940727174282074e-05, -9.393319487571716e-06, -5.845911800861359e-06, -2.298504114151001e-06, 1.2489035725593567e-06, 4.796311259269714e-06, 8.343718945980072e-06, 1.189112663269043e-05, 1.5438534319400787e-05, 1.8985942006111145e-05, 2.2533349692821503e-05, 2.608075737953186e-05, 2.9628165066242218e-05, 3.3175572752952576e-05, 3.672298043966293e-05, 4.027038812637329e-05, 4.381779581308365e-05, 4.7365203499794006e-05, 5.0912611186504364e-05, 5.446001887321472e-05, 5.800742655992508e-05, 6.155483424663544e-05, 6.51022419333458e-05, 6.864964962005615e-05, 7.219705730676651e-05, 7.574446499347687e-05, 7.929187268018723e-05, 8.283928036689758e-05, 8.638668805360794e-05, 8.99340957403183e-05, 9.348150342702866e-05, 9.702891111373901e-05, 0.00010057631880044937, 0.00010412372648715973, 0.00010767113417387009, 0.00011121854186058044, 0.0001147659495472908, 0.00011831335723400116, 0.00012186076492071152, 0.00012540817260742188]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 3.0, 8.0, 11.0, 19.0, 25.0, 34.0, 52.0, 69.0, 149.0, 187.0, 368.0, 714.0, 1501.0, 4258.0, 19823.0, 342446.0, 640002.0, 29756.0, 5344.0, 1872.0, 816.0, 439.0, 233.0, 147.0, 98.0, 54.0, 49.0, 30.0, 19.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.383544921875, -0.3734779357910156, -0.36341094970703125, -0.3533439636230469, -0.3432769775390625, -0.3332099914550781, -0.32314300537109375, -0.3130760192871094, -0.303009033203125, -0.2929420471191406, -0.28287506103515625, -0.2728080749511719, -0.2627410888671875, -0.2526741027832031, -0.24260711669921875, -0.23254013061523438, -0.22247314453125, -0.21240615844726562, -0.20233917236328125, -0.19227218627929688, -0.1822052001953125, -0.17213821411132812, -0.16207122802734375, -0.15200424194335938, -0.141937255859375, -0.13187026977539062, -0.12180328369140625, -0.11173629760742188, -0.1016693115234375, -0.09160232543945312, -0.08153533935546875, -0.07146835327148438, -0.0614013671875, -0.051334381103515625, -0.04126739501953125, -0.031200408935546875, -0.0211334228515625, -0.011066436767578125, -0.00099945068359375, 0.009067535400390625, 0.019134521484375, 0.029201507568359375, 0.03926849365234375, 0.049335479736328125, 0.0594024658203125, 0.06946945190429688, 0.07953643798828125, 0.08960342407226562, 0.09967041015625, 0.10973739624023438, 0.11980438232421875, 0.12987136840820312, 0.1399383544921875, 0.15000534057617188, 0.16007232666015625, 0.17013931274414062, 0.180206298828125, 0.19027328491210938, 0.20034027099609375, 0.21040725708007812, 0.2204742431640625, 0.23054122924804688, 0.24060821533203125, 0.2506752014160156, 0.2607421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 13.0, 19.0, 38.0, 53.0, 78.0, 128.0, 181.0, 158.0, 118.0, 73.0, 46.0, 26.0, 8.0, 10.0, 13.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.044464111328125, -0.0427403450012207, -0.041016578674316406, -0.03929281234741211, -0.03756904602050781, -0.035845279693603516, -0.03412151336669922, -0.03239774703979492, -0.030673980712890625, -0.028950214385986328, -0.02722644805908203, -0.025502681732177734, -0.023778915405273438, -0.02205514907836914, -0.020331382751464844, -0.018607616424560547, -0.01688385009765625, -0.015160083770751953, -0.013436317443847656, -0.01171255111694336, -0.009988784790039062, -0.008265018463134766, -0.006541252136230469, -0.004817485809326172, -0.003093719482421875, -0.0013699531555175781, 0.00035381317138671875, 0.0020775794982910156, 0.0038013458251953125, 0.005525112152099609, 0.007248878479003906, 0.008972644805908203, 0.0106964111328125, 0.012420177459716797, 0.014143943786621094, 0.01586771011352539, 0.017591476440429688, 0.019315242767333984, 0.02103900909423828, 0.022762775421142578, 0.024486541748046875, 0.026210308074951172, 0.02793407440185547, 0.029657840728759766, 0.03138160705566406, 0.03310537338256836, 0.034829139709472656, 0.03655290603637695, 0.03827667236328125, 0.04000043869018555, 0.041724205017089844, 0.04344797134399414, 0.04517173767089844, 0.046895503997802734, 0.04861927032470703, 0.05034303665161133, 0.052066802978515625, 0.05379056930541992, 0.05551433563232422, 0.057238101959228516, 0.05896186828613281, 0.06068563461303711, 0.062409400939941406, 0.0641331672668457, 0.06585693359375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 8.0, 10.0, 8.0, 23.0, 23.0, 45.0, 85.0, 118.0, 146.0, 141.0, 140.0, 81.0, 56.0, 36.0, 15.0, 15.0, 10.0, 5.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5170416831970215, -2.4128308296203613, -2.308619737625122, -2.204408884048462, -2.1001977920532227, -1.9959869384765625, -1.8917760848999023, -1.7875651121139526, -1.683354139328003, -1.5791431665420532, -1.4749321937561035, -1.3707213401794434, -1.2665103673934937, -1.162299394607544, -1.0580885410308838, -0.9538775682449341, -0.8496665954589844, -0.7454556226730347, -0.6412447094917297, -0.5370337963104248, -0.4328228235244751, -0.3286118507385254, -0.22440093755722046, -0.12019002437591553, -0.01597905158996582, 0.0882318913936615, 0.19244283437728882, 0.29665377736091614, 0.40086472034454346, 0.5050756931304932, 0.6092866063117981, 0.713497519493103, 0.8177084922790527, 0.9219194650650024, 1.0261304378509521, 1.1303412914276123, 1.234552264213562, 1.3387632369995117, 1.4429740905761719, 1.5471850633621216, 1.6513960361480713, 1.755607008934021, 1.8598179817199707, 1.9640288352966309, 2.068239688873291, 2.1724507808685303, 2.2766616344451904, 2.3808727264404297, 2.48508358001709, 2.58929443359375, 2.6935055255889893, 2.7977163791656494, 2.9019274711608887, 3.006138324737549, 3.110349178314209, 3.214560031890869, 3.3187711238861084, 3.4229819774627686, 3.527193069458008, 3.631403923034668, 3.735614776611328, 3.8398258686065674, 3.9440367221832275, 4.048247814178467, 4.152458667755127]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 2.0, 5.0, 16.0, 13.0, 17.0, 30.0, 32.0, 37.0, 50.0, 58.0, 76.0, 91.0, 79.0, 79.0, 75.0, 77.0, 70.0, 51.0, 34.0, 26.0, 25.0, 10.0, 10.0, 11.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.6410934925079346, -2.565190076828003, -2.489286422729492, -2.4133830070495605, -2.337479591369629, -2.2615761756896973, -2.1856727600097656, -2.109769105911255, -2.0338656902313232, -1.9579622745513916, -1.8820587396621704, -1.8061552047729492, -1.7302517890930176, -1.654348373413086, -1.5784448385238647, -1.5025413036346436, -1.426637887954712, -1.3507344722747803, -1.274830937385559, -1.198927402496338, -1.1230239868164062, -1.0471205711364746, -0.9712170362472534, -0.895313560962677, -0.8194100856781006, -0.7435066103935242, -0.6676031351089478, -0.5916996598243713, -0.5157961845397949, -0.4398927092552185, -0.3639892339706421, -0.2880857586860657, -0.21218228340148926, -0.13627880811691284, -0.060375332832336426, 0.01552814245223999, 0.0914316177368164, 0.16733509302139282, 0.24323856830596924, 0.31914204359054565, 0.39504551887512207, 0.4709489941596985, 0.5468524694442749, 0.6227559447288513, 0.6986594200134277, 0.7745628952980042, 0.8504663705825806, 0.926369845867157, 1.0022733211517334, 1.078176736831665, 1.1540802717208862, 1.2299838066101074, 1.305887222290039, 1.3817906379699707, 1.457694172859192, 1.533597707748413, 1.6095011234283447, 1.6854045391082764, 1.7613080739974976, 1.8372116088867188, 1.9131150245666504, 1.989018440246582, 2.0649218559265137, 2.1408255100250244, 2.216728925704956]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 5.0, 12.0, 5.0, 23.0, 22.0, 20.0, 44.0, 85.0, 242.0, 1084.0, 6908.0, 95837.0, 876674.0, 61129.0, 5227.0, 805.0, 202.0, 75.0, 35.0, 30.0, 14.0, 13.0, 14.0, 11.0, 7.0, 5.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.6015625, -9.36407470703125, -9.1265869140625, -8.88909912109375, -8.651611328125, -8.41412353515625, -8.1766357421875, -7.93914794921875, -7.70166015625, -7.46417236328125, -7.2266845703125, -6.98919677734375, -6.751708984375, -6.51422119140625, -6.2767333984375, -6.03924560546875, -5.8017578125, -5.56427001953125, -5.3267822265625, -5.08929443359375, -4.851806640625, -4.61431884765625, -4.3768310546875, -4.13934326171875, -3.90185546875, -3.66436767578125, -3.4268798828125, -3.18939208984375, -2.951904296875, -2.71441650390625, -2.4769287109375, -2.23944091796875, -2.001953125, -1.76446533203125, -1.5269775390625, -1.28948974609375, -1.052001953125, -0.81451416015625, -0.5770263671875, -0.33953857421875, -0.10205078125, 0.13543701171875, 0.3729248046875, 0.61041259765625, 0.847900390625, 1.08538818359375, 1.3228759765625, 1.56036376953125, 1.7978515625, 2.03533935546875, 2.2728271484375, 2.51031494140625, 2.747802734375, 2.98529052734375, 3.2227783203125, 3.46026611328125, 3.69775390625, 3.93524169921875, 4.1727294921875, 4.41021728515625, 4.647705078125, 4.88519287109375, 5.1226806640625, 5.36016845703125, 5.59765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 11.0, 19.0, 37.0, 52.0, 117.0, 148.0, 176.0, 164.0, 133.0, 62.0, 37.0, 20.0, 11.0, 8.0, 3.0, 5.0, 2.0, 3.0], "bins": [-21.4375, -21.03033447265625, -20.6231689453125, -20.21600341796875, -19.808837890625, -19.40167236328125, -18.9945068359375, -18.58734130859375, -18.18017578125, -17.77301025390625, -17.3658447265625, -16.95867919921875, -16.551513671875, -16.14434814453125, -15.7371826171875, -15.33001708984375, -14.9228515625, -14.51568603515625, -14.1085205078125, -13.70135498046875, -13.294189453125, -12.88702392578125, -12.4798583984375, -12.07269287109375, -11.66552734375, -11.25836181640625, -10.8511962890625, -10.44403076171875, -10.036865234375, -9.62969970703125, -9.2225341796875, -8.81536865234375, -8.408203125, -8.00103759765625, -7.5938720703125, -7.18670654296875, -6.779541015625, -6.37237548828125, -5.9652099609375, -5.55804443359375, -5.15087890625, -4.74371337890625, -4.3365478515625, -3.92938232421875, -3.522216796875, -3.11505126953125, -2.7078857421875, -2.30072021484375, -1.8935546875, -1.48638916015625, -1.0792236328125, -0.67205810546875, -0.264892578125, 0.14227294921875, 0.5494384765625, 0.95660400390625, 1.36376953125, 1.77093505859375, 2.1781005859375, 2.58526611328125, 2.992431640625, 3.39959716796875, 3.8067626953125, 4.21392822265625, 4.62109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 7.0, 4.0, 7.0, 6.0, 16.0, 24.0, 26.0, 25.0, 45.0, 60.0, 61.0, 83.0, 97.0, 148.0, 272.0, 784.0, 3442.0, 33726.0, 846382.0, 152673.0, 8192.0, 1325.0, 407.0, 180.0, 120.0, 88.0, 76.0, 73.0, 45.0, 38.0, 28.0, 19.0, 20.0, 16.0, 10.0, 11.0, 5.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.24609375, -6.04278564453125, -5.8394775390625, -5.63616943359375, -5.432861328125, -5.22955322265625, -5.0262451171875, -4.82293701171875, -4.61962890625, -4.41632080078125, -4.2130126953125, -4.00970458984375, -3.806396484375, -3.60308837890625, -3.3997802734375, -3.19647216796875, -2.9931640625, -2.78985595703125, -2.5865478515625, -2.38323974609375, -2.179931640625, -1.97662353515625, -1.7733154296875, -1.57000732421875, -1.36669921875, -1.16339111328125, -0.9600830078125, -0.75677490234375, -0.553466796875, -0.35015869140625, -0.1468505859375, 0.05645751953125, 0.259765625, 0.46307373046875, 0.6663818359375, 0.86968994140625, 1.072998046875, 1.27630615234375, 1.4796142578125, 1.68292236328125, 1.88623046875, 2.08953857421875, 2.2928466796875, 2.49615478515625, 2.699462890625, 2.90277099609375, 3.1060791015625, 3.30938720703125, 3.5126953125, 3.71600341796875, 3.9193115234375, 4.12261962890625, 4.325927734375, 4.52923583984375, 4.7325439453125, 4.93585205078125, 5.13916015625, 5.34246826171875, 5.5457763671875, 5.74908447265625, 5.952392578125, 6.15570068359375, 6.3590087890625, 6.56231689453125, 6.765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 11.0, 20.0, 12.0, 22.0, 20.0, 33.0, 34.0, 34.0, 38.0, 50.0, 52.0, 51.0, 43.0, 44.0, 48.0, 66.0, 43.0, 47.0, 42.0, 42.0, 40.0, 31.0, 28.0, 31.0, 27.0, 22.0, 18.0, 13.0, 9.0, 4.0, 2.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-6.23828125, -6.07025146484375, -5.9022216796875, -5.73419189453125, -5.566162109375, -5.39813232421875, -5.2301025390625, -5.06207275390625, -4.89404296875, -4.72601318359375, -4.5579833984375, -4.38995361328125, -4.221923828125, -4.05389404296875, -3.8858642578125, -3.71783447265625, -3.5498046875, -3.38177490234375, -3.2137451171875, -3.04571533203125, -2.877685546875, -2.70965576171875, -2.5416259765625, -2.37359619140625, -2.20556640625, -2.03753662109375, -1.8695068359375, -1.70147705078125, -1.533447265625, -1.36541748046875, -1.1973876953125, -1.02935791015625, -0.861328125, -0.69329833984375, -0.5252685546875, -0.35723876953125, -0.189208984375, -0.02117919921875, 0.1468505859375, 0.31488037109375, 0.48291015625, 0.65093994140625, 0.8189697265625, 0.98699951171875, 1.155029296875, 1.32305908203125, 1.4910888671875, 1.65911865234375, 1.8271484375, 1.99517822265625, 2.1632080078125, 2.33123779296875, 2.499267578125, 2.66729736328125, 2.8353271484375, 3.00335693359375, 3.17138671875, 3.33941650390625, 3.5074462890625, 3.67547607421875, 3.843505859375, 4.01153564453125, 4.1795654296875, 4.34759521484375, 4.515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 3.0, 11.0, 4.0, 17.0, 15.0, 21.0, 22.0, 54.0, 67.0, 109.0, 168.0, 292.0, 474.0, 847.0, 1555.0, 3119.0, 6629.0, 16204.0, 44914.0, 164306.0, 514087.0, 208017.0, 54344.0, 18476.0, 7454.0, 3398.0, 1681.0, 945.0, 519.0, 290.0, 181.0, 121.0, 67.0, 50.0, 28.0, 18.0, 16.0, 5.0, 9.0, 3.0, 6.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5119857788085938, -0.4927215576171875, -0.47345733642578125, -0.454193115234375, -0.43492889404296875, -0.4156646728515625, -0.39640045166015625, -0.37713623046875, -0.35787200927734375, -0.3386077880859375, -0.31934356689453125, -0.300079345703125, -0.28081512451171875, -0.2615509033203125, -0.24228668212890625, -0.2230224609375, -0.20375823974609375, -0.1844940185546875, -0.16522979736328125, -0.145965576171875, -0.12670135498046875, -0.1074371337890625, -0.08817291259765625, -0.06890869140625, -0.04964447021484375, -0.0303802490234375, -0.01111602783203125, 0.008148193359375, 0.02741241455078125, 0.0466766357421875, 0.06594085693359375, 0.085205078125, 0.10446929931640625, 0.1237335205078125, 0.14299774169921875, 0.162261962890625, 0.18152618408203125, 0.2007904052734375, 0.22005462646484375, 0.23931884765625, 0.25858306884765625, 0.2778472900390625, 0.29711151123046875, 0.316375732421875, 0.33563995361328125, 0.3549041748046875, 0.37416839599609375, 0.3934326171875, 0.41269683837890625, 0.4319610595703125, 0.45122528076171875, 0.470489501953125, 0.48975372314453125, 0.5090179443359375, 0.5282821655273438, 0.54754638671875, 0.5668106079101562, 0.5860748291015625, 0.6053390502929688, 0.624603271484375, 0.6438674926757812, 0.6631317138671875, 0.6823959350585938, 0.70166015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 1.0, 6.0, 4.0, 17.0, 13.0, 10.0, 19.0, 30.0, 36.0, 45.0, 73.0, 85.0, 77.0, 88.0, 97.0, 94.0, 58.0, 60.0, 47.0, 31.0, 20.0, 15.0, 13.0, 15.0, 12.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00012350082397460938, -0.00011936761438846588, -0.00011523440480232239, -0.0001111011952161789, -0.0001069679856300354, -0.0001028347760438919, -9.870156645774841e-05, -9.456835687160492e-05, -9.043514728546143e-05, -8.630193769931793e-05, -8.216872811317444e-05, -7.803551852703094e-05, -7.390230894088745e-05, -6.976909935474396e-05, -6.563588976860046e-05, -6.150268018245697e-05, -5.7369470596313477e-05, -5.323626101016998e-05, -4.910305142402649e-05, -4.4969841837882996e-05, -4.08366322517395e-05, -3.670342266559601e-05, -3.2570213079452515e-05, -2.843700349330902e-05, -2.4303793907165527e-05, -2.0170584321022034e-05, -1.603737473487854e-05, -1.1904165148735046e-05, -7.770955562591553e-06, -3.637745976448059e-06, 4.954636096954346e-07, 4.628673195838928e-06, 8.761882781982422e-06, 1.2895092368125916e-05, 1.702830195426941e-05, 2.1161511540412903e-05, 2.5294721126556396e-05, 2.942793071269989e-05, 3.3561140298843384e-05, 3.769434988498688e-05, 4.182755947113037e-05, 4.5960769057273865e-05, 5.009397864341736e-05, 5.422718822956085e-05, 5.8360397815704346e-05, 6.249360740184784e-05, 6.662681698799133e-05, 7.076002657413483e-05, 7.489323616027832e-05, 7.902644574642181e-05, 8.315965533256531e-05, 8.72928649187088e-05, 9.14260745048523e-05, 9.555928409099579e-05, 9.969249367713928e-05, 0.00010382570326328278, 0.00010795891284942627, 0.00011209212243556976, 0.00011622533202171326, 0.00012035854160785675, 0.00012449175119400024, 0.00012862496078014374, 0.00013275817036628723, 0.00013689137995243073, 0.00014102458953857422]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 8.0, 8.0, 11.0, 17.0, 20.0, 28.0, 47.0, 86.0, 123.0, 182.0, 339.0, 562.0, 1142.0, 2651.0, 6641.0, 21524.0, 98873.0, 596953.0, 257356.0, 43035.0, 11348.0, 3923.0, 1696.0, 779.0, 447.0, 266.0, 155.0, 89.0, 71.0, 50.0, 38.0, 21.0, 14.0, 6.0, 8.0, 2.0, 7.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.93017578125, -0.9017715454101562, -0.8733673095703125, -0.8449630737304688, -0.816558837890625, -0.7881546020507812, -0.7597503662109375, -0.7313461303710938, -0.70294189453125, -0.6745376586914062, -0.6461334228515625, -0.6177291870117188, -0.589324951171875, -0.5609207153320312, -0.5325164794921875, -0.5041122436523438, -0.4757080078125, -0.44730377197265625, -0.4188995361328125, -0.39049530029296875, -0.362091064453125, -0.33368682861328125, -0.3052825927734375, -0.27687835693359375, -0.24847412109375, -0.22006988525390625, -0.1916656494140625, -0.16326141357421875, -0.134857177734375, -0.10645294189453125, -0.0780487060546875, -0.04964447021484375, -0.021240234375, 0.00716400146484375, 0.0355682373046875, 0.06397247314453125, 0.092376708984375, 0.12078094482421875, 0.1491851806640625, 0.17758941650390625, 0.20599365234375, 0.23439788818359375, 0.2628021240234375, 0.29120635986328125, 0.319610595703125, 0.34801483154296875, 0.3764190673828125, 0.40482330322265625, 0.4332275390625, 0.46163177490234375, 0.4900360107421875, 0.5184402465820312, 0.546844482421875, 0.5752487182617188, 0.6036529541015625, 0.6320571899414062, 0.66046142578125, 0.6888656616210938, 0.7172698974609375, 0.7456741333007812, 0.774078369140625, 0.8024826049804688, 0.8308868408203125, 0.8592910766601562, 0.8876953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 11.0, 13.0, 4.0, 6.0, 9.0, 10.0, 23.0, 18.0, 35.0, 39.0, 57.0, 67.0, 77.0, 104.0, 112.0, 69.0, 62.0, 67.0, 59.0, 33.0, 31.0, 19.0, 14.0, 16.0, 14.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.3756523132324219, -0.36238861083984375, -0.3491249084472656, -0.3358612060546875, -0.3225975036621094, -0.30933380126953125, -0.2960700988769531, -0.282806396484375, -0.2695426940917969, -0.25627899169921875, -0.24301528930664062, -0.2297515869140625, -0.21648788452148438, -0.20322418212890625, -0.18996047973632812, -0.17669677734375, -0.16343307495117188, -0.15016937255859375, -0.13690567016601562, -0.1236419677734375, -0.11037826538085938, -0.09711456298828125, -0.08385086059570312, -0.070587158203125, -0.057323455810546875, -0.04405975341796875, -0.030796051025390625, -0.0175323486328125, -0.004268646240234375, 0.00899505615234375, 0.022258758544921875, 0.0355224609375, 0.048786163330078125, 0.06204986572265625, 0.07531356811523438, 0.0885772705078125, 0.10184097290039062, 0.11510467529296875, 0.12836837768554688, 0.141632080078125, 0.15489578247070312, 0.16815948486328125, 0.18142318725585938, 0.1946868896484375, 0.20795059204101562, 0.22121429443359375, 0.23447799682617188, 0.24774169921875, 0.2610054016113281, 0.27426910400390625, 0.2875328063964844, 0.3007965087890625, 0.3140602111816406, 0.32732391357421875, 0.3405876159667969, 0.353851318359375, 0.3671150207519531, 0.38037872314453125, 0.3936424255371094, 0.4069061279296875, 0.4201698303222656, 0.43343353271484375, 0.4466972351074219, 0.4599609375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 23.0, 106.0, 559.0, 262.0, 41.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.55836868286133, -31.56367301940918, -30.56897735595703, -29.574281692504883, -28.579586029052734, -27.584890365600586, -26.590194702148438, -25.595497131347656, -24.60080337524414, -23.606107711791992, -22.611412048339844, -21.616716384887695, -20.622020721435547, -19.6273250579834, -18.63262939453125, -17.63793182373047, -16.64323616027832, -15.648540496826172, -14.653844833374023, -13.659149169921875, -12.664453506469727, -11.669757843017578, -10.675061225891113, -9.680365562438965, -8.685669898986816, -7.690974235534668, -6.6962785720825195, -5.701582431793213, -4.7068867683410645, -3.712191104888916, -2.7174949645996094, -1.722799301147461, -0.7281036376953125, 0.2665921449661255, 1.2612879276275635, 2.255983829498291, 3.2506794929504395, 4.245375156402588, 5.2400712966918945, 6.234766960144043, 7.229462623596191, 8.22415828704834, 9.218853950500488, 10.213550567626953, 11.208246231079102, 12.20294189453125, 13.197637557983398, 14.192333221435547, 15.187028884887695, 16.181724548339844, 17.176420211791992, 18.17111587524414, 19.16581153869629, 20.160507202148438, 21.15520477294922, 22.149898529052734, 23.144596099853516, 24.139291763305664, 25.133987426757812, 26.12868309020996, 27.12337875366211, 28.118074417114258, 29.112770080566406, 30.107467651367188, 31.102161407470703]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 14.0, 17.0, 20.0, 19.0, 28.0, 30.0, 52.0, 45.0, 59.0, 67.0, 63.0, 76.0, 62.0, 78.0, 66.0, 53.0, 53.0, 40.0, 35.0, 31.0, 22.0, 23.0, 15.0, 11.0, 5.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.181644439697266, -16.769371032714844, -16.357097625732422, -15.944825172424316, -15.532552719116211, -15.120279312133789, -14.708006858825684, -14.295733451843262, -13.883460998535156, -13.471187591552734, -13.058915138244629, -12.646641731262207, -12.234369277954102, -11.82209587097168, -11.409823417663574, -10.997550010681152, -10.585277557373047, -10.173004150390625, -9.76073169708252, -9.348458290100098, -8.936185836791992, -8.52391242980957, -8.111639976501465, -7.699366569519043, -7.287093162536621, -6.874820232391357, -6.462547302246094, -6.05027437210083, -5.638001441955566, -5.2257280349731445, -4.813455581665039, -4.401182174682617, -3.9889097213745117, -3.576636791229248, -3.1643638610839844, -2.7520909309387207, -2.339818000793457, -1.9275448322296143, -1.5152719020843506, -1.102998971939087, -0.6907260417938232, -0.2784530818462372, 0.13381987810134888, 0.5460928678512573, 0.958365797996521, 1.3706388473510742, 1.782911777496338, 2.1951847076416016, 2.6074576377868652, 3.019730567932129, 3.4320034980773926, 3.8442764282226562, 4.25654935836792, 4.668822288513184, 5.0810956954956055, 5.493368148803711, 5.905641555786133, 6.3179144859313965, 6.73018741607666, 7.142460346221924, 7.5547332763671875, 7.967006683349609, 8.379279136657715, 8.791552543640137, 9.203824996948242]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 6.0, 8.0, 9.0, 8.0, 10.0, 20.0, 15.0, 27.0, 24.0, 35.0, 64.0, 70.0, 77.0, 147.0, 175.0, 380.0, 958.0, 2851.0, 12565.0, 137615.0, 3896699.0, 125356.0, 12266.0, 2786.0, 960.0, 430.0, 236.0, 119.0, 112.0, 51.0, 43.0, 28.0, 22.0, 28.0, 18.0, 14.0, 18.0, 7.0, 9.0, 5.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6875, -5.512451171875, -5.33740234375, -5.162353515625, -4.9873046875, -4.812255859375, -4.63720703125, -4.462158203125, -4.287109375, -4.112060546875, -3.93701171875, -3.761962890625, -3.5869140625, -3.411865234375, -3.23681640625, -3.061767578125, -2.88671875, -2.711669921875, -2.53662109375, -2.361572265625, -2.1865234375, -2.011474609375, -1.83642578125, -1.661376953125, -1.486328125, -1.311279296875, -1.13623046875, -0.961181640625, -0.7861328125, -0.611083984375, -0.43603515625, -0.260986328125, -0.0859375, 0.089111328125, 0.26416015625, 0.439208984375, 0.6142578125, 0.789306640625, 0.96435546875, 1.139404296875, 1.314453125, 1.489501953125, 1.66455078125, 1.839599609375, 2.0146484375, 2.189697265625, 2.36474609375, 2.539794921875, 2.71484375, 2.889892578125, 3.06494140625, 3.239990234375, 3.4150390625, 3.590087890625, 3.76513671875, 3.940185546875, 4.115234375, 4.290283203125, 4.46533203125, 4.640380859375, 4.8154296875, 4.990478515625, 5.16552734375, 5.340576171875, 5.515625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 4.0, 9.0, 7.0, 15.0, 22.0, 27.0, 22.0, 39.0, 41.0, 48.0, 70.0, 68.0, 71.0, 63.0, 74.0, 62.0, 66.0, 48.0, 44.0, 30.0, 31.0, 31.0, 15.0, 18.0, 13.0, 14.0, 6.0, 7.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.62890625, -2.548675537109375, -2.46844482421875, -2.388214111328125, -2.3079833984375, -2.227752685546875, -2.14752197265625, -2.067291259765625, -1.987060546875, -1.906829833984375, -1.82659912109375, -1.746368408203125, -1.6661376953125, -1.585906982421875, -1.50567626953125, -1.425445556640625, -1.34521484375, -1.264984130859375, -1.18475341796875, -1.104522705078125, -1.0242919921875, -0.944061279296875, -0.86383056640625, -0.783599853515625, -0.703369140625, -0.623138427734375, -0.54290771484375, -0.462677001953125, -0.3824462890625, -0.302215576171875, -0.22198486328125, -0.141754150390625, -0.0615234375, 0.018707275390625, 0.09893798828125, 0.179168701171875, 0.2593994140625, 0.339630126953125, 0.41986083984375, 0.500091552734375, 0.580322265625, 0.660552978515625, 0.74078369140625, 0.821014404296875, 0.9012451171875, 0.981475830078125, 1.06170654296875, 1.141937255859375, 1.22216796875, 1.302398681640625, 1.38262939453125, 1.462860107421875, 1.5430908203125, 1.623321533203125, 1.70355224609375, 1.783782958984375, 1.864013671875, 1.944244384765625, 2.02447509765625, 2.104705810546875, 2.1849365234375, 2.265167236328125, 2.34539794921875, 2.425628662109375, 2.505859375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 2.0, 4.0, 5.0, 13.0, 10.0, 34.0, 23.0, 41.0, 76.0, 135.0, 248.0, 795.0, 4284.0, 99885.0, 4060329.0, 25237.0, 2206.0, 484.0, 179.0, 91.0, 59.0, 24.0, 22.0, 16.0, 21.0, 8.0, 4.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.29833984375, -9.0107421875, -8.72314453125, -8.435546875, -8.14794921875, -7.8603515625, -7.57275390625, -7.28515625, -6.99755859375, -6.7099609375, -6.42236328125, -6.134765625, -5.84716796875, -5.5595703125, -5.27197265625, -4.984375, -4.69677734375, -4.4091796875, -4.12158203125, -3.833984375, -3.54638671875, -3.2587890625, -2.97119140625, -2.68359375, -2.39599609375, -2.1083984375, -1.82080078125, -1.533203125, -1.24560546875, -0.9580078125, -0.67041015625, -0.3828125, -0.09521484375, 0.1923828125, 0.47998046875, 0.767578125, 1.05517578125, 1.3427734375, 1.63037109375, 1.91796875, 2.20556640625, 2.4931640625, 2.78076171875, 3.068359375, 3.35595703125, 3.6435546875, 3.93115234375, 4.21875, 4.50634765625, 4.7939453125, 5.08154296875, 5.369140625, 5.65673828125, 5.9443359375, 6.23193359375, 6.51953125, 6.80712890625, 7.0947265625, 7.38232421875, 7.669921875, 7.95751953125, 8.2451171875, 8.53271484375, 8.8203125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 13.0, 12.0, 11.0, 34.0, 16.0, 55.0, 87.0, 136.0, 239.0, 584.0, 1632.0, 598.0, 262.0, 134.0, 76.0, 55.0, 29.0, 25.0, 23.0, 12.0, 10.0, 6.0, 3.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.9434814453125, -0.910400390625, -0.8773193359375, -0.84423828125, -0.8111572265625, -0.778076171875, -0.7449951171875, -0.7119140625, -0.6788330078125, -0.645751953125, -0.6126708984375, -0.57958984375, -0.5465087890625, -0.513427734375, -0.4803466796875, -0.447265625, -0.4141845703125, -0.381103515625, -0.3480224609375, -0.31494140625, -0.2818603515625, -0.248779296875, -0.2156982421875, -0.1826171875, -0.1495361328125, -0.116455078125, -0.0833740234375, -0.05029296875, -0.0172119140625, 0.015869140625, 0.0489501953125, 0.08203125, 0.1151123046875, 0.148193359375, 0.1812744140625, 0.21435546875, 0.2474365234375, 0.280517578125, 0.3135986328125, 0.3466796875, 0.3797607421875, 0.412841796875, 0.4459228515625, 0.47900390625, 0.5120849609375, 0.545166015625, 0.5782470703125, 0.611328125, 0.6444091796875, 0.677490234375, 0.7105712890625, 0.74365234375, 0.7767333984375, 0.809814453125, 0.8428955078125, 0.8759765625, 0.9090576171875, 0.942138671875, 0.9752197265625, 1.00830078125, 1.0413818359375, 1.074462890625, 1.1075439453125, 1.140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 10.0, 2.0, 6.0, 2.0, 7.0, 3.0, 10.0, 9.0, 9.0, 16.0, 21.0, 21.0, 33.0, 57.0, 78.0, 77.0, 107.0, 104.0, 99.0, 73.0, 60.0, 43.0, 24.0, 32.0, 30.0, 15.0, 12.0, 8.0, 7.0, 2.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.676827907562256, -2.5784897804260254, -2.480151653289795, -2.3818135261535645, -2.283475160598755, -2.1851370334625244, -2.086798906326294, -1.9884607791900635, -1.8901225328445435, -1.791784405708313, -1.693446159362793, -1.5951080322265625, -1.496769905090332, -1.398431658744812, -1.3000935316085815, -1.2017552852630615, -1.103417158126831, -1.0050790309906006, -0.9067407846450806, -0.8084026575088501, -0.7100644707679749, -0.6117262840270996, -0.5133881568908691, -0.4150499701499939, -0.31671178340911865, -0.2183736115694046, -0.12003543972969055, -0.021697282791137695, 0.07664090394973755, 0.1749790906906128, 0.27331721782684326, 0.3716554045677185, 0.46999359130859375, 0.568331778049469, 0.6666699647903442, 0.7650080919265747, 0.86334627866745, 0.9616844654083252, 1.0600225925445557, 1.1583607196807861, 1.2566989660263062, 1.3550370931625366, 1.4533753395080566, 1.551713466644287, 1.6500515937805176, 1.7483898401260376, 1.846727967262268, 1.945066213607788, 2.0434043407440186, 2.141742467880249, 2.2400805950164795, 2.338418960571289, 2.4367570877075195, 2.53509521484375, 2.6334333419799805, 2.731771469116211, 2.8301095962524414, 2.928447723388672, 3.0267858505249023, 3.125123977661133, 3.2234623432159424, 3.321800470352173, 3.4201385974884033, 3.518476724624634, 3.6168150901794434]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 10.0, 5.0, 13.0, 9.0, 15.0, 15.0, 29.0, 25.0, 37.0, 39.0, 51.0, 60.0, 51.0, 60.0, 61.0, 52.0, 55.0, 49.0, 51.0, 46.0, 43.0, 28.0, 32.0, 26.0, 25.0, 27.0, 15.0, 14.0, 12.0, 10.0, 4.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.384866952896118, -2.3088696002960205, -2.232872486114502, -2.1568751335144043, -2.0808777809143066, -2.004880666732788, -1.9288833141326904, -1.8528860807418823, -1.7768888473510742, -1.7008916139602661, -1.624894380569458, -1.5488970279693604, -1.4728997945785522, -1.3969025611877441, -1.3209052085876465, -1.2449079751968384, -1.1689107418060303, -1.0929135084152222, -1.016916275024414, -0.9409189224243164, -0.8649216890335083, -0.7889244556427002, -0.7129271626472473, -0.6369298696517944, -0.5609326362609863, -0.48493537306785583, -0.40893810987472534, -0.33294084668159485, -0.25694358348846436, -0.18094632029533386, -0.10494905710220337, -0.02895176410675049, 0.047045230865478516, 0.12304249405860901, 0.1990397572517395, 0.27503702044487, 0.3510342836380005, 0.427031546831131, 0.5030288100242615, 0.5790261030197144, 0.6550233364105225, 0.7310205698013306, 0.8070178627967834, 0.8830151557922363, 0.9590123891830444, 1.0350096225738525, 1.1110069751739502, 1.1870042085647583, 1.2630014419555664, 1.3389986753463745, 1.4149959087371826, 1.4909932613372803, 1.5669904947280884, 1.6429877281188965, 1.7189850807189941, 1.7949823141098022, 1.8709795475006104, 1.9469767808914185, 2.0229740142822266, 2.098971366882324, 2.174968719482422, 2.2509658336639404, 2.326963186264038, 2.4029603004455566, 2.4789576530456543]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 2.0, 7.0, 14.0, 7.0, 30.0, 53.0, 68.0, 86.0, 125.0, 265.0, 421.0, 779.0, 1354.0, 2672.0, 5580.0, 12198.0, 29630.0, 80675.0, 221649.0, 368276.0, 202828.0, 72691.0, 27167.0, 11463.0, 5150.0, 2448.0, 1237.0, 660.0, 395.0, 235.0, 124.0, 88.0, 54.0, 43.0, 26.0, 9.0, 12.0, 7.0, 12.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2457275390625, -0.23815536499023438, -0.23058319091796875, -0.22301101684570312, -0.2154388427734375, -0.20786666870117188, -0.20029449462890625, -0.19272232055664062, -0.185150146484375, -0.17757797241210938, -0.17000579833984375, -0.16243362426757812, -0.1548614501953125, -0.14728927612304688, -0.13971710205078125, -0.13214492797851562, -0.12457275390625, -0.11700057983398438, -0.10942840576171875, -0.10185623168945312, -0.0942840576171875, -0.08671188354492188, -0.07913970947265625, -0.07156753540039062, -0.063995361328125, -0.056423187255859375, -0.04885101318359375, -0.041278839111328125, -0.0337066650390625, -0.026134490966796875, -0.01856231689453125, -0.010990142822265625, -0.00341796875, 0.004154205322265625, 0.01172637939453125, 0.019298553466796875, 0.0268707275390625, 0.034442901611328125, 0.04201507568359375, 0.049587249755859375, 0.057159423828125, 0.06473159790039062, 0.07230377197265625, 0.07987594604492188, 0.0874481201171875, 0.09502029418945312, 0.10259246826171875, 0.11016464233398438, 0.11773681640625, 0.12530899047851562, 0.13288116455078125, 0.14045333862304688, 0.1480255126953125, 0.15559768676757812, 0.16316986083984375, 0.17074203491210938, 0.178314208984375, 0.18588638305664062, 0.19345855712890625, 0.20103073120117188, 0.2086029052734375, 0.21617507934570312, 0.22374725341796875, 0.23131942749023438, 0.2388916015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 5.0, 5.0, 10.0, 17.0, 11.0, 17.0, 37.0, 53.0, 52.0, 64.0, 74.0, 101.0, 88.0, 82.0, 65.0, 70.0, 46.0, 43.0, 40.0, 22.0, 20.0, 27.0, 12.0, 10.0, 9.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.90234375, -2.82733154296875, -2.7523193359375, -2.67730712890625, -2.602294921875, -2.52728271484375, -2.4522705078125, -2.37725830078125, -2.30224609375, -2.22723388671875, -2.1522216796875, -2.07720947265625, -2.002197265625, -1.92718505859375, -1.8521728515625, -1.77716064453125, -1.7021484375, -1.62713623046875, -1.5521240234375, -1.47711181640625, -1.402099609375, -1.32708740234375, -1.2520751953125, -1.17706298828125, -1.10205078125, -1.02703857421875, -0.9520263671875, -0.87701416015625, -0.802001953125, -0.72698974609375, -0.6519775390625, -0.57696533203125, -0.501953125, -0.42694091796875, -0.3519287109375, -0.27691650390625, -0.201904296875, -0.12689208984375, -0.0518798828125, 0.02313232421875, 0.09814453125, 0.17315673828125, 0.2481689453125, 0.32318115234375, 0.398193359375, 0.47320556640625, 0.5482177734375, 0.62322998046875, 0.6982421875, 0.77325439453125, 0.8482666015625, 0.92327880859375, 0.998291015625, 1.07330322265625, 1.1483154296875, 1.22332763671875, 1.29833984375, 1.37335205078125, 1.4483642578125, 1.52337646484375, 1.598388671875, 1.67340087890625, 1.7484130859375, 1.82342529296875, 1.8984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 6.0, 7.0, 8.0, 1.0, 21.0, 17.0, 27.0, 46.0, 45.0, 88.0, 105.0, 120.0, 197.0, 358.0, 535.0, 875.0, 1592.0, 3433.0, 8473.0, 24553.0, 79099.0, 239742.0, 388488.0, 203819.0, 63299.0, 19939.0, 7246.0, 2949.0, 1384.0, 746.0, 418.0, 265.0, 187.0, 126.0, 94.0, 64.0, 54.0, 36.0, 31.0, 19.0, 10.0, 9.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2359619140625, -0.2276592254638672, -0.21935653686523438, -0.21105384826660156, -0.20275115966796875, -0.19444847106933594, -0.18614578247070312, -0.1778430938720703, -0.1695404052734375, -0.1612377166748047, -0.15293502807617188, -0.14463233947753906, -0.13632965087890625, -0.12802696228027344, -0.11972427368164062, -0.11142158508300781, -0.103118896484375, -0.09481620788574219, -0.08651351928710938, -0.07821083068847656, -0.06990814208984375, -0.06160545349121094, -0.053302764892578125, -0.04500007629394531, -0.0366973876953125, -0.028394699096679688, -0.020092010498046875, -0.011789321899414062, -0.00348663330078125, 0.0048160552978515625, 0.013118743896484375, 0.021421432495117188, 0.02972412109375, 0.03802680969238281, 0.046329498291015625, 0.05463218688964844, 0.06293487548828125, 0.07123756408691406, 0.07954025268554688, 0.08784294128417969, 0.0961456298828125, 0.10444831848144531, 0.11275100708007812, 0.12105369567871094, 0.12935638427734375, 0.13765907287597656, 0.14596176147460938, 0.1542644500732422, 0.162567138671875, 0.1708698272705078, 0.17917251586914062, 0.18747520446777344, 0.19577789306640625, 0.20408058166503906, 0.21238327026367188, 0.2206859588623047, 0.2289886474609375, 0.2372913360595703, 0.24559402465820312, 0.25389671325683594, 0.26219940185546875, 0.27050209045410156, 0.2788047790527344, 0.2871074676513672, 0.29541015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 13.0, 8.0, 7.0, 14.0, 27.0, 16.0, 22.0, 21.0, 36.0, 45.0, 39.0, 44.0, 48.0, 44.0, 51.0, 53.0, 52.0, 50.0, 52.0, 51.0, 35.0, 55.0, 38.0, 39.0, 30.0, 27.0, 8.0, 13.0, 17.0, 7.0, 5.0, 6.0, 6.0, 1.0, 4.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.794921875, -3.69329833984375, -3.5916748046875, -3.49005126953125, -3.388427734375, -3.28680419921875, -3.1851806640625, -3.08355712890625, -2.98193359375, -2.88031005859375, -2.7786865234375, -2.67706298828125, -2.575439453125, -2.47381591796875, -2.3721923828125, -2.27056884765625, -2.1689453125, -2.06732177734375, -1.9656982421875, -1.86407470703125, -1.762451171875, -1.66082763671875, -1.5592041015625, -1.45758056640625, -1.35595703125, -1.25433349609375, -1.1527099609375, -1.05108642578125, -0.949462890625, -0.84783935546875, -0.7462158203125, -0.64459228515625, -0.54296875, -0.44134521484375, -0.3397216796875, -0.23809814453125, -0.136474609375, -0.03485107421875, 0.0667724609375, 0.16839599609375, 0.27001953125, 0.37164306640625, 0.4732666015625, 0.57489013671875, 0.676513671875, 0.77813720703125, 0.8797607421875, 0.98138427734375, 1.0830078125, 1.18463134765625, 1.2862548828125, 1.38787841796875, 1.489501953125, 1.59112548828125, 1.6927490234375, 1.79437255859375, 1.89599609375, 1.99761962890625, 2.0992431640625, 2.20086669921875, 2.302490234375, 2.40411376953125, 2.5057373046875, 2.60736083984375, 2.708984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 5.0, 16.0, 19.0, 26.0, 39.0, 60.0, 66.0, 103.0, 186.0, 321.0, 494.0, 958.0, 2044.0, 5114.0, 16498.0, 74225.0, 383241.0, 445559.0, 89533.0, 19422.0, 5887.0, 2233.0, 1075.0, 505.0, 309.0, 205.0, 110.0, 89.0, 49.0, 32.0, 30.0, 24.0, 20.0, 7.0, 7.0, 2.0, 5.0, 3.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.123046875, -0.11881256103515625, -0.1145782470703125, -0.11034393310546875, -0.106109619140625, -0.10187530517578125, -0.0976409912109375, -0.09340667724609375, -0.08917236328125, -0.08493804931640625, -0.0807037353515625, -0.07646942138671875, -0.072235107421875, -0.06800079345703125, -0.0637664794921875, -0.05953216552734375, -0.0552978515625, -0.05106353759765625, -0.0468292236328125, -0.04259490966796875, -0.038360595703125, -0.03412628173828125, -0.0298919677734375, -0.02565765380859375, -0.02142333984375, -0.01718902587890625, -0.0129547119140625, -0.00872039794921875, -0.004486083984375, -0.00025177001953125, 0.0039825439453125, 0.00821685791015625, 0.012451171875, 0.01668548583984375, 0.0209197998046875, 0.02515411376953125, 0.029388427734375, 0.03362274169921875, 0.0378570556640625, 0.04209136962890625, 0.04632568359375, 0.05055999755859375, 0.0547943115234375, 0.05902862548828125, 0.063262939453125, 0.06749725341796875, 0.0717315673828125, 0.07596588134765625, 0.0802001953125, 0.08443450927734375, 0.0886688232421875, 0.09290313720703125, 0.097137451171875, 0.10137176513671875, 0.1056060791015625, 0.10984039306640625, 0.11407470703125, 0.11830902099609375, 0.1225433349609375, 0.12677764892578125, 0.131011962890625, 0.13524627685546875, 0.1394805908203125, 0.14371490478515625, 0.14794921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 6.0, 6.0, 11.0, 15.0, 14.0, 34.0, 47.0, 54.0, 81.0, 85.0, 108.0, 115.0, 100.0, 86.0, 64.0, 45.0, 32.0, 27.0, 20.0, 17.0, 15.0, 2.0, 8.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001232624053955078, -0.00012029241770505905, -0.00011732243001461029, -0.00011435244232416153, -0.00011138245463371277, -0.00010841246694326401, -0.00010544247925281525, -0.00010247249156236649, -9.950250387191772e-05, -9.653251618146896e-05, -9.35625284910202e-05, -9.059254080057144e-05, -8.762255311012268e-05, -8.465256541967392e-05, -8.168257772922516e-05, -7.87125900387764e-05, -7.574260234832764e-05, -7.277261465787888e-05, -6.980262696743011e-05, -6.683263927698135e-05, -6.386265158653259e-05, -6.089266389608383e-05, -5.792267620563507e-05, -5.495268851518631e-05, -5.198270082473755e-05, -4.901271313428879e-05, -4.604272544384003e-05, -4.3072737753391266e-05, -4.0102750062942505e-05, -3.7132762372493744e-05, -3.416277468204498e-05, -3.119278699159622e-05, -2.822279930114746e-05, -2.52528116106987e-05, -2.228282392024994e-05, -1.9312836229801178e-05, -1.6342848539352417e-05, -1.3372860848903656e-05, -1.0402873158454895e-05, -7.432885468006134e-06, -4.462897777557373e-06, -1.492910087108612e-06, 1.477077603340149e-06, 4.44706529378891e-06, 7.417052984237671e-06, 1.0387040674686432e-05, 1.3357028365135193e-05, 1.6327016055583954e-05, 1.9297003746032715e-05, 2.2266991436481476e-05, 2.5236979126930237e-05, 2.8206966817378998e-05, 3.117695450782776e-05, 3.414694219827652e-05, 3.711692988872528e-05, 4.008691757917404e-05, 4.30569052696228e-05, 4.6026892960071564e-05, 4.8996880650520325e-05, 5.1966868340969086e-05, 5.493685603141785e-05, 5.790684372186661e-05, 6.087683141231537e-05, 6.384681910276413e-05, 6.681680679321289e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 9.0, 19.0, 28.0, 37.0, 55.0, 97.0, 249.0, 640.0, 2083.0, 9092.0, 71176.0, 704578.0, 234217.0, 20740.0, 3763.0, 1044.0, 341.0, 153.0, 93.0, 36.0, 34.0, 20.0, 17.0, 4.0, 11.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1907958984375, -0.18437767028808594, -0.17795944213867188, -0.1715412139892578, -0.16512298583984375, -0.1587047576904297, -0.15228652954101562, -0.14586830139160156, -0.1394500732421875, -0.13303184509277344, -0.12661361694335938, -0.12019538879394531, -0.11377716064453125, -0.10735893249511719, -0.10094070434570312, -0.09452247619628906, -0.088104248046875, -0.08168601989746094, -0.07526779174804688, -0.06884956359863281, -0.06243133544921875, -0.05601310729980469, -0.049594879150390625, -0.04317665100097656, -0.0367584228515625, -0.030340194702148438, -0.023921966552734375, -0.017503738403320312, -0.01108551025390625, -0.0046672821044921875, 0.001750946044921875, 0.008169174194335938, 0.01458740234375, 0.021005630493164062, 0.027423858642578125, 0.03384208679199219, 0.04026031494140625, 0.04667854309082031, 0.053096771240234375, 0.05951499938964844, 0.0659332275390625, 0.07235145568847656, 0.07876968383789062, 0.08518791198730469, 0.09160614013671875, 0.09802436828613281, 0.10444259643554688, 0.11086082458496094, 0.117279052734375, 0.12369728088378906, 0.13011550903320312, 0.1365337371826172, 0.14295196533203125, 0.1493701934814453, 0.15578842163085938, 0.16220664978027344, 0.1686248779296875, 0.17504310607910156, 0.18146133422851562, 0.1878795623779297, 0.19429779052734375, 0.2007160186767578, 0.20713424682617188, 0.21355247497558594, 0.219970703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 9.0, 6.0, 11.0, 12.0, 17.0, 22.0, 28.0, 44.0, 50.0, 50.0, 64.0, 89.0, 99.0, 82.0, 74.0, 70.0, 62.0, 35.0, 43.0, 30.0, 28.0, 15.0, 14.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0281829833984375, -0.02735733985900879, -0.026531696319580078, -0.025706052780151367, -0.024880409240722656, -0.024054765701293945, -0.023229122161865234, -0.022403478622436523, -0.021577835083007812, -0.0207521915435791, -0.01992654800415039, -0.01910090446472168, -0.01827526092529297, -0.017449617385864258, -0.016623973846435547, -0.015798330307006836, -0.014972686767578125, -0.014147043228149414, -0.013321399688720703, -0.012495756149291992, -0.011670112609863281, -0.01084446907043457, -0.01001882553100586, -0.009193181991577148, -0.008367538452148438, -0.0075418949127197266, -0.006716251373291016, -0.005890607833862305, -0.005064964294433594, -0.004239320755004883, -0.003413677215576172, -0.002588033676147461, -0.00176239013671875, -0.0009367465972900391, -0.00011110305786132812, 0.0007145404815673828, 0.0015401840209960938, 0.0023658275604248047, 0.0031914710998535156, 0.0040171146392822266, 0.0048427581787109375, 0.0056684017181396484, 0.006494045257568359, 0.00731968879699707, 0.008145332336425781, 0.008970975875854492, 0.009796619415283203, 0.010622262954711914, 0.011447906494140625, 0.012273550033569336, 0.013099193572998047, 0.013924837112426758, 0.014750480651855469, 0.01557612419128418, 0.01640176773071289, 0.0172274112701416, 0.018053054809570312, 0.018878698348999023, 0.019704341888427734, 0.020529985427856445, 0.021355628967285156, 0.022181272506713867, 0.023006916046142578, 0.02383255958557129, 0.024658203125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 3.0, 13.0, 8.0, 11.0, 10.0, 24.0, 31.0, 44.0, 89.0, 133.0, 150.0, 155.0, 101.0, 62.0, 53.0, 28.0, 25.0, 10.0, 12.0, 1.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9297759532928467, -1.8323655128479004, -1.734955072402954, -1.6375447511672974, -1.540134310722351, -1.4427238702774048, -1.345313549041748, -1.2479031085968018, -1.1504926681518555, -1.0530822277069092, -0.9556718468666077, -0.8582614660263062, -0.7608510255813599, -0.6634405851364136, -0.5660302042961121, -0.46861982345581055, -0.37120938301086426, -0.27379897236824036, -0.17638856172561646, -0.07897815108299255, 0.018432259559631348, 0.11584267020225525, 0.21325308084487915, 0.31066346168518066, 0.40807390213012695, 0.5054843425750732, 0.6028947234153748, 0.7003051042556763, 0.7977155447006226, 0.8951259851455688, 0.9925363659858704, 1.0899467468261719, 1.1873574256896973, 1.2847678661346436, 1.3821783065795898, 1.4795886278152466, 1.5769990682601929, 1.6744095087051392, 1.771819829940796, 1.8692302703857422, 1.9666407108306885, 2.0640511512756348, 2.161461591720581, 2.2588720321655273, 2.3562822341918945, 2.453692674636841, 2.551103115081787, 2.6485135555267334, 2.7459239959716797, 2.843334436416626, 2.9407448768615723, 3.0381553173065186, 3.135565757751465, 3.232975959777832, 3.3303864002227783, 3.4277968406677246, 3.525207281112671, 3.622617721557617, 3.7200281620025635, 3.8174386024475098, 3.914848804473877, 4.012259483337402, 4.1096696853637695, 4.207079887390137, 4.304490566253662]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 9.0, 5.0, 4.0, 11.0, 14.0, 21.0, 16.0, 38.0, 51.0, 59.0, 78.0, 85.0, 90.0, 89.0, 84.0, 65.0, 66.0, 42.0, 44.0, 32.0, 31.0, 21.0, 14.0, 13.0, 5.0, 7.0, 2.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.9620790481567383, -2.8868136405944824, -2.8115482330322266, -2.7362828254699707, -2.661017417907715, -2.585752010345459, -2.510486602783203, -2.435220956802368, -2.3599555492401123, -2.2846901416778564, -2.2094247341156006, -2.1341593265533447, -2.058893918991089, -1.9836283922195435, -1.9083629846572876, -1.8330974578857422, -1.7578321695327759, -1.68256676197052, -1.6073013544082642, -1.5320358276367188, -1.456770420074463, -1.381505012512207, -1.3062396049499512, -1.2309741973876953, -1.1557087898254395, -1.0804433822631836, -1.0051779747009277, -0.9299125075340271, -0.8546470403671265, -0.7793816328048706, -0.7041162252426147, -0.6288507580757141, -0.5535851716995239, -0.4783197343349457, -0.40305429697036743, -0.3277888894081116, -0.2525234520435333, -0.17725801467895508, -0.10199260711669922, -0.026727139949798584, 0.048538267612457275, 0.12380369752645493, 0.19906912744045258, 0.27433454990386963, 0.3495999872684479, 0.4248654246330261, 0.500130832195282, 0.5753962993621826, 0.6506617069244385, 0.7259271144866943, 0.801192581653595, 0.8764579892158508, 0.9517234563827515, 1.0269888639450073, 1.1022542715072632, 1.1775197982788086, 1.2527852058410645, 1.3280506134033203, 1.4033160209655762, 1.478581428527832, 1.5538469552993774, 1.6291123628616333, 1.7043777704238892, 1.7796432971954346, 1.8549085855484009]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 5.0, 15.0, 22.0, 18.0, 57.0, 83.0, 180.0, 453.0, 1308.0, 4412.0, 20735.0, 177501.0, 756125.0, 71941.0, 11362.0, 2756.0, 843.0, 364.0, 151.0, 81.0, 32.0, 27.0, 15.0, 9.0, 12.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55859375, -3.44122314453125, -3.3238525390625, -3.20648193359375, -3.089111328125, -2.97174072265625, -2.8543701171875, -2.73699951171875, -2.61962890625, -2.50225830078125, -2.3848876953125, -2.26751708984375, -2.150146484375, -2.03277587890625, -1.9154052734375, -1.79803466796875, -1.6806640625, -1.56329345703125, -1.4459228515625, -1.32855224609375, -1.211181640625, -1.09381103515625, -0.9764404296875, -0.85906982421875, -0.74169921875, -0.62432861328125, -0.5069580078125, -0.38958740234375, -0.272216796875, -0.15484619140625, -0.0374755859375, 0.07989501953125, 0.197265625, 0.31463623046875, 0.4320068359375, 0.54937744140625, 0.666748046875, 0.78411865234375, 0.9014892578125, 1.01885986328125, 1.13623046875, 1.25360107421875, 1.3709716796875, 1.48834228515625, 1.605712890625, 1.72308349609375, 1.8404541015625, 1.95782470703125, 2.0751953125, 2.19256591796875, 2.3099365234375, 2.42730712890625, 2.544677734375, 2.66204833984375, 2.7794189453125, 2.89678955078125, 3.01416015625, 3.13153076171875, 3.2489013671875, 3.36627197265625, 3.483642578125, 3.60101318359375, 3.7183837890625, 3.83575439453125, 3.953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 9.0, 20.0, 33.0, 78.0, 142.0, 176.0, 184.0, 151.0, 89.0, 57.0, 35.0, 19.0, 8.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-20.765625, -20.36798095703125, -19.9703369140625, -19.57269287109375, -19.175048828125, -18.77740478515625, -18.3797607421875, -17.98211669921875, -17.58447265625, -17.18682861328125, -16.7891845703125, -16.39154052734375, -15.993896484375, -15.59625244140625, -15.1986083984375, -14.80096435546875, -14.4033203125, -14.00567626953125, -13.6080322265625, -13.21038818359375, -12.812744140625, -12.41510009765625, -12.0174560546875, -11.61981201171875, -11.22216796875, -10.82452392578125, -10.4268798828125, -10.02923583984375, -9.631591796875, -9.23394775390625, -8.8363037109375, -8.43865966796875, -8.041015625, -7.64337158203125, -7.2457275390625, -6.84808349609375, -6.450439453125, -6.05279541015625, -5.6551513671875, -5.25750732421875, -4.85986328125, -4.46221923828125, -4.0645751953125, -3.66693115234375, -3.269287109375, -2.87164306640625, -2.4739990234375, -2.07635498046875, -1.6787109375, -1.28106689453125, -0.8834228515625, -0.48577880859375, -0.088134765625, 0.30950927734375, 0.7071533203125, 1.10479736328125, 1.50244140625, 1.90008544921875, 2.2977294921875, 2.69537353515625, 3.093017578125, 3.49066162109375, 3.8883056640625, 4.28594970703125, 4.68359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 7.0, 10.0, 7.0, 11.0, 22.0, 36.0, 51.0, 75.0, 113.0, 214.0, 350.0, 771.0, 1997.0, 7234.0, 47887.0, 756436.0, 208986.0, 18030.0, 3902.0, 1215.0, 510.0, 278.0, 159.0, 61.0, 56.0, 38.0, 38.0, 23.0, 10.0, 12.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.916015625, -2.82122802734375, -2.7264404296875, -2.63165283203125, -2.536865234375, -2.44207763671875, -2.3472900390625, -2.25250244140625, -2.15771484375, -2.06292724609375, -1.9681396484375, -1.87335205078125, -1.778564453125, -1.68377685546875, -1.5889892578125, -1.49420166015625, -1.3994140625, -1.30462646484375, -1.2098388671875, -1.11505126953125, -1.020263671875, -0.92547607421875, -0.8306884765625, -0.73590087890625, -0.64111328125, -0.54632568359375, -0.4515380859375, -0.35675048828125, -0.261962890625, -0.16717529296875, -0.0723876953125, 0.02239990234375, 0.1171875, 0.21197509765625, 0.3067626953125, 0.40155029296875, 0.496337890625, 0.59112548828125, 0.6859130859375, 0.78070068359375, 0.87548828125, 0.97027587890625, 1.0650634765625, 1.15985107421875, 1.254638671875, 1.34942626953125, 1.4442138671875, 1.53900146484375, 1.6337890625, 1.72857666015625, 1.8233642578125, 1.91815185546875, 2.012939453125, 2.10772705078125, 2.2025146484375, 2.29730224609375, 2.39208984375, 2.48687744140625, 2.5816650390625, 2.67645263671875, 2.771240234375, 2.86602783203125, 2.9608154296875, 3.05560302734375, 3.150390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 7.0, 10.0, 12.0, 17.0, 13.0, 17.0, 26.0, 30.0, 26.0, 26.0, 39.0, 38.0, 38.0, 31.0, 41.0, 38.0, 41.0, 37.0, 44.0, 45.0, 45.0, 38.0, 39.0, 36.0, 41.0, 32.0, 19.0, 26.0, 20.0, 18.0, 10.0, 11.0, 8.0, 13.0, 7.0, 8.0, 12.0, 5.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.1112060546875, -3.976318359375, -3.8414306640625, -3.70654296875, -3.5716552734375, -3.436767578125, -3.3018798828125, -3.1669921875, -3.0321044921875, -2.897216796875, -2.7623291015625, -2.62744140625, -2.4925537109375, -2.357666015625, -2.2227783203125, -2.087890625, -1.9530029296875, -1.818115234375, -1.6832275390625, -1.54833984375, -1.4134521484375, -1.278564453125, -1.1436767578125, -1.0087890625, -0.8739013671875, -0.739013671875, -0.6041259765625, -0.46923828125, -0.3343505859375, -0.199462890625, -0.0645751953125, 0.0703125, 0.2052001953125, 0.340087890625, 0.4749755859375, 0.60986328125, 0.7447509765625, 0.879638671875, 1.0145263671875, 1.1494140625, 1.2843017578125, 1.419189453125, 1.5540771484375, 1.68896484375, 1.8238525390625, 1.958740234375, 2.0936279296875, 2.228515625, 2.3634033203125, 2.498291015625, 2.6331787109375, 2.76806640625, 2.9029541015625, 3.037841796875, 3.1727294921875, 3.3076171875, 3.4425048828125, 3.577392578125, 3.7122802734375, 3.84716796875, 3.9820556640625, 4.116943359375, 4.2518310546875, 4.38671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 6.0, 4.0, 3.0, 4.0, 10.0, 14.0, 13.0, 14.0, 30.0, 34.0, 39.0, 74.0, 69.0, 108.0, 188.0, 244.0, 420.0, 611.0, 1065.0, 1843.0, 3390.0, 6355.0, 13637.0, 32414.0, 92517.0, 356980.0, 377154.0, 97465.0, 34458.0, 14420.0, 6752.0, 3328.0, 1849.0, 1075.0, 678.0, 430.0, 293.0, 175.0, 112.0, 83.0, 59.0, 49.0, 25.0, 19.0, 9.0, 14.0, 10.0, 7.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.427490234375, -0.4132499694824219, -0.39900970458984375, -0.3847694396972656, -0.3705291748046875, -0.3562889099121094, -0.34204864501953125, -0.3278083801269531, -0.313568115234375, -0.2993278503417969, -0.28508758544921875, -0.2708473205566406, -0.2566070556640625, -0.24236679077148438, -0.22812652587890625, -0.21388626098632812, -0.19964599609375, -0.18540573120117188, -0.17116546630859375, -0.15692520141601562, -0.1426849365234375, -0.12844467163085938, -0.11420440673828125, -0.09996414184570312, -0.085723876953125, -0.07148361206054688, -0.05724334716796875, -0.043003082275390625, -0.0287628173828125, -0.014522552490234375, -0.00028228759765625, 0.013957977294921875, 0.0281982421875, 0.042438507080078125, 0.05667877197265625, 0.07091903686523438, 0.0851593017578125, 0.09939956665039062, 0.11363983154296875, 0.12788009643554688, 0.142120361328125, 0.15636062622070312, 0.17060089111328125, 0.18484115600585938, 0.1990814208984375, 0.21332168579101562, 0.22756195068359375, 0.24180221557617188, 0.25604248046875, 0.2702827453613281, 0.28452301025390625, 0.2987632751464844, 0.3130035400390625, 0.3272438049316406, 0.34148406982421875, 0.3557243347167969, 0.369964599609375, 0.3842048645019531, 0.39844512939453125, 0.4126853942871094, 0.4269256591796875, 0.4411659240722656, 0.45540618896484375, 0.4696464538574219, 0.48388671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 3.0, 7.0, 3.0, 4.0, 9.0, 10.0, 17.0, 26.0, 29.0, 27.0, 34.0, 49.0, 58.0, 104.0, 105.0, 125.0, 97.0, 63.0, 48.0, 40.0, 31.0, 20.0, 14.0, 12.0, 13.0, 9.0, 10.0, 2.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00012373924255371094, -0.00011987611651420593, -0.00011601299047470093, -0.00011214986443519592, -0.00010828673839569092, -0.00010442361235618591, -0.00010056048631668091, -9.66973602771759e-05, -9.28342342376709e-05, -8.89711081981659e-05, -8.510798215866089e-05, -8.124485611915588e-05, -7.738173007965088e-05, -7.351860404014587e-05, -6.965547800064087e-05, -6.579235196113586e-05, -6.192922592163086e-05, -5.8066099882125854e-05, -5.420297384262085e-05, -5.0339847803115845e-05, -4.647672176361084e-05, -4.2613595724105835e-05, -3.875046968460083e-05, -3.4887343645095825e-05, -3.102421760559082e-05, -2.7161091566085815e-05, -2.329796552658081e-05, -1.9434839487075806e-05, -1.55717134475708e-05, -1.1708587408065796e-05, -7.845461368560791e-06, -3.982335329055786e-06, -1.1920928955078125e-07, 3.7439167499542236e-06, 7.6070427894592285e-06, 1.1470168828964233e-05, 1.5333294868469238e-05, 1.9196420907974243e-05, 2.3059546947479248e-05, 2.6922672986984253e-05, 3.078579902648926e-05, 3.464892506599426e-05, 3.851205110549927e-05, 4.237517714500427e-05, 4.623830318450928e-05, 5.010142922401428e-05, 5.396455526351929e-05, 5.782768130302429e-05, 6.16908073425293e-05, 6.55539333820343e-05, 6.94170594215393e-05, 7.328018546104431e-05, 7.714331150054932e-05, 8.100643754005432e-05, 8.486956357955933e-05, 8.873268961906433e-05, 9.259581565856934e-05, 9.645894169807434e-05, 0.00010032206773757935, 0.00010418519377708435, 0.00010804831981658936, 0.00011191144585609436, 0.00011577457189559937, 0.00011963769793510437, 0.00012350082397460938]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 2.0, 7.0, 14.0, 23.0, 22.0, 24.0, 60.0, 71.0, 117.0, 170.0, 273.0, 550.0, 888.0, 1853.0, 4104.0, 10722.0, 36693.0, 205627.0, 650645.0, 100163.0, 22547.0, 7681.0, 3059.0, 1374.0, 679.0, 427.0, 231.0, 170.0, 89.0, 66.0, 60.0, 25.0, 22.0, 29.0, 15.0, 10.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.70751953125, -0.6833877563476562, -0.6592559814453125, -0.6351242065429688, -0.610992431640625, -0.5868606567382812, -0.5627288818359375, -0.5385971069335938, -0.51446533203125, -0.49033355712890625, -0.4662017822265625, -0.44207000732421875, -0.417938232421875, -0.39380645751953125, -0.3696746826171875, -0.34554290771484375, -0.3214111328125, -0.29727935791015625, -0.2731475830078125, -0.24901580810546875, -0.224884033203125, -0.20075225830078125, -0.1766204833984375, -0.15248870849609375, -0.12835693359375, -0.10422515869140625, -0.0800933837890625, -0.05596160888671875, -0.031829833984375, -0.00769805908203125, 0.0164337158203125, 0.04056549072265625, 0.064697265625, 0.08882904052734375, 0.1129608154296875, 0.13709259033203125, 0.161224365234375, 0.18535614013671875, 0.2094879150390625, 0.23361968994140625, 0.25775146484375, 0.28188323974609375, 0.3060150146484375, 0.33014678955078125, 0.354278564453125, 0.37841033935546875, 0.4025421142578125, 0.42667388916015625, 0.4508056640625, 0.47493743896484375, 0.4990692138671875, 0.5232009887695312, 0.547332763671875, 0.5714645385742188, 0.5955963134765625, 0.6197280883789062, 0.64385986328125, 0.6679916381835938, 0.6921234130859375, 0.7162551879882812, 0.740386962890625, 0.7645187377929688, 0.7886505126953125, 0.8127822875976562, 0.8369140625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 6.0, 10.0, 11.0, 21.0, 17.0, 18.0, 25.0, 32.0, 35.0, 47.0, 63.0, 72.0, 101.0, 98.0, 82.0, 72.0, 49.0, 44.0, 40.0, 25.0, 17.0, 14.0, 14.0, 11.0, 15.0, 10.0, 9.0, 4.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36669921875, -0.3563041687011719, -0.34590911865234375, -0.3355140686035156, -0.3251190185546875, -0.3147239685058594, -0.30432891845703125, -0.2939338684082031, -0.283538818359375, -0.2731437683105469, -0.26274871826171875, -0.2523536682128906, -0.2419586181640625, -0.23156356811523438, -0.22116851806640625, -0.21077346801757812, -0.20037841796875, -0.18998336791992188, -0.17958831787109375, -0.16919326782226562, -0.1587982177734375, -0.14840316772460938, -0.13800811767578125, -0.12761306762695312, -0.117218017578125, -0.10682296752929688, -0.09642791748046875, -0.08603286743164062, -0.0756378173828125, -0.06524276733398438, -0.05484771728515625, -0.044452667236328125, -0.0340576171875, -0.023662567138671875, -0.01326751708984375, -0.002872467041015625, 0.0075225830078125, 0.017917633056640625, 0.02831268310546875, 0.038707733154296875, 0.049102783203125, 0.059497833251953125, 0.06989288330078125, 0.08028793334960938, 0.0906829833984375, 0.10107803344726562, 0.11147308349609375, 0.12186813354492188, 0.13226318359375, 0.14265823364257812, 0.15305328369140625, 0.16344833374023438, 0.1738433837890625, 0.18423843383789062, 0.19463348388671875, 0.20502853393554688, 0.215423583984375, 0.22581863403320312, 0.23621368408203125, 0.24660873413085938, 0.2570037841796875, 0.2673988342285156, 0.27779388427734375, 0.2881889343261719, 0.298583984375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 8.0, 12.0, 28.0, 94.0, 333.0, 365.0, 103.0, 33.0, 14.0, 5.0, 9.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.957146644592285, -10.350625991821289, -9.74410629272461, -9.137585639953613, -8.531065940856934, -7.9245452880859375, -7.3180251121521, -6.711504936218262, -6.104984760284424, -5.498464584350586, -4.891944408416748, -4.28542423248291, -3.678903818130493, -3.0723836421966553, -2.4658632278442383, -1.8593430519104004, -1.2528228759765625, -0.6463026404380798, -0.03978240489959717, 0.5667378902435303, 1.1732580661773682, 1.779778242111206, 2.386298656463623, 2.992818832397461, 3.599339008331299, 4.205859184265137, 4.812379360198975, 5.4188995361328125, 6.025420188903809, 6.631939888000488, 7.238460540771484, 7.844980716705322, 8.451499938964844, 9.05802059173584, 9.66454029083252, 10.271060943603516, 10.877580642700195, 11.484101295471191, 12.090621948242188, 12.697141647338867, 13.303661346435547, 13.910181999206543, 14.516701698303223, 15.123222351074219, 15.729742050170898, 16.336261749267578, 16.94278335571289, 17.54930305480957, 18.15582275390625, 18.76234245300293, 19.368864059448242, 19.975383758544922, 20.5819034576416, 21.18842315673828, 21.794944763183594, 22.401464462280273, 23.007986068725586, 23.614505767822266, 24.221027374267578, 24.827547073364258, 25.434066772460938, 26.040586471557617, 26.64710807800293, 27.25362777709961, 27.86014747619629]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 7.0, 13.0, 13.0, 18.0, 27.0, 30.0, 44.0, 45.0, 56.0, 59.0, 56.0, 71.0, 58.0, 71.0, 69.0, 52.0, 68.0, 38.0, 41.0, 43.0, 32.0, 23.0, 13.0, 12.0, 13.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.36768341064453, -17.93861198425293, -17.509538650512695, -17.080467224121094, -16.651395797729492, -16.222322463989258, -15.793251037597656, -15.364178657531738, -14.93510627746582, -14.506033897399902, -14.0769624710083, -13.647890090942383, -13.218817710876465, -12.789745330810547, -12.360673904418945, -11.931601524353027, -11.502530097961426, -11.073457717895508, -10.644386291503906, -10.215313911437988, -9.78624153137207, -9.357170104980469, -8.92809772491455, -8.499025344848633, -8.069953918457031, -7.6408820152282715, -7.2118096351623535, -6.782737731933594, -6.353665351867676, -5.924593448638916, -5.495521545410156, -5.066449165344238, -4.63737678527832, -4.2083048820495605, -3.7792325019836426, -3.350160598754883, -2.921088457107544, -2.492016315460205, -2.0629444122314453, -1.6338722705841064, -1.2048001289367676, -0.7757280468940735, -0.3466559648513794, 0.08241605758666992, 0.5114881992340088, 0.9405603408813477, 1.3696322441101074, 1.7987043857574463, 2.227776527404785, 2.656848669052124, 3.085920810699463, 3.5149927139282227, 3.9440648555755615, 4.3731369972229, 4.80220890045166, 5.231281280517578, 5.660353183746338, 6.089425086975098, 6.518497467041016, 6.947569370269775, 7.376641273498535, 7.805713653564453, 8.234785079956055, 8.663857460021973, 9.09292984008789]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 9.0, 16.0, 15.0, 25.0, 34.0, 53.0, 102.0, 135.0, 206.0, 376.0, 580.0, 1054.0, 2029.0, 4658.0, 12200.0, 48435.0, 549766.0, 3395785.0, 140877.0, 23619.0, 7532.0, 3136.0, 1537.0, 845.0, 455.0, 276.0, 186.0, 103.0, 75.0, 38.0, 59.0, 17.0, 17.0, 13.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.412109375, -3.303009033203125, -3.19390869140625, -3.084808349609375, -2.9757080078125, -2.866607666015625, -2.75750732421875, -2.648406982421875, -2.539306640625, -2.430206298828125, -2.32110595703125, -2.212005615234375, -2.1029052734375, -1.993804931640625, -1.88470458984375, -1.775604248046875, -1.66650390625, -1.557403564453125, -1.44830322265625, -1.339202880859375, -1.2301025390625, -1.121002197265625, -1.01190185546875, -0.902801513671875, -0.793701171875, -0.684600830078125, -0.57550048828125, -0.466400146484375, -0.3572998046875, -0.248199462890625, -0.13909912109375, -0.029998779296875, 0.0791015625, 0.188201904296875, 0.29730224609375, 0.406402587890625, 0.5155029296875, 0.624603271484375, 0.73370361328125, 0.842803955078125, 0.951904296875, 1.061004638671875, 1.17010498046875, 1.279205322265625, 1.3883056640625, 1.497406005859375, 1.60650634765625, 1.715606689453125, 1.82470703125, 1.933807373046875, 2.04290771484375, 2.152008056640625, 2.2611083984375, 2.370208740234375, 2.47930908203125, 2.588409423828125, 2.697509765625, 2.806610107421875, 2.91571044921875, 3.024810791015625, 3.1339111328125, 3.243011474609375, 3.35211181640625, 3.461212158203125, 3.5703125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 8.0, 7.0, 19.0, 12.0, 14.0, 15.0, 25.0, 39.0, 52.0, 66.0, 68.0, 81.0, 69.0, 75.0, 78.0, 61.0, 47.0, 35.0, 45.0, 33.0, 24.0, 25.0, 12.0, 9.0, 15.0, 19.0, 9.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02734375, -1.958282470703125, -1.88922119140625, -1.820159912109375, -1.7510986328125, -1.682037353515625, -1.61297607421875, -1.543914794921875, -1.474853515625, -1.405792236328125, -1.33673095703125, -1.267669677734375, -1.1986083984375, -1.129547119140625, -1.06048583984375, -0.991424560546875, -0.92236328125, -0.853302001953125, -0.78424072265625, -0.715179443359375, -0.6461181640625, -0.577056884765625, -0.50799560546875, -0.438934326171875, -0.369873046875, -0.300811767578125, -0.23175048828125, -0.162689208984375, -0.0936279296875, -0.024566650390625, 0.04449462890625, 0.113555908203125, 0.1826171875, 0.251678466796875, 0.32073974609375, 0.389801025390625, 0.4588623046875, 0.527923583984375, 0.59698486328125, 0.666046142578125, 0.735107421875, 0.804168701171875, 0.87322998046875, 0.942291259765625, 1.0113525390625, 1.080413818359375, 1.14947509765625, 1.218536376953125, 1.28759765625, 1.356658935546875, 1.42572021484375, 1.494781494140625, 1.5638427734375, 1.632904052734375, 1.70196533203125, 1.771026611328125, 1.840087890625, 1.909149169921875, 1.97821044921875, 2.047271728515625, 2.1163330078125, 2.185394287109375, 2.25445556640625, 2.323516845703125, 2.392578125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 14.0, 16.0, 31.0, 35.0, 45.0, 81.0, 149.0, 239.0, 421.0, 971.0, 2608.0, 9637.0, 64408.0, 3642105.0, 439564.0, 25731.0, 5095.0, 1579.0, 669.0, 348.0, 180.0, 105.0, 66.0, 45.0, 33.0, 24.0, 11.0, 13.0, 7.0, 7.0, 8.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.08551025390625, -3.9483642578125, -3.81121826171875, -3.674072265625, -3.53692626953125, -3.3997802734375, -3.26263427734375, -3.12548828125, -2.98834228515625, -2.8511962890625, -2.71405029296875, -2.576904296875, -2.43975830078125, -2.3026123046875, -2.16546630859375, -2.0283203125, -1.89117431640625, -1.7540283203125, -1.61688232421875, -1.479736328125, -1.34259033203125, -1.2054443359375, -1.06829833984375, -0.93115234375, -0.79400634765625, -0.6568603515625, -0.51971435546875, -0.382568359375, -0.24542236328125, -0.1082763671875, 0.02886962890625, 0.166015625, 0.30316162109375, 0.4403076171875, 0.57745361328125, 0.714599609375, 0.85174560546875, 0.9888916015625, 1.12603759765625, 1.26318359375, 1.40032958984375, 1.5374755859375, 1.67462158203125, 1.811767578125, 1.94891357421875, 2.0860595703125, 2.22320556640625, 2.3603515625, 2.49749755859375, 2.6346435546875, 2.77178955078125, 2.908935546875, 3.04608154296875, 3.1832275390625, 3.32037353515625, 3.45751953125, 3.59466552734375, 3.7318115234375, 3.86895751953125, 4.006103515625, 4.14324951171875, 4.2803955078125, 4.41754150390625, 4.5546875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 6.0, 10.0, 14.0, 11.0, 31.0, 20.0, 46.0, 55.0, 74.0, 88.0, 173.0, 283.0, 595.0, 1046.0, 653.0, 327.0, 184.0, 113.0, 82.0, 66.0, 47.0, 30.0, 30.0, 16.0, 13.0, 12.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66064453125, -0.6375045776367188, -0.6143646240234375, -0.5912246704101562, -0.568084716796875, -0.5449447631835938, -0.5218048095703125, -0.49866485595703125, -0.47552490234375, -0.45238494873046875, -0.4292449951171875, -0.40610504150390625, -0.382965087890625, -0.35982513427734375, -0.3366851806640625, -0.31354522705078125, -0.2904052734375, -0.26726531982421875, -0.2441253662109375, -0.22098541259765625, -0.197845458984375, -0.17470550537109375, -0.1515655517578125, -0.12842559814453125, -0.10528564453125, -0.08214569091796875, -0.0590057373046875, -0.03586578369140625, -0.012725830078125, 0.01041412353515625, 0.0335540771484375, 0.05669403076171875, 0.079833984375, 0.10297393798828125, 0.1261138916015625, 0.14925384521484375, 0.172393798828125, 0.19553375244140625, 0.2186737060546875, 0.24181365966796875, 0.26495361328125, 0.28809356689453125, 0.3112335205078125, 0.33437347412109375, 0.357513427734375, 0.38065338134765625, 0.4037933349609375, 0.42693328857421875, 0.4500732421875, 0.47321319580078125, 0.4963531494140625, 0.5194931030273438, 0.542633056640625, 0.5657730102539062, 0.5889129638671875, 0.6120529174804688, 0.63519287109375, 0.6583328247070312, 0.6814727783203125, 0.7046127319335938, 0.727752685546875, 0.7508926391601562, 0.7740325927734375, 0.7971725463867188, 0.8203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 8.0, 17.0, 24.0, 56.0, 84.0, 139.0, 190.0, 139.0, 104.0, 70.0, 37.0, 37.0, 15.0, 12.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.906198978424072, -4.765286922454834, -4.624375343322754, -4.483463287353516, -4.342551231384277, -4.201639652252197, -4.060727596282959, -3.9198157787323, -3.7789039611816406, -3.6379921436309814, -3.497080087661743, -3.356168270111084, -3.215256452560425, -3.0743446350097656, -2.9334325790405273, -2.792520761489868, -2.65160870552063, -2.5106968879699707, -2.3697848320007324, -2.2288730144500732, -2.087961196899414, -1.9470492601394653, -1.8061373233795166, -1.6652255058288574, -1.5243135690689087, -1.38340163230896, -1.2424898147583008, -1.101577877998352, -0.9606660008430481, -0.8197541236877441, -0.6788421869277954, -0.5379303097724915, -0.3970184326171875, -0.25610655546188354, -0.1151946485042572, 0.02571725845336914, 0.1666291356086731, 0.30754101276397705, 0.4484529495239258, 0.5893648266792297, 0.7302767038345337, 0.8711885809898376, 1.0121004581451416, 1.1530123949050903, 1.293924331665039, 1.4348361492156982, 1.575748085975647, 1.7166600227355957, 1.8575718402862549, 1.9984837770462036, 2.1393957138061523, 2.2803075313568115, 2.4212193489074707, 2.562131404876709, 2.703043222427368, 2.8439550399780273, 2.9848670959472656, 3.125778913497925, 3.266690969467163, 3.4076027870178223, 3.5485146045684814, 3.6894264221191406, 3.830338478088379, 3.971250295639038, 4.112162113189697]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 5.0, 7.0, 13.0, 20.0, 18.0, 14.0, 17.0, 37.0, 40.0, 27.0, 45.0, 40.0, 53.0, 53.0, 61.0, 65.0, 61.0, 41.0, 51.0, 49.0, 43.0, 24.0, 31.0, 36.0, 23.0, 15.0, 15.0, 18.0, 13.0, 9.0, 9.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7863608598709106, -1.7207067012786865, -1.6550525426864624, -1.5893983840942383, -1.5237441062927246, -1.4580899477005005, -1.3924357891082764, -1.3267816305160522, -1.2611274719238281, -1.195473313331604, -1.1298191547393799, -1.0641648769378662, -0.9985107183456421, -0.932856559753418, -0.8672024011611938, -0.8015482425689697, -0.735893964767456, -0.6702398061752319, -0.604585587978363, -0.5389314293861389, -0.4732772409915924, -0.4076230525970459, -0.3419688940048218, -0.27631470561027527, -0.21066051721572876, -0.14500632882118225, -0.07935215532779694, -0.013697981834411621, 0.05195620656013489, 0.1176103949546814, 0.18326455354690552, 0.24891874194145203, 0.3145730495452881, 0.3802272379398346, 0.4458814263343811, 0.5115355849266052, 0.5771898031234741, 0.6428439617156982, 0.7084981203079224, 0.7741522789001465, 0.8398064970970154, 0.9054606556892395, 0.9711148738861084, 1.0367690324783325, 1.1024231910705566, 1.1680774688720703, 1.2337315082550049, 1.2993857860565186, 1.3650399446487427, 1.4306941032409668, 1.496348261833191, 1.562002420425415, 1.6276566982269287, 1.6933108568191528, 1.758965015411377, 1.824619174003601, 1.8902733325958252, 1.9559274911880493, 2.0215816497802734, 2.087235927581787, 2.1528899669647217, 2.2185442447662354, 2.28419828414917, 2.3498525619506836, 2.4155068397521973]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 5.0, 13.0, 17.0, 28.0, 38.0, 57.0, 84.0, 137.0, 249.0, 431.0, 719.0, 1341.0, 2669.0, 5740.0, 13176.0, 33859.0, 98176.0, 284134.0, 369496.0, 152609.0, 50918.0, 19028.0, 7936.0, 3647.0, 1834.0, 959.0, 499.0, 288.0, 193.0, 122.0, 65.0, 32.0, 11.0, 16.0, 11.0, 11.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2335205078125, -0.22669219970703125, -0.2198638916015625, -0.21303558349609375, -0.206207275390625, -0.19937896728515625, -0.1925506591796875, -0.18572235107421875, -0.17889404296875, -0.17206573486328125, -0.1652374267578125, -0.15840911865234375, -0.151580810546875, -0.14475250244140625, -0.1379241943359375, -0.13109588623046875, -0.124267578125, -0.11743927001953125, -0.1106109619140625, -0.10378265380859375, -0.096954345703125, -0.09012603759765625, -0.0832977294921875, -0.07646942138671875, -0.06964111328125, -0.06281280517578125, -0.0559844970703125, -0.04915618896484375, -0.042327880859375, -0.03549957275390625, -0.0286712646484375, -0.02184295654296875, -0.0150146484375, -0.00818634033203125, -0.0013580322265625, 0.00547027587890625, 0.012298583984375, 0.01912689208984375, 0.0259552001953125, 0.03278350830078125, 0.03961181640625, 0.04644012451171875, 0.0532684326171875, 0.06009674072265625, 0.066925048828125, 0.07375335693359375, 0.0805816650390625, 0.08740997314453125, 0.09423828125, 0.10106658935546875, 0.1078948974609375, 0.11472320556640625, 0.121551513671875, 0.12837982177734375, 0.1352081298828125, 0.14203643798828125, 0.14886474609375, 0.15569305419921875, 0.1625213623046875, 0.16934967041015625, 0.176177978515625, 0.18300628662109375, 0.1898345947265625, 0.19666290283203125, 0.2034912109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 10.0, 6.0, 16.0, 21.0, 17.0, 26.0, 30.0, 42.0, 43.0, 64.0, 66.0, 76.0, 83.0, 55.0, 66.0, 53.0, 61.0, 46.0, 35.0, 29.0, 32.0, 25.0, 22.0, 10.0, 9.0, 13.0, 13.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.5955963134765625, -1.540802001953125, -1.4860076904296875, -1.43121337890625, -1.3764190673828125, -1.321624755859375, -1.2668304443359375, -1.2120361328125, -1.1572418212890625, -1.102447509765625, -1.0476531982421875, -0.99285888671875, -0.9380645751953125, -0.883270263671875, -0.8284759521484375, -0.773681640625, -0.7188873291015625, -0.664093017578125, -0.6092987060546875, -0.55450439453125, -0.4997100830078125, -0.444915771484375, -0.3901214599609375, -0.3353271484375, -0.2805328369140625, -0.225738525390625, -0.1709442138671875, -0.11614990234375, -0.0613555908203125, -0.006561279296875, 0.0482330322265625, 0.10302734375, 0.1578216552734375, 0.212615966796875, 0.2674102783203125, 0.32220458984375, 0.3769989013671875, 0.431793212890625, 0.4865875244140625, 0.5413818359375, 0.5961761474609375, 0.650970458984375, 0.7057647705078125, 0.76055908203125, 0.8153533935546875, 0.870147705078125, 0.9249420166015625, 0.979736328125, 1.0345306396484375, 1.089324951171875, 1.1441192626953125, 1.19891357421875, 1.2537078857421875, 1.308502197265625, 1.3632965087890625, 1.4180908203125, 1.4728851318359375, 1.527679443359375, 1.5824737548828125, 1.63726806640625, 1.6920623779296875, 1.746856689453125, 1.8016510009765625, 1.8564453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 13.0, 9.0, 19.0, 24.0, 38.0, 40.0, 63.0, 98.0, 154.0, 180.0, 310.0, 530.0, 1021.0, 2294.0, 5874.0, 18895.0, 73060.0, 270229.0, 432472.0, 176810.0, 45570.0, 12695.0, 4209.0, 1778.0, 824.0, 468.0, 253.0, 177.0, 131.0, 75.0, 78.0, 36.0, 31.0, 27.0, 17.0, 13.0, 7.0, 4.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.261962890625, -0.2541027069091797, -0.24624252319335938, -0.23838233947753906, -0.23052215576171875, -0.22266197204589844, -0.21480178833007812, -0.2069416046142578, -0.1990814208984375, -0.1912212371826172, -0.18336105346679688, -0.17550086975097656, -0.16764068603515625, -0.15978050231933594, -0.15192031860351562, -0.1440601348876953, -0.136199951171875, -0.1283397674560547, -0.12047958374023438, -0.11261940002441406, -0.10475921630859375, -0.09689903259277344, -0.08903884887695312, -0.08117866516113281, -0.0733184814453125, -0.06545829772949219, -0.057598114013671875, -0.04973793029785156, -0.04187774658203125, -0.03401756286621094, -0.026157379150390625, -0.018297195434570312, -0.01043701171875, -0.0025768280029296875, 0.005283355712890625, 0.013143539428710938, 0.02100372314453125, 0.028863906860351562, 0.036724090576171875, 0.04458427429199219, 0.0524444580078125, 0.06030464172363281, 0.06816482543945312, 0.07602500915527344, 0.08388519287109375, 0.09174537658691406, 0.09960556030273438, 0.10746574401855469, 0.115325927734375, 0.12318611145019531, 0.13104629516601562, 0.13890647888183594, 0.14676666259765625, 0.15462684631347656, 0.16248703002929688, 0.1703472137451172, 0.1782073974609375, 0.1860675811767578, 0.19392776489257812, 0.20178794860839844, 0.20964813232421875, 0.21750831604003906, 0.22536849975585938, 0.2332286834716797, 0.2410888671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 4.0, 3.0, 5.0, 10.0, 4.0, 10.0, 16.0, 20.0, 13.0, 20.0, 24.0, 32.0, 26.0, 39.0, 46.0, 54.0, 54.0, 51.0, 64.0, 60.0, 58.0, 38.0, 39.0, 44.0, 45.0, 30.0, 28.0, 31.0, 33.0, 18.0, 18.0, 11.0, 10.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.181640625, -3.088714599609375, -2.99578857421875, -2.902862548828125, -2.8099365234375, -2.717010498046875, -2.62408447265625, -2.531158447265625, -2.438232421875, -2.345306396484375, -2.25238037109375, -2.159454345703125, -2.0665283203125, -1.973602294921875, -1.88067626953125, -1.787750244140625, -1.69482421875, -1.601898193359375, -1.50897216796875, -1.416046142578125, -1.3231201171875, -1.230194091796875, -1.13726806640625, -1.044342041015625, -0.951416015625, -0.858489990234375, -0.76556396484375, -0.672637939453125, -0.5797119140625, -0.486785888671875, -0.39385986328125, -0.300933837890625, -0.2080078125, -0.115081787109375, -0.02215576171875, 0.070770263671875, 0.1636962890625, 0.256622314453125, 0.34954833984375, 0.442474365234375, 0.535400390625, 0.628326416015625, 0.72125244140625, 0.814178466796875, 0.9071044921875, 1.000030517578125, 1.09295654296875, 1.185882568359375, 1.27880859375, 1.371734619140625, 1.46466064453125, 1.557586669921875, 1.6505126953125, 1.743438720703125, 1.83636474609375, 1.929290771484375, 2.022216796875, 2.115142822265625, 2.20806884765625, 2.300994873046875, 2.3939208984375, 2.486846923828125, 2.57977294921875, 2.672698974609375, 2.765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 13.0, 29.0, 34.0, 33.0, 92.0, 117.0, 190.0, 394.0, 656.0, 1373.0, 3350.0, 10500.0, 74894.0, 775706.0, 157590.0, 15696.0, 4314.0, 1695.0, 822.0, 422.0, 220.0, 131.0, 78.0, 59.0, 42.0, 16.0, 17.0, 14.0, 10.0, 4.0, 7.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.167236328125, -0.1615924835205078, -0.15594863891601562, -0.15030479431152344, -0.14466094970703125, -0.13901710510253906, -0.13337326049804688, -0.1277294158935547, -0.1220855712890625, -0.11644172668457031, -0.11079788208007812, -0.10515403747558594, -0.09951019287109375, -0.09386634826660156, -0.08822250366210938, -0.08257865905761719, -0.076934814453125, -0.07129096984863281, -0.06564712524414062, -0.06000328063964844, -0.05435943603515625, -0.04871559143066406, -0.043071746826171875, -0.03742790222167969, -0.0317840576171875, -0.026140213012695312, -0.020496368408203125, -0.014852523803710938, -0.00920867919921875, -0.0035648345947265625, 0.002079010009765625, 0.0077228546142578125, 0.01336669921875, 0.019010543823242188, 0.024654388427734375, 0.030298233032226562, 0.03594207763671875, 0.04158592224121094, 0.047229766845703125, 0.05287361145019531, 0.0585174560546875, 0.06416130065917969, 0.06980514526367188, 0.07544898986816406, 0.08109283447265625, 0.08673667907714844, 0.09238052368164062, 0.09802436828613281, 0.103668212890625, 0.10931205749511719, 0.11495590209960938, 0.12059974670410156, 0.12624359130859375, 0.13188743591308594, 0.13753128051757812, 0.1431751251220703, 0.1488189697265625, 0.1544628143310547, 0.16010665893554688, 0.16575050354003906, 0.17139434814453125, 0.17703819274902344, 0.18268203735351562, 0.1883258819580078, 0.1939697265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 10.0, 2.0, 15.0, 18.0, 28.0, 55.0, 103.0, 212.0, 252.0, 164.0, 77.0, 30.0, 14.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001590251922607422, -0.00015451014041900635, -0.0001499950885772705, -0.00014548003673553467, -0.00014096498489379883, -0.000136449933052063, -0.00013193488121032715, -0.0001274198293685913, -0.00012290477752685547, -0.00011838972568511963, -0.00011387467384338379, -0.00010935962200164795, -0.00010484457015991211, -0.00010032951831817627, -9.581446647644043e-05, -9.129941463470459e-05, -8.678436279296875e-05, -8.226931095123291e-05, -7.775425910949707e-05, -7.323920726776123e-05, -6.872415542602539e-05, -6.420910358428955e-05, -5.969405174255371e-05, -5.517899990081787e-05, -5.066394805908203e-05, -4.614889621734619e-05, -4.163384437561035e-05, -3.711879253387451e-05, -3.260374069213867e-05, -2.8088688850402832e-05, -2.3573637008666992e-05, -1.9058585166931152e-05, -1.4543533325195312e-05, -1.0028481483459473e-05, -5.513429641723633e-06, -9.98377799987793e-07, 3.516674041748047e-06, 8.031725883483887e-06, 1.2546777725219727e-05, 1.7061829566955566e-05, 2.1576881408691406e-05, 2.6091933250427246e-05, 3.0606985092163086e-05, 3.5122036933898926e-05, 3.9637088775634766e-05, 4.4152140617370605e-05, 4.8667192459106445e-05, 5.3182244300842285e-05, 5.7697296142578125e-05, 6.221234798431396e-05, 6.67273998260498e-05, 7.124245166778564e-05, 7.575750350952148e-05, 8.027255535125732e-05, 8.478760719299316e-05, 8.9302659034729e-05, 9.381771087646484e-05, 9.833276271820068e-05, 0.00010284781455993652, 0.00010736286640167236, 0.0001118779182434082, 0.00011639297008514404, 0.00012090802192687988, 0.00012542307376861572, 0.00012993812561035156]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 12.0, 11.0, 23.0, 23.0, 29.0, 45.0, 67.0, 101.0, 120.0, 207.0, 336.0, 599.0, 1248.0, 3188.0, 9822.0, 58798.0, 736624.0, 208219.0, 20139.0, 5098.0, 1832.0, 839.0, 390.0, 268.0, 135.0, 113.0, 71.0, 52.0, 31.0, 28.0, 23.0, 16.0, 8.0, 10.0, 6.0, 5.0, 8.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.209228515625, -0.20337295532226562, -0.19751739501953125, -0.19166183471679688, -0.1858062744140625, -0.17995071411132812, -0.17409515380859375, -0.16823959350585938, -0.162384033203125, -0.15652847290039062, -0.15067291259765625, -0.14481735229492188, -0.1389617919921875, -0.13310623168945312, -0.12725067138671875, -0.12139511108398438, -0.11553955078125, -0.10968399047851562, -0.10382843017578125, -0.09797286987304688, -0.0921173095703125, -0.08626174926757812, -0.08040618896484375, -0.07455062866210938, -0.068695068359375, -0.06283950805664062, -0.05698394775390625, -0.051128387451171875, -0.0452728271484375, -0.039417266845703125, -0.03356170654296875, -0.027706146240234375, -0.0218505859375, -0.015995025634765625, -0.01013946533203125, -0.004283905029296875, 0.0015716552734375, 0.007427215576171875, 0.01328277587890625, 0.019138336181640625, 0.024993896484375, 0.030849456787109375, 0.03670501708984375, 0.042560577392578125, 0.0484161376953125, 0.054271697998046875, 0.06012725830078125, 0.06598281860351562, 0.07183837890625, 0.07769393920898438, 0.08354949951171875, 0.08940505981445312, 0.0952606201171875, 0.10111618041992188, 0.10697174072265625, 0.11282730102539062, 0.118682861328125, 0.12453842163085938, 0.13039398193359375, 0.13624954223632812, 0.1421051025390625, 0.14796066284179688, 0.15381622314453125, 0.15967178344726562, 0.16552734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 5.0, 14.0, 12.0, 22.0, 24.0, 43.0, 40.0, 72.0, 101.0, 112.0, 120.0, 94.0, 84.0, 52.0, 48.0, 32.0, 33.0, 12.0, 14.0, 16.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03656005859375, -0.03555583953857422, -0.03455162048339844, -0.033547401428222656, -0.032543182373046875, -0.031538963317871094, -0.030534744262695312, -0.02953052520751953, -0.02852630615234375, -0.02752208709716797, -0.026517868041992188, -0.025513648986816406, -0.024509429931640625, -0.023505210876464844, -0.022500991821289062, -0.02149677276611328, -0.0204925537109375, -0.01948833465576172, -0.018484115600585938, -0.017479896545410156, -0.016475677490234375, -0.015471458435058594, -0.014467239379882812, -0.013463020324707031, -0.01245880126953125, -0.011454582214355469, -0.010450363159179688, -0.009446144104003906, -0.008441925048828125, -0.007437705993652344, -0.0064334869384765625, -0.005429267883300781, -0.004425048828125, -0.0034208297729492188, -0.0024166107177734375, -0.0014123916625976562, -0.000408172607421875, 0.0005960464477539062, 0.0016002655029296875, 0.0026044845581054688, 0.00360870361328125, 0.004612922668457031, 0.0056171417236328125, 0.006621360778808594, 0.007625579833984375, 0.008629798889160156, 0.009634017944335938, 0.010638236999511719, 0.0116424560546875, 0.012646675109863281, 0.013650894165039062, 0.014655113220214844, 0.015659332275390625, 0.016663551330566406, 0.017667770385742188, 0.01867198944091797, 0.01967620849609375, 0.02068042755126953, 0.021684646606445312, 0.022688865661621094, 0.023693084716796875, 0.024697303771972656, 0.025701522827148438, 0.02670574188232422, 0.0277099609375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 10.0, 13.0, 24.0, 32.0, 115.0, 266.0, 285.0, 128.0, 58.0, 27.0, 13.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.100545883178711, -3.9370317459106445, -3.773517608642578, -3.6100034713745117, -3.4464893341064453, -3.282975196838379, -3.1194610595703125, -2.955946922302246, -2.7924327850341797, -2.6289186477661133, -2.465404510498047, -2.3018903732299805, -2.138376235961914, -1.9748620986938477, -1.8113479614257812, -1.6478338241577148, -1.4843196868896484, -1.320805549621582, -1.1572914123535156, -0.9937772750854492, -0.8302631378173828, -0.6667490005493164, -0.50323486328125, -0.3397207260131836, -0.1762065887451172, -0.012692451477050781, 0.15082168579101562, 0.31433582305908203, 0.47784996032714844, 0.6413640975952148, 0.8048782348632812, 0.9683923721313477, 1.1319069862365723, 1.2954211235046387, 1.458935260772705, 1.6224493980407715, 1.785963535308838, 1.9494776725769043, 2.1129918098449707, 2.276505947113037, 2.4400200843811035, 2.60353422164917, 2.7670483589172363, 2.9305624961853027, 3.094076633453369, 3.2575907707214355, 3.421104907989502, 3.5846190452575684, 3.7481331825256348, 3.911647319793701, 4.075161457061768, 4.238675594329834, 4.4021897315979, 4.565703868865967, 4.729218006134033, 4.8927321434021, 5.056246280670166, 5.219760417938232, 5.383274555206299, 5.546788692474365, 5.710302829742432, 5.873816967010498, 6.0373311042785645, 6.200845241546631, 6.364359378814697]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 12.0, 17.0, 16.0, 28.0, 29.0, 35.0, 50.0, 60.0, 54.0, 67.0, 82.0, 86.0, 72.0, 73.0, 60.0, 38.0, 34.0, 40.0, 30.0, 23.0, 10.0, 11.0, 13.0, 9.0, 6.0, 10.0, 6.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6169227361679077, -1.5615910291671753, -1.5062594413757324, -1.450927734375, -1.3955961465835571, -1.3402644395828247, -1.2849328517913818, -1.2296011447906494, -1.174269437789917, -1.1189377307891846, -1.0636061429977417, -1.0082744359970093, -0.9529428482055664, -0.897611141204834, -0.8422794938087463, -0.7869478464126587, -0.7316162586212158, -0.6762846112251282, -0.6209529638290405, -0.5656212568283081, -0.5102896690368652, -0.4549579918384552, -0.39962631464004517, -0.3442946672439575, -0.2889630198478699, -0.23363137245178223, -0.1782997101545334, -0.12296804785728455, -0.0676364004611969, -0.012304753065109253, 0.04302692413330078, 0.09835857152938843, 0.15369033813476562, 0.20902198553085327, 0.2643536329269409, 0.31968531012535095, 0.3750169575214386, 0.43034860491752625, 0.4856802821159363, 0.5410119295120239, 0.5963435769081116, 0.6516752243041992, 0.7070068717002869, 0.7623385190963745, 0.8176702260971069, 0.8730018138885498, 0.9283335208892822, 0.9836651682853699, 1.0389968156814575, 1.09432852268219, 1.1496601104736328, 1.2049918174743652, 1.260323405265808, 1.3156551122665405, 1.3709867000579834, 1.4263184070587158, 1.4816501140594482, 1.5369818210601807, 1.5923134088516235, 1.647645115852356, 1.7029767036437988, 1.7583084106445312, 1.8136401176452637, 1.8689717054367065, 1.9243032932281494]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 11.0, 19.0, 13.0, 25.0, 35.0, 51.0, 83.0, 100.0, 143.0, 235.0, 359.0, 565.0, 835.0, 1442.0, 2433.0, 4662.0, 9154.0, 20178.0, 53350.0, 194108.0, 528481.0, 151479.0, 44947.0, 17543.0, 8204.0, 4141.0, 2195.0, 1354.0, 849.0, 505.0, 349.0, 200.0, 145.0, 100.0, 88.0, 49.0, 34.0, 22.0, 14.0, 11.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1552734375, -1.1172943115234375, -1.079315185546875, -1.0413360595703125, -1.00335693359375, -0.9653778076171875, -0.927398681640625, -0.8894195556640625, -0.8514404296875, -0.8134613037109375, -0.775482177734375, -0.7375030517578125, -0.69952392578125, -0.6615447998046875, -0.623565673828125, -0.5855865478515625, -0.547607421875, -0.5096282958984375, -0.471649169921875, -0.4336700439453125, -0.39569091796875, -0.3577117919921875, -0.319732666015625, -0.2817535400390625, -0.2437744140625, -0.2057952880859375, -0.167816162109375, -0.1298370361328125, -0.09185791015625, -0.0538787841796875, -0.015899658203125, 0.0220794677734375, 0.06005859375, 0.0980377197265625, 0.136016845703125, 0.1739959716796875, 0.21197509765625, 0.2499542236328125, 0.287933349609375, 0.3259124755859375, 0.3638916015625, 0.4018707275390625, 0.439849853515625, 0.4778289794921875, 0.51580810546875, 0.5537872314453125, 0.591766357421875, 0.6297454833984375, 0.667724609375, 0.7057037353515625, 0.743682861328125, 0.7816619873046875, 0.81964111328125, 0.8576202392578125, 0.895599365234375, 0.9335784912109375, 0.9715576171875, 1.0095367431640625, 1.047515869140625, 1.0854949951171875, 1.12347412109375, 1.1614532470703125, 1.199432373046875, 1.2374114990234375, 1.275390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 7.0, 2.0, 10.0, 10.0, 22.0, 24.0, 28.0, 38.0, 35.0, 40.0, 56.0, 63.0, 68.0, 85.0, 80.0, 71.0, 54.0, 57.0, 53.0, 33.0, 32.0, 25.0, 24.0, 17.0, 14.0, 9.0, 6.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.817901611328125, -3.67681884765625, -3.535736083984375, -3.3946533203125, -3.253570556640625, -3.11248779296875, -2.971405029296875, -2.830322265625, -2.689239501953125, -2.54815673828125, -2.407073974609375, -2.2659912109375, -2.124908447265625, -1.98382568359375, -1.842742919921875, -1.70166015625, -1.560577392578125, -1.41949462890625, -1.278411865234375, -1.1373291015625, -0.996246337890625, -0.85516357421875, -0.714080810546875, -0.572998046875, -0.431915283203125, -0.29083251953125, -0.149749755859375, -0.0086669921875, 0.132415771484375, 0.27349853515625, 0.414581298828125, 0.5556640625, 0.696746826171875, 0.83782958984375, 0.978912353515625, 1.1199951171875, 1.261077880859375, 1.40216064453125, 1.543243408203125, 1.684326171875, 1.825408935546875, 1.96649169921875, 2.107574462890625, 2.2486572265625, 2.389739990234375, 2.53082275390625, 2.671905517578125, 2.81298828125, 2.954071044921875, 3.09515380859375, 3.236236572265625, 3.3773193359375, 3.518402099609375, 3.65948486328125, 3.800567626953125, 3.941650390625, 4.082733154296875, 4.22381591796875, 4.364898681640625, 4.5059814453125, 4.647064208984375, 4.78814697265625, 4.929229736328125, 5.0703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 12.0, 21.0, 26.0, 40.0, 51.0, 71.0, 109.0, 193.0, 346.0, 580.0, 1158.0, 2592.0, 6358.0, 20128.0, 94393.0, 662087.0, 210294.0, 33664.0, 9460.0, 3561.0, 1540.0, 747.0, 409.0, 210.0, 157.0, 94.0, 65.0, 40.0, 29.0, 23.0, 16.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.26171875, -1.217742919921875, -1.17376708984375, -1.129791259765625, -1.0858154296875, -1.041839599609375, -0.99786376953125, -0.953887939453125, -0.909912109375, -0.865936279296875, -0.82196044921875, -0.777984619140625, -0.7340087890625, -0.690032958984375, -0.64605712890625, -0.602081298828125, -0.55810546875, -0.514129638671875, -0.47015380859375, -0.426177978515625, -0.3822021484375, -0.338226318359375, -0.29425048828125, -0.250274658203125, -0.206298828125, -0.162322998046875, -0.11834716796875, -0.074371337890625, -0.0303955078125, 0.013580322265625, 0.05755615234375, 0.101531982421875, 0.1455078125, 0.189483642578125, 0.23345947265625, 0.277435302734375, 0.3214111328125, 0.365386962890625, 0.40936279296875, 0.453338623046875, 0.497314453125, 0.541290283203125, 0.58526611328125, 0.629241943359375, 0.6732177734375, 0.717193603515625, 0.76116943359375, 0.805145263671875, 0.84912109375, 0.893096923828125, 0.93707275390625, 0.981048583984375, 1.0250244140625, 1.069000244140625, 1.11297607421875, 1.156951904296875, 1.200927734375, 1.244903564453125, 1.28887939453125, 1.332855224609375, 1.3768310546875, 1.420806884765625, 1.46478271484375, 1.508758544921875, 1.552734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 7.0, 12.0, 6.0, 11.0, 11.0, 10.0, 15.0, 19.0, 19.0, 28.0, 36.0, 29.0, 36.0, 48.0, 43.0, 37.0, 50.0, 42.0, 42.0, 45.0, 47.0, 41.0, 39.0, 41.0, 34.0, 31.0, 40.0, 33.0, 30.0, 19.0, 16.0, 17.0, 11.0, 8.0, 13.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.1729736328125, -4.041259765625, -3.9095458984375, -3.77783203125, -3.6461181640625, -3.514404296875, -3.3826904296875, -3.2509765625, -3.1192626953125, -2.987548828125, -2.8558349609375, -2.72412109375, -2.5924072265625, -2.460693359375, -2.3289794921875, -2.197265625, -2.0655517578125, -1.933837890625, -1.8021240234375, -1.67041015625, -1.5386962890625, -1.406982421875, -1.2752685546875, -1.1435546875, -1.0118408203125, -0.880126953125, -0.7484130859375, -0.61669921875, -0.4849853515625, -0.353271484375, -0.2215576171875, -0.08984375, 0.0418701171875, 0.173583984375, 0.3052978515625, 0.43701171875, 0.5687255859375, 0.700439453125, 0.8321533203125, 0.9638671875, 1.0955810546875, 1.227294921875, 1.3590087890625, 1.49072265625, 1.6224365234375, 1.754150390625, 1.8858642578125, 2.017578125, 2.1492919921875, 2.281005859375, 2.4127197265625, 2.54443359375, 2.6761474609375, 2.807861328125, 2.9395751953125, 3.0712890625, 3.2030029296875, 3.334716796875, 3.4664306640625, 3.59814453125, 3.7298583984375, 3.861572265625, 3.9932861328125, 4.125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 11.0, 18.0, 39.0, 44.0, 125.0, 308.0, 1245.0, 9409.0, 481812.0, 543592.0, 10184.0, 1223.0, 330.0, 107.0, 52.0, 17.0, 15.0, 9.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.583984375, -1.5443954467773438, -1.5048065185546875, -1.4652175903320312, -1.425628662109375, -1.3860397338867188, -1.3464508056640625, -1.3068618774414062, -1.26727294921875, -1.2276840209960938, -1.1880950927734375, -1.1485061645507812, -1.108917236328125, -1.0693283081054688, -1.0297393798828125, -0.9901504516601562, -0.9505615234375, -0.9109725952148438, -0.8713836669921875, -0.8317947387695312, -0.792205810546875, -0.7526168823242188, -0.7130279541015625, -0.6734390258789062, -0.63385009765625, -0.5942611694335938, -0.5546722412109375, -0.5150833129882812, -0.475494384765625, -0.43590545654296875, -0.3963165283203125, -0.35672760009765625, -0.317138671875, -0.27754974365234375, -0.2379608154296875, -0.19837188720703125, -0.158782958984375, -0.11919403076171875, -0.0796051025390625, -0.04001617431640625, -0.00042724609375, 0.03916168212890625, 0.0787506103515625, 0.11833953857421875, 0.157928466796875, 0.19751739501953125, 0.2371063232421875, 0.27669525146484375, 0.3162841796875, 0.35587310791015625, 0.3954620361328125, 0.43505096435546875, 0.474639892578125, 0.5142288208007812, 0.5538177490234375, 0.5934066772460938, 0.63299560546875, 0.6725845336914062, 0.7121734619140625, 0.7517623901367188, 0.791351318359375, 0.8309402465820312, 0.8705291748046875, 0.9101181030273438, 0.94970703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 13.0, 28.0, 66.0, 110.0, 228.0, 232.0, 116.0, 78.0, 38.0, 28.0, 18.0, 14.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001556873321533203, -0.00015014410018920898, -0.00014460086822509766, -0.00013905763626098633, -0.000133514404296875, -0.00012797117233276367, -0.00012242794036865234, -0.00011688470840454102, -0.00011134147644042969, -0.00010579824447631836, -0.00010025501251220703, -9.47117805480957e-05, -8.916854858398438e-05, -8.362531661987305e-05, -7.808208465576172e-05, -7.253885269165039e-05, -6.699562072753906e-05, -6.145238876342773e-05, -5.5909156799316406e-05, -5.036592483520508e-05, -4.482269287109375e-05, -3.927946090698242e-05, -3.3736228942871094e-05, -2.8192996978759766e-05, -2.2649765014648438e-05, -1.710653305053711e-05, -1.1563301086425781e-05, -6.020069122314453e-06, -4.76837158203125e-07, 5.066394805908203e-06, 1.0609626770019531e-05, 1.615285873413086e-05, 2.1696090698242188e-05, 2.7239322662353516e-05, 3.2782554626464844e-05, 3.832578659057617e-05, 4.38690185546875e-05, 4.941225051879883e-05, 5.4955482482910156e-05, 6.0498714447021484e-05, 6.604194641113281e-05, 7.158517837524414e-05, 7.712841033935547e-05, 8.26716423034668e-05, 8.821487426757812e-05, 9.375810623168945e-05, 9.930133819580078e-05, 0.00010484457015991211, 0.00011038780212402344, 0.00011593103408813477, 0.0001214742660522461, 0.00012701749801635742, 0.00013256072998046875, 0.00013810396194458008, 0.0001436471939086914, 0.00014919042587280273, 0.00015473365783691406, 0.0001602768898010254, 0.00016582012176513672, 0.00017136335372924805, 0.00017690658569335938, 0.0001824498176574707, 0.00018799304962158203, 0.00019353628158569336, 0.0001990795135498047]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 10.0, 15.0, 22.0, 47.0, 99.0, 252.0, 675.0, 2571.0, 15849.0, 491806.0, 517155.0, 16229.0, 2602.0, 775.0, 226.0, 93.0, 55.0, 25.0, 16.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92529296875, -0.8910293579101562, -0.8567657470703125, -0.8225021362304688, -0.788238525390625, -0.7539749145507812, -0.7197113037109375, -0.6854476928710938, -0.65118408203125, -0.6169204711914062, -0.5826568603515625, -0.5483932495117188, -0.514129638671875, -0.47986602783203125, -0.4456024169921875, -0.41133880615234375, -0.3770751953125, -0.34281158447265625, -0.3085479736328125, -0.27428436279296875, -0.240020751953125, -0.20575714111328125, -0.1714935302734375, -0.13722991943359375, -0.10296630859375, -0.06870269775390625, -0.0344390869140625, -0.00017547607421875, 0.034088134765625, 0.06835174560546875, 0.1026153564453125, 0.13687896728515625, 0.171142578125, 0.20540618896484375, 0.2396697998046875, 0.27393341064453125, 0.308197021484375, 0.34246063232421875, 0.3767242431640625, 0.41098785400390625, 0.44525146484375, 0.47951507568359375, 0.5137786865234375, 0.5480422973632812, 0.582305908203125, 0.6165695190429688, 0.6508331298828125, 0.6850967407226562, 0.7193603515625, 0.7536239624023438, 0.7878875732421875, 0.8221511840820312, 0.856414794921875, 0.8906784057617188, 0.9249420166015625, 0.9592056274414062, 0.99346923828125, 1.0277328491210938, 1.0619964599609375, 1.0962600708007812, 1.130523681640625, 1.1647872924804688, 1.1990509033203125, 1.2333145141601562, 1.267578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 4.0, 6.0, 15.0, 13.0, 32.0, 60.0, 90.0, 162.0, 224.0, 163.0, 103.0, 51.0, 29.0, 23.0, 16.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6420707702636719, -0.6239852905273438, -0.6058998107910156, -0.5878143310546875, -0.5697288513183594, -0.5516433715820312, -0.5335578918457031, -0.515472412109375, -0.4973869323730469, -0.47930145263671875, -0.4612159729003906, -0.4431304931640625, -0.4250450134277344, -0.40695953369140625, -0.3888740539550781, -0.37078857421875, -0.3527030944824219, -0.33461761474609375, -0.3165321350097656, -0.2984466552734375, -0.2803611755371094, -0.26227569580078125, -0.24419021606445312, -0.226104736328125, -0.20801925659179688, -0.18993377685546875, -0.17184829711914062, -0.1537628173828125, -0.13567733764648438, -0.11759185791015625, -0.09950637817382812, -0.0814208984375, -0.06333541870117188, -0.04524993896484375, -0.027164459228515625, -0.0090789794921875, 0.009006500244140625, 0.02709197998046875, 0.045177459716796875, 0.063262939453125, 0.08134841918945312, 0.09943389892578125, 0.11751937866210938, 0.1356048583984375, 0.15369033813476562, 0.17177581787109375, 0.18986129760742188, 0.20794677734375, 0.22603225708007812, 0.24411773681640625, 0.2622032165527344, 0.2802886962890625, 0.2983741760253906, 0.31645965576171875, 0.3345451354980469, 0.352630615234375, 0.3707160949707031, 0.38880157470703125, 0.4068870544433594, 0.4249725341796875, 0.4430580139160156, 0.46114349365234375, 0.4792289733886719, 0.497314453125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 14.0, 28.0, 221.0, 639.0, 87.0, 18.0, 4.0, 3.0, 1.0], "bins": [-57.02280807495117, -56.044891357421875, -55.06697082519531, -54.089054107666016, -53.11113739013672, -52.133216857910156, -51.15530014038086, -50.17738342285156, -49.199462890625, -48.2215461730957, -47.24362564086914, -46.265708923339844, -45.28779220581055, -44.309871673583984, -43.33195495605469, -42.354034423828125, -41.37611770629883, -40.39820098876953, -39.42028045654297, -38.44236373901367, -37.464447021484375, -36.48652648925781, -35.508609771728516, -34.53069305419922, -33.552772521972656, -32.57485580444336, -31.59693717956543, -30.6190185546875, -29.64109992980957, -28.66318130493164, -27.685264587402344, -26.707345962524414, -25.729429244995117, -24.751510620117188, -23.77359390258789, -22.79567527770996, -21.81775665283203, -20.839839935302734, -19.861921310424805, -18.884002685546875, -17.906084060668945, -16.928165435791016, -15.950247764587402, -14.972330093383789, -13.99441146850586, -13.016493797302246, -12.038576126098633, -11.060657501220703, -10.082738876342773, -9.10482120513916, -8.12690258026123, -7.148984909057617, -6.1710662841796875, -5.193148612976074, -4.215230464935303, -3.2373123168945312, -2.259394645690918, -1.2814764976501465, -0.30355846881866455, 0.6743595600128174, 1.6522777080535889, 2.6301956176757812, 3.6081137657165527, 4.586031913757324, 5.563950061798096]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 5.0, 7.0, 10.0, 16.0, 12.0, 17.0, 17.0, 27.0, 25.0, 22.0, 25.0, 29.0, 42.0, 34.0, 41.0, 49.0, 32.0, 33.0, 39.0, 47.0, 37.0, 41.0, 31.0, 34.0, 43.0, 19.0, 26.0, 25.0, 23.0, 21.0, 15.0, 19.0, 21.0, 20.0, 18.0, 13.0, 6.0, 9.0, 9.0, 5.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.727214336395264, -6.497513294219971, -6.2678117752075195, -6.038110733032227, -5.808409690856934, -5.578708648681641, -5.349007606506348, -5.1193060874938965, -4.8896050453186035, -4.6599040031433105, -4.430202484130859, -4.200501441955566, -3.9708003997802734, -3.7410993576049805, -3.5113980770111084, -3.2816967964172363, -3.0519957542419434, -2.8222947120666504, -2.5925934314727783, -2.3628921508789062, -2.1331911087036133, -1.9034899473190308, -1.6737887859344482, -1.4440876245498657, -1.2143864631652832, -0.9846853017807007, -0.7549841403961182, -0.5252829790115356, -0.2955818176269531, -0.0658806562423706, 0.16382050514221191, 0.39352166652679443, 0.6232233047485352, 0.8529244661331177, 1.0826256275177002, 1.3123267889022827, 1.5420279502868652, 1.7717291116714478, 2.0014302730560303, 2.2311315536499023, 2.4608325958251953, 2.6905336380004883, 2.9202349185943604, 3.1499361991882324, 3.3796372413635254, 3.6093382835388184, 3.8390395641326904, 4.0687408447265625, 4.2984418869018555, 4.528142929077148, 4.757843971252441, 4.987545490264893, 5.2172465324401855, 5.4469475746154785, 5.67664909362793, 5.906350135803223, 6.136051177978516, 6.365752220153809, 6.595453262329102, 6.825154781341553, 7.054855823516846, 7.284556865692139, 7.51425838470459, 7.743959426879883, 7.973660469055176]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 8.0, 17.0, 16.0, 23.0, 34.0, 42.0, 66.0, 92.0, 139.0, 193.0, 321.0, 496.0, 777.0, 1330.0, 2385.0, 4661.0, 10608.0, 31128.0, 141712.0, 2584516.0, 1272444.0, 100071.0, 24427.0, 9067.0, 4097.0, 2132.0, 1255.0, 763.0, 484.0, 341.0, 220.0, 134.0, 87.0, 53.0, 42.0, 40.0, 19.0, 13.0, 8.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.033203125, -1.965240478515625, -1.89727783203125, -1.829315185546875, -1.7613525390625, -1.693389892578125, -1.62542724609375, -1.557464599609375, -1.489501953125, -1.421539306640625, -1.35357666015625, -1.285614013671875, -1.2176513671875, -1.149688720703125, -1.08172607421875, -1.013763427734375, -0.94580078125, -0.877838134765625, -0.80987548828125, -0.741912841796875, -0.6739501953125, -0.605987548828125, -0.53802490234375, -0.470062255859375, -0.402099609375, -0.334136962890625, -0.26617431640625, -0.198211669921875, -0.1302490234375, -0.062286376953125, 0.00567626953125, 0.073638916015625, 0.1416015625, 0.209564208984375, 0.27752685546875, 0.345489501953125, 0.4134521484375, 0.481414794921875, 0.54937744140625, 0.617340087890625, 0.685302734375, 0.753265380859375, 0.82122802734375, 0.889190673828125, 0.9571533203125, 1.025115966796875, 1.09307861328125, 1.161041259765625, 1.22900390625, 1.296966552734375, 1.36492919921875, 1.432891845703125, 1.5008544921875, 1.568817138671875, 1.63677978515625, 1.704742431640625, 1.772705078125, 1.840667724609375, 1.90863037109375, 1.976593017578125, 2.0445556640625, 2.112518310546875, 2.18048095703125, 2.248443603515625, 2.31640625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 6.0, 7.0, 10.0, 8.0, 15.0, 22.0, 40.0, 37.0, 49.0, 58.0, 78.0, 77.0, 87.0, 67.0, 83.0, 65.0, 54.0, 56.0, 31.0, 25.0, 25.0, 18.0, 15.0, 12.0, 11.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.095703125, -2.0281982421875, -1.960693359375, -1.8931884765625, -1.82568359375, -1.7581787109375, -1.690673828125, -1.6231689453125, -1.5556640625, -1.4881591796875, -1.420654296875, -1.3531494140625, -1.28564453125, -1.2181396484375, -1.150634765625, -1.0831298828125, -1.015625, -0.9481201171875, -0.880615234375, -0.8131103515625, -0.74560546875, -0.6781005859375, -0.610595703125, -0.5430908203125, -0.4755859375, -0.4080810546875, -0.340576171875, -0.2730712890625, -0.20556640625, -0.1380615234375, -0.070556640625, -0.0030517578125, 0.064453125, 0.1319580078125, 0.199462890625, 0.2669677734375, 0.33447265625, 0.4019775390625, 0.469482421875, 0.5369873046875, 0.6044921875, 0.6719970703125, 0.739501953125, 0.8070068359375, 0.87451171875, 0.9420166015625, 1.009521484375, 1.0770263671875, 1.14453125, 1.2120361328125, 1.279541015625, 1.3470458984375, 1.41455078125, 1.4820556640625, 1.549560546875, 1.6170654296875, 1.6845703125, 1.7520751953125, 1.819580078125, 1.8870849609375, 1.95458984375, 2.0220947265625, 2.089599609375, 2.1571044921875, 2.224609375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 9.0, 9.0, 14.0, 31.0, 30.0, 69.0, 133.0, 223.0, 596.0, 2024.0, 10606.0, 188176.0, 3933832.0, 51001.0, 5348.0, 1280.0, 442.0, 211.0, 106.0, 49.0, 27.0, 12.0, 23.0, 11.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.3787841796875, -4.218505859375, -4.0582275390625, -3.89794921875, -3.7376708984375, -3.577392578125, -3.4171142578125, -3.2568359375, -3.0965576171875, -2.936279296875, -2.7760009765625, -2.61572265625, -2.4554443359375, -2.295166015625, -2.1348876953125, -1.974609375, -1.8143310546875, -1.654052734375, -1.4937744140625, -1.33349609375, -1.1732177734375, -1.012939453125, -0.8526611328125, -0.6923828125, -0.5321044921875, -0.371826171875, -0.2115478515625, -0.05126953125, 0.1090087890625, 0.269287109375, 0.4295654296875, 0.58984375, 0.7501220703125, 0.910400390625, 1.0706787109375, 1.23095703125, 1.3912353515625, 1.551513671875, 1.7117919921875, 1.8720703125, 2.0323486328125, 2.192626953125, 2.3529052734375, 2.51318359375, 2.6734619140625, 2.833740234375, 2.9940185546875, 3.154296875, 3.3145751953125, 3.474853515625, 3.6351318359375, 3.79541015625, 3.9556884765625, 4.115966796875, 4.2762451171875, 4.4365234375, 4.5968017578125, 4.757080078125, 4.9173583984375, 5.07763671875, 5.2379150390625, 5.398193359375, 5.5584716796875, 5.71875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 9.0, 11.0, 12.0, 27.0, 33.0, 58.0, 69.0, 132.0, 264.0, 505.0, 1435.0, 716.0, 359.0, 177.0, 76.0, 67.0, 32.0, 27.0, 16.0, 10.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.93212890625, -0.9052200317382812, -0.8783111572265625, -0.8514022827148438, -0.824493408203125, -0.7975845336914062, -0.7706756591796875, -0.7437667846679688, -0.71685791015625, -0.6899490356445312, -0.6630401611328125, -0.6361312866210938, -0.609222412109375, -0.5823135375976562, -0.5554046630859375, -0.5284957885742188, -0.5015869140625, -0.47467803955078125, -0.4477691650390625, -0.42086029052734375, -0.393951416015625, -0.36704254150390625, -0.3401336669921875, -0.31322479248046875, -0.28631591796875, -0.25940704345703125, -0.2324981689453125, -0.20558929443359375, -0.178680419921875, -0.15177154541015625, -0.1248626708984375, -0.09795379638671875, -0.071044921875, -0.04413604736328125, -0.0172271728515625, 0.00968170166015625, 0.036590576171875, 0.06349945068359375, 0.0904083251953125, 0.11731719970703125, 0.14422607421875, 0.17113494873046875, 0.1980438232421875, 0.22495269775390625, 0.251861572265625, 0.27877044677734375, 0.3056793212890625, 0.33258819580078125, 0.3594970703125, 0.38640594482421875, 0.4133148193359375, 0.44022369384765625, 0.467132568359375, 0.49404144287109375, 0.5209503173828125, 0.5478591918945312, 0.57476806640625, 0.6016769409179688, 0.6285858154296875, 0.6554946899414062, 0.682403564453125, 0.7093124389648438, 0.7362213134765625, 0.7631301879882812, 0.7900390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 8.0, 8.0, 12.0, 11.0, 19.0, 29.0, 51.0, 77.0, 158.0, 204.0, 166.0, 96.0, 57.0, 36.0, 17.0, 15.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.210004806518555, -5.067798137664795, -4.925590991973877, -4.783384323120117, -4.641177177429199, -4.4989705085754395, -4.35676383972168, -4.214556694030762, -4.072350025177002, -3.930143117904663, -3.787936210632324, -3.6457295417785645, -3.5035226345062256, -3.3613157272338867, -3.219109058380127, -3.076902151107788, -2.934695243835449, -2.7924883365631104, -2.6502814292907715, -2.5080747604370117, -2.365867853164673, -2.223660945892334, -2.081454277038574, -1.9392473697662354, -1.7970404624938965, -1.6548335552215576, -1.5126267671585083, -1.370419979095459, -1.2282130718231201, -1.0860061645507812, -0.9437993764877319, -0.8015925288200378, -0.6593859195709229, -0.5171790719032288, -0.37497222423553467, -0.23276537656784058, -0.09055852890014648, 0.05164831876754761, 0.1938551664352417, 0.3360620141029358, 0.4782688617706299, 0.620475709438324, 0.7626825571060181, 0.9048894047737122, 1.0470962524414062, 1.1893031597137451, 1.3315099477767944, 1.4737167358398438, 1.6159236431121826, 1.7581305503845215, 1.9003373384475708, 2.04254412651062, 2.184751033782959, 2.326957941055298, 2.4691648483276367, 2.6113715171813965, 2.7535784244537354, 2.895785331726074, 3.037992000579834, 3.180198907852173, 3.3224058151245117, 3.4646127223968506, 3.6068196296691895, 3.749026298522949, 3.891233205795288]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 3.0, 1.0, 5.0, 7.0, 2.0, 9.0, 3.0, 12.0, 12.0, 18.0, 25.0, 30.0, 35.0, 45.0, 46.0, 61.0, 71.0, 76.0, 64.0, 55.0, 55.0, 50.0, 55.0, 41.0, 34.0, 34.0, 30.0, 28.0, 15.0, 20.0, 14.0, 8.0, 8.0, 12.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9250521659851074, -1.8598415851593018, -1.794631004333496, -1.7294204235076904, -1.6642097234725952, -1.5989991426467896, -1.5337885618209839, -1.4685779809951782, -1.403367280960083, -1.3381567001342773, -1.2729461193084717, -1.207735538482666, -1.1425248384475708, -1.0773142576217651, -1.0121036767959595, -0.9468930959701538, -0.8816825151443481, -0.8164719343185425, -0.751261293888092, -0.6860507130622864, -0.6208400726318359, -0.5556294918060303, -0.4904189109802246, -0.42520830035209656, -0.3599976897239685, -0.29478707909584045, -0.2295764833688736, -0.16436588764190674, -0.09915527701377869, -0.033944666385650635, 0.03126591444015503, 0.09647652506828308, 0.16168713569641113, 0.22689774632453918, 0.29210835695266724, 0.3573189377784729, 0.42252954840660095, 0.487740159034729, 0.5529507398605347, 0.6181613206863403, 0.6833719611167908, 0.7485825419425964, 0.8137931823730469, 0.8790037631988525, 0.9442143440246582, 1.0094249248504639, 1.0746355056762695, 1.1398462057113647, 1.2050567865371704, 1.270267367362976, 1.3354779481887817, 1.400688648223877, 1.4658992290496826, 1.5311098098754883, 1.596320390701294, 1.6615309715270996, 1.7267415523529053, 1.791952133178711, 1.8571627140045166, 1.9223732948303223, 1.9875839948654175, 2.0527944564819336, 2.1180052757263184, 2.183215856552124, 2.2484264373779297]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 5.0, 6.0, 6.0, 10.0, 11.0, 24.0, 29.0, 71.0, 78.0, 190.0, 317.0, 576.0, 1265.0, 2916.0, 7994.0, 24983.0, 97619.0, 413008.0, 378325.0, 86668.0, 21956.0, 7273.0, 2760.0, 1181.0, 539.0, 261.0, 197.0, 90.0, 59.0, 39.0, 29.0, 19.0, 14.0, 10.0, 7.0, 3.0, 4.0, 0.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273193359375, -0.2649040222167969, -0.25661468505859375, -0.24832534790039062, -0.2400360107421875, -0.23174667358398438, -0.22345733642578125, -0.21516799926757812, -0.206878662109375, -0.19858932495117188, -0.19029998779296875, -0.18201065063476562, -0.1737213134765625, -0.16543197631835938, -0.15714263916015625, -0.14885330200195312, -0.14056396484375, -0.13227462768554688, -0.12398529052734375, -0.11569595336914062, -0.1074066162109375, -0.09911727905273438, -0.09082794189453125, -0.08253860473632812, -0.074249267578125, -0.06595993041992188, -0.05767059326171875, -0.049381256103515625, -0.0410919189453125, -0.032802581787109375, -0.02451324462890625, -0.016223907470703125, -0.0079345703125, 0.000354766845703125, 0.00864410400390625, 0.016933441162109375, 0.0252227783203125, 0.033512115478515625, 0.04180145263671875, 0.050090789794921875, 0.058380126953125, 0.06666946411132812, 0.07495880126953125, 0.08324813842773438, 0.0915374755859375, 0.09982681274414062, 0.10811614990234375, 0.11640548706054688, 0.12469482421875, 0.13298416137695312, 0.14127349853515625, 0.14956283569335938, 0.1578521728515625, 0.16614151000976562, 0.17443084716796875, 0.18272018432617188, 0.191009521484375, 0.19929885864257812, 0.20758819580078125, 0.21587753295898438, 0.2241668701171875, 0.23245620727539062, 0.24074554443359375, 0.24903488159179688, 0.25732421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 3.0, 4.0, 8.0, 11.0, 17.0, 14.0, 20.0, 30.0, 35.0, 55.0, 47.0, 85.0, 81.0, 60.0, 81.0, 62.0, 71.0, 49.0, 47.0, 35.0, 23.0, 31.0, 26.0, 27.0, 18.0, 5.0, 12.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5751953125, -1.52313232421875, -1.4710693359375, -1.41900634765625, -1.366943359375, -1.31488037109375, -1.2628173828125, -1.21075439453125, -1.15869140625, -1.10662841796875, -1.0545654296875, -1.00250244140625, -0.950439453125, -0.89837646484375, -0.8463134765625, -0.79425048828125, -0.7421875, -0.69012451171875, -0.6380615234375, -0.58599853515625, -0.533935546875, -0.48187255859375, -0.4298095703125, -0.37774658203125, -0.32568359375, -0.27362060546875, -0.2215576171875, -0.16949462890625, -0.117431640625, -0.06536865234375, -0.0133056640625, 0.03875732421875, 0.0908203125, 0.14288330078125, 0.1949462890625, 0.24700927734375, 0.299072265625, 0.35113525390625, 0.4031982421875, 0.45526123046875, 0.50732421875, 0.55938720703125, 0.6114501953125, 0.66351318359375, 0.715576171875, 0.76763916015625, 0.8197021484375, 0.87176513671875, 0.923828125, 0.97589111328125, 1.0279541015625, 1.08001708984375, 1.132080078125, 1.18414306640625, 1.2362060546875, 1.28826904296875, 1.34033203125, 1.39239501953125, 1.4444580078125, 1.49652099609375, 1.548583984375, 1.60064697265625, 1.6527099609375, 1.70477294921875, 1.7568359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 8.0, 15.0, 14.0, 18.0, 25.0, 45.0, 63.0, 71.0, 127.0, 153.0, 215.0, 293.0, 462.0, 761.0, 1476.0, 3586.0, 9540.0, 33069.0, 124339.0, 359523.0, 348481.0, 118261.0, 31639.0, 9302.0, 3321.0, 1495.0, 754.0, 473.0, 258.0, 219.0, 158.0, 100.0, 77.0, 59.0, 32.0, 37.0, 24.0, 22.0, 8.0, 6.0, 12.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1920166015625, -0.18581771850585938, -0.17961883544921875, -0.17341995239257812, -0.1672210693359375, -0.16102218627929688, -0.15482330322265625, -0.14862442016601562, -0.142425537109375, -0.13622665405273438, -0.13002777099609375, -0.12382888793945312, -0.1176300048828125, -0.11143112182617188, -0.10523223876953125, -0.09903335571289062, -0.09283447265625, -0.08663558959960938, -0.08043670654296875, -0.07423782348632812, -0.0680389404296875, -0.061840057373046875, -0.05564117431640625, -0.049442291259765625, -0.043243408203125, -0.037044525146484375, -0.03084564208984375, -0.024646759033203125, -0.0184478759765625, -0.012248992919921875, -0.00605010986328125, 0.000148773193359375, 0.00634765625, 0.012546539306640625, 0.01874542236328125, 0.024944305419921875, 0.0311431884765625, 0.037342071533203125, 0.04354095458984375, 0.049739837646484375, 0.055938720703125, 0.062137603759765625, 0.06833648681640625, 0.07453536987304688, 0.0807342529296875, 0.08693313598632812, 0.09313201904296875, 0.09933090209960938, 0.10552978515625, 0.11172866821289062, 0.11792755126953125, 0.12412643432617188, 0.1303253173828125, 0.13652420043945312, 0.14272308349609375, 0.14892196655273438, 0.155120849609375, 0.16131973266601562, 0.16751861572265625, 0.17371749877929688, 0.1799163818359375, 0.18611526489257812, 0.19231414794921875, 0.19851303100585938, 0.2047119140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 10.0, 6.0, 9.0, 13.0, 17.0, 20.0, 23.0, 19.0, 20.0, 24.0, 32.0, 47.0, 28.0, 39.0, 34.0, 50.0, 49.0, 45.0, 43.0, 41.0, 45.0, 39.0, 35.0, 39.0, 37.0, 34.0, 28.0, 23.0, 21.0, 20.0, 18.0, 12.0, 13.0, 11.0, 8.0, 4.0, 10.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.31640625, -2.24383544921875, -2.1712646484375, -2.09869384765625, -2.026123046875, -1.95355224609375, -1.8809814453125, -1.80841064453125, -1.73583984375, -1.66326904296875, -1.5906982421875, -1.51812744140625, -1.445556640625, -1.37298583984375, -1.3004150390625, -1.22784423828125, -1.1552734375, -1.08270263671875, -1.0101318359375, -0.93756103515625, -0.864990234375, -0.79241943359375, -0.7198486328125, -0.64727783203125, -0.57470703125, -0.50213623046875, -0.4295654296875, -0.35699462890625, -0.284423828125, -0.21185302734375, -0.1392822265625, -0.06671142578125, 0.005859375, 0.07843017578125, 0.1510009765625, 0.22357177734375, 0.296142578125, 0.36871337890625, 0.4412841796875, 0.51385498046875, 0.58642578125, 0.65899658203125, 0.7315673828125, 0.80413818359375, 0.876708984375, 0.94927978515625, 1.0218505859375, 1.09442138671875, 1.1669921875, 1.23956298828125, 1.3121337890625, 1.38470458984375, 1.457275390625, 1.52984619140625, 1.6024169921875, 1.67498779296875, 1.74755859375, 1.82012939453125, 1.8927001953125, 1.96527099609375, 2.037841796875, 2.11041259765625, 2.1829833984375, 2.25555419921875, 2.328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 9.0, 18.0, 20.0, 47.0, 97.0, 217.0, 630.0, 2024.0, 11669.0, 195606.0, 790763.0, 41070.0, 4705.0, 993.0, 323.0, 152.0, 75.0, 52.0, 32.0, 11.0, 11.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2197265625, -0.21452713012695312, -0.20932769775390625, -0.20412826538085938, -0.1989288330078125, -0.19372940063476562, -0.18852996826171875, -0.18333053588867188, -0.178131103515625, -0.17293167114257812, -0.16773223876953125, -0.16253280639648438, -0.1573333740234375, -0.15213394165039062, -0.14693450927734375, -0.14173507690429688, -0.13653564453125, -0.13133621215820312, -0.12613677978515625, -0.12093734741210938, -0.1157379150390625, -0.11053848266601562, -0.10533905029296875, -0.10013961791992188, -0.094940185546875, -0.08974075317382812, -0.08454132080078125, -0.07934188842773438, -0.0741424560546875, -0.06894302368164062, -0.06374359130859375, -0.058544158935546875, -0.0533447265625, -0.048145294189453125, -0.04294586181640625, -0.037746429443359375, -0.0325469970703125, -0.027347564697265625, -0.02214813232421875, -0.016948699951171875, -0.011749267578125, -0.006549835205078125, -0.00135040283203125, 0.003849029541015625, 0.0090484619140625, 0.014247894287109375, 0.01944732666015625, 0.024646759033203125, 0.02984619140625, 0.035045623779296875, 0.04024505615234375, 0.045444488525390625, 0.0506439208984375, 0.055843353271484375, 0.06104278564453125, 0.06624221801757812, 0.071441650390625, 0.07664108276367188, 0.08184051513671875, 0.08703994750976562, 0.0922393798828125, 0.09743881225585938, 0.10263824462890625, 0.10783767700195312, 0.113037109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 8.0, 27.0, 34.0, 41.0, 108.0, 129.0, 142.0, 149.0, 135.0, 90.0, 49.0, 30.0, 15.0, 20.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00011348724365234375, -0.00011090654879808426, -0.00010832585394382477, -0.00010574515908956528, -0.00010316446423530579, -0.0001005837693810463, -9.80030745267868e-05, -9.542237967252731e-05, -9.284168481826782e-05, -9.026098996400833e-05, -8.768029510974884e-05, -8.509960025548935e-05, -8.251890540122986e-05, -7.993821054697037e-05, -7.735751569271088e-05, -7.477682083845139e-05, -7.21961259841919e-05, -6.96154311299324e-05, -6.703473627567291e-05, -6.445404142141342e-05, -6.187334656715393e-05, -5.929265171289444e-05, -5.671195685863495e-05, -5.413126200437546e-05, -5.155056715011597e-05, -4.8969872295856476e-05, -4.6389177441596985e-05, -4.3808482587337494e-05, -4.1227787733078e-05, -3.864709287881851e-05, -3.606639802455902e-05, -3.348570317029953e-05, -3.090500831604004e-05, -2.8324313461780548e-05, -2.5743618607521057e-05, -2.3162923753261566e-05, -2.0582228899002075e-05, -1.8001534044742584e-05, -1.5420839190483093e-05, -1.2840144336223602e-05, -1.0259449481964111e-05, -7.67875462770462e-06, -5.098059773445129e-06, -2.5173649191856384e-06, 6.332993507385254e-08, 2.6440247893333435e-06, 5.2247196435928345e-06, 7.805414497852325e-06, 1.0386109352111816e-05, 1.2966804206371307e-05, 1.55474990606308e-05, 1.812819391489029e-05, 2.070888876914978e-05, 2.328958362340927e-05, 2.5870278477668762e-05, 2.8450973331928253e-05, 3.1031668186187744e-05, 3.3612363040447235e-05, 3.6193057894706726e-05, 3.877375274896622e-05, 4.135444760322571e-05, 4.39351424574852e-05, 4.651583731174469e-05, 4.909653216600418e-05, 5.167722702026367e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 7.0, 12.0, 9.0, 17.0, 15.0, 46.0, 87.0, 179.0, 442.0, 1507.0, 10669.0, 430810.0, 589175.0, 13101.0, 1634.0, 472.0, 165.0, 84.0, 47.0, 32.0, 15.0, 9.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.28076171875, -0.27392005920410156, -0.2670783996582031, -0.2602367401123047, -0.25339508056640625, -0.2465534210205078, -0.23971176147460938, -0.23287010192871094, -0.2260284423828125, -0.21918678283691406, -0.21234512329101562, -0.2055034637451172, -0.19866180419921875, -0.1918201446533203, -0.18497848510742188, -0.17813682556152344, -0.171295166015625, -0.16445350646972656, -0.15761184692382812, -0.1507701873779297, -0.14392852783203125, -0.1370868682861328, -0.13024520874023438, -0.12340354919433594, -0.1165618896484375, -0.10972023010253906, -0.10287857055664062, -0.09603691101074219, -0.08919525146484375, -0.08235359191894531, -0.07551193237304688, -0.06867027282714844, -0.06182861328125, -0.05498695373535156, -0.048145294189453125, -0.04130363464355469, -0.03446197509765625, -0.027620315551757812, -0.020778656005859375, -0.013936996459960938, -0.0070953369140625, -0.0002536773681640625, 0.006587982177734375, 0.013429641723632812, 0.02027130126953125, 0.027112960815429688, 0.033954620361328125, 0.04079627990722656, 0.047637939453125, 0.05447959899902344, 0.061321258544921875, 0.06816291809082031, 0.07500457763671875, 0.08184623718261719, 0.08868789672851562, 0.09552955627441406, 0.1023712158203125, 0.10921287536621094, 0.11605453491210938, 0.12289619445800781, 0.12973785400390625, 0.1365795135498047, 0.14342117309570312, 0.15026283264160156, 0.1571044921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 19.0, 24.0, 77.0, 149.0, 262.0, 234.0, 113.0, 51.0, 30.0, 13.0, 8.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036895751953125, -0.0352787971496582, -0.033661842346191406, -0.03204488754272461, -0.030427932739257812, -0.028810977935791016, -0.02719402313232422, -0.025577068328857422, -0.023960113525390625, -0.022343158721923828, -0.02072620391845703, -0.019109249114990234, -0.017492294311523438, -0.01587533950805664, -0.014258384704589844, -0.012641429901123047, -0.01102447509765625, -0.009407520294189453, -0.007790565490722656, -0.006173610687255859, -0.0045566558837890625, -0.0029397010803222656, -0.0013227462768554688, 0.0002942085266113281, 0.001911163330078125, 0.003528118133544922, 0.005145072937011719, 0.006762027740478516, 0.008378982543945312, 0.00999593734741211, 0.011612892150878906, 0.013229846954345703, 0.0148468017578125, 0.016463756561279297, 0.018080711364746094, 0.01969766616821289, 0.021314620971679688, 0.022931575775146484, 0.02454853057861328, 0.026165485382080078, 0.027782440185546875, 0.029399394989013672, 0.03101634979248047, 0.032633304595947266, 0.03425025939941406, 0.03586721420288086, 0.037484169006347656, 0.03910112380981445, 0.04071807861328125, 0.04233503341674805, 0.043951988220214844, 0.04556894302368164, 0.04718589782714844, 0.048802852630615234, 0.05041980743408203, 0.05203676223754883, 0.053653717041015625, 0.05527067184448242, 0.05688762664794922, 0.058504581451416016, 0.06012153625488281, 0.06173849105834961, 0.0633554458618164, 0.0649724006652832, 0.06658935546875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 4.0, 10.0, 12.0, 11.0, 21.0, 32.0, 59.0, 129.0, 224.0, 213.0, 107.0, 66.0, 29.0, 30.0, 17.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4636218547821045, -3.3551101684570312, -3.246598482131958, -3.1380867958068848, -3.0295751094818115, -2.9210634231567383, -2.812551736831665, -2.704040050506592, -2.5955283641815186, -2.4870166778564453, -2.378504991531372, -2.269993305206299, -2.1614816188812256, -2.0529699325561523, -1.944458246231079, -1.8359465599060059, -1.7274348735809326, -1.6189231872558594, -1.5104115009307861, -1.401899814605713, -1.2933881282806396, -1.1848764419555664, -1.0763647556304932, -0.9678530693054199, -0.8593413829803467, -0.7508296966552734, -0.6423180103302002, -0.533806324005127, -0.4252946376800537, -0.31678295135498047, -0.20827126502990723, -0.09975957870483398, 0.008751869201660156, 0.1172635555267334, 0.22577524185180664, 0.3342869281768799, 0.4427986145019531, 0.5513103008270264, 0.6598219871520996, 0.7683336734771729, 0.8768453598022461, 0.9853570461273193, 1.0938687324523926, 1.2023804187774658, 1.310892105102539, 1.4194037914276123, 1.5279154777526855, 1.6364271640777588, 1.744938850402832, 1.8534505367279053, 1.9619622230529785, 2.0704739093780518, 2.178985595703125, 2.2874972820281982, 2.3960089683532715, 2.5045206546783447, 2.613032341003418, 2.721544027328491, 2.8300557136535645, 2.9385673999786377, 3.047079086303711, 3.155590772628784, 3.2641024589538574, 3.3726141452789307, 3.481125831604004]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 9.0, 1.0, 5.0, 5.0, 10.0, 9.0, 14.0, 25.0, 29.0, 28.0, 45.0, 50.0, 64.0, 84.0, 74.0, 73.0, 58.0, 61.0, 63.0, 47.0, 44.0, 40.0, 25.0, 32.0, 20.0, 16.0, 13.0, 11.0, 6.0, 11.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5008580684661865, -1.452011227607727, -1.4031645059585571, -1.3543176651000977, -1.3054708242416382, -1.2566239833831787, -1.2077772617340088, -1.1589304208755493, -1.1100835800170898, -1.0612367391586304, -1.0123900175094604, -0.963543176651001, -0.9146963357925415, -0.8658495545387268, -0.8170027732849121, -0.7681559324264526, -0.7193092107772827, -0.670462429523468, -0.6216155886650085, -0.5727688074111938, -0.5239219665527344, -0.4750751852989197, -0.426228404045105, -0.3773815929889679, -0.3285347819328308, -0.2796879708766937, -0.23084117472171783, -0.18199437856674194, -0.13314756751060486, -0.08430075645446777, -0.035453975200653076, 0.013392835855484009, 0.06223952770233154, 0.11108633130788803, 0.15993313491344452, 0.2087799310684204, 0.2576267421245575, 0.3064735531806946, 0.3553203344345093, 0.40416714549064636, 0.45301395654678345, 0.5018607378005981, 0.5507075786590576, 0.5995543599128723, 0.648401141166687, 0.6972479820251465, 0.7460947632789612, 0.7949415445327759, 0.8437883853912354, 0.89263516664505, 0.9414820075035095, 0.9903287887573242, 1.0391756296157837, 1.0880224704742432, 1.136869192123413, 1.1857160329818726, 1.234562873840332, 1.2834097146987915, 1.3322564363479614, 1.381103277206421, 1.4299501180648804, 1.4787969589233398, 1.5276436805725098, 1.5764905214309692, 1.6253372430801392]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 3.0, 8.0, 8.0, 23.0, 25.0, 26.0, 33.0, 56.0, 73.0, 93.0, 141.0, 188.0, 285.0, 402.0, 672.0, 1062.0, 1910.0, 3350.0, 6794.0, 16386.0, 55945.0, 543165.0, 344691.0, 44998.0, 14403.0, 6180.0, 2945.0, 1724.0, 990.0, 647.0, 419.0, 256.0, 148.0, 126.0, 108.0, 64.0, 49.0, 35.0, 32.0, 14.0, 20.0, 12.0, 7.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.7451171875, -1.6936798095703125, -1.642242431640625, -1.5908050537109375, -1.53936767578125, -1.4879302978515625, -1.436492919921875, -1.3850555419921875, -1.3336181640625, -1.2821807861328125, -1.230743408203125, -1.1793060302734375, -1.12786865234375, -1.0764312744140625, -1.024993896484375, -0.9735565185546875, -0.922119140625, -0.8706817626953125, -0.819244384765625, -0.7678070068359375, -0.71636962890625, -0.6649322509765625, -0.613494873046875, -0.5620574951171875, -0.5106201171875, -0.4591827392578125, -0.407745361328125, -0.3563079833984375, -0.30487060546875, -0.2534332275390625, -0.201995849609375, -0.1505584716796875, -0.09912109375, -0.0476837158203125, 0.003753662109375, 0.0551910400390625, 0.10662841796875, 0.1580657958984375, 0.209503173828125, 0.2609405517578125, 0.3123779296875, 0.3638153076171875, 0.415252685546875, 0.4666900634765625, 0.51812744140625, 0.5695648193359375, 0.621002197265625, 0.6724395751953125, 0.723876953125, 0.7753143310546875, 0.826751708984375, 0.8781890869140625, 0.92962646484375, 0.9810638427734375, 1.032501220703125, 1.0839385986328125, 1.1353759765625, 1.1868133544921875, 1.238250732421875, 1.2896881103515625, 1.34112548828125, 1.3925628662109375, 1.444000244140625, 1.4954376220703125, 1.546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 6.0, 2.0, 8.0, 4.0, 7.0, 5.0, 9.0, 18.0, 21.0, 23.0, 45.0, 55.0, 66.0, 95.0, 99.0, 79.0, 63.0, 72.0, 62.0, 53.0, 45.0, 38.0, 36.0, 21.0, 13.0, 15.0, 8.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.9921875, -3.86663818359375, -3.7410888671875, -3.61553955078125, -3.489990234375, -3.36444091796875, -3.2388916015625, -3.11334228515625, -2.98779296875, -2.86224365234375, -2.7366943359375, -2.61114501953125, -2.485595703125, -2.36004638671875, -2.2344970703125, -2.10894775390625, -1.9833984375, -1.85784912109375, -1.7322998046875, -1.60675048828125, -1.481201171875, -1.35565185546875, -1.2301025390625, -1.10455322265625, -0.97900390625, -0.85345458984375, -0.7279052734375, -0.60235595703125, -0.476806640625, -0.35125732421875, -0.2257080078125, -0.10015869140625, 0.025390625, 0.15093994140625, 0.2764892578125, 0.40203857421875, 0.527587890625, 0.65313720703125, 0.7786865234375, 0.90423583984375, 1.02978515625, 1.15533447265625, 1.2808837890625, 1.40643310546875, 1.531982421875, 1.65753173828125, 1.7830810546875, 1.90863037109375, 2.0341796875, 2.15972900390625, 2.2852783203125, 2.41082763671875, 2.536376953125, 2.66192626953125, 2.7874755859375, 2.91302490234375, 3.03857421875, 3.16412353515625, 3.2896728515625, 3.41522216796875, 3.540771484375, 3.66632080078125, 3.7918701171875, 3.91741943359375, 4.04296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 10.0, 9.0, 12.0, 17.0, 39.0, 65.0, 83.0, 165.0, 265.0, 552.0, 1031.0, 2395.0, 6653.0, 25597.0, 329164.0, 635779.0, 33327.0, 7960.0, 2800.0, 1224.0, 596.0, 295.0, 185.0, 112.0, 60.0, 43.0, 33.0, 19.0, 14.0, 8.0, 5.0, 9.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.587890625, -1.527008056640625, -1.46612548828125, -1.405242919921875, -1.3443603515625, -1.283477783203125, -1.22259521484375, -1.161712646484375, -1.100830078125, -1.039947509765625, -0.97906494140625, -0.918182373046875, -0.8572998046875, -0.796417236328125, -0.73553466796875, -0.674652099609375, -0.61376953125, -0.552886962890625, -0.49200439453125, -0.431121826171875, -0.3702392578125, -0.309356689453125, -0.24847412109375, -0.187591552734375, -0.126708984375, -0.065826416015625, -0.00494384765625, 0.055938720703125, 0.1168212890625, 0.177703857421875, 0.23858642578125, 0.299468994140625, 0.3603515625, 0.421234130859375, 0.48211669921875, 0.542999267578125, 0.6038818359375, 0.664764404296875, 0.72564697265625, 0.786529541015625, 0.847412109375, 0.908294677734375, 0.96917724609375, 1.030059814453125, 1.0909423828125, 1.151824951171875, 1.21270751953125, 1.273590087890625, 1.33447265625, 1.395355224609375, 1.45623779296875, 1.517120361328125, 1.5780029296875, 1.638885498046875, 1.69976806640625, 1.760650634765625, 1.821533203125, 1.882415771484375, 1.94329833984375, 2.004180908203125, 2.0650634765625, 2.125946044921875, 2.18682861328125, 2.247711181640625, 2.30859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 0.0, 3.0, 7.0, 6.0, 5.0, 5.0, 10.0, 12.0, 11.0, 11.0, 17.0, 22.0, 27.0, 25.0, 29.0, 26.0, 40.0, 39.0, 44.0, 42.0, 43.0, 48.0, 48.0, 34.0, 34.0, 45.0, 37.0, 44.0, 32.0, 32.0, 22.0, 28.0, 26.0, 23.0, 20.0, 15.0, 20.0, 17.0, 9.0, 9.0, 5.0, 8.0, 7.0, 1.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.16015625, -3.055450439453125, -2.95074462890625, -2.846038818359375, -2.7413330078125, -2.636627197265625, -2.53192138671875, -2.427215576171875, -2.322509765625, -2.217803955078125, -2.11309814453125, -2.008392333984375, -1.9036865234375, -1.798980712890625, -1.69427490234375, -1.589569091796875, -1.48486328125, -1.380157470703125, -1.27545166015625, -1.170745849609375, -1.0660400390625, -0.961334228515625, -0.85662841796875, -0.751922607421875, -0.647216796875, -0.542510986328125, -0.43780517578125, -0.333099365234375, -0.2283935546875, -0.123687744140625, -0.01898193359375, 0.085723876953125, 0.1904296875, 0.295135498046875, 0.39984130859375, 0.504547119140625, 0.6092529296875, 0.713958740234375, 0.81866455078125, 0.923370361328125, 1.028076171875, 1.132781982421875, 1.23748779296875, 1.342193603515625, 1.4468994140625, 1.551605224609375, 1.65631103515625, 1.761016845703125, 1.86572265625, 1.970428466796875, 2.07513427734375, 2.179840087890625, 2.2845458984375, 2.389251708984375, 2.49395751953125, 2.598663330078125, 2.703369140625, 2.808074951171875, 2.91278076171875, 3.017486572265625, 3.1221923828125, 3.226898193359375, 3.33160400390625, 3.436309814453125, 3.541015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 12.0, 8.0, 8.0, 15.0, 21.0, 38.0, 58.0, 111.0, 189.0, 372.0, 719.0, 2169.0, 6543.0, 29291.0, 682685.0, 295464.0, 22057.0, 5466.0, 1802.0, 696.0, 332.0, 197.0, 105.0, 60.0, 41.0, 25.0, 24.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0224609375, -0.9904327392578125, -0.958404541015625, -0.9263763427734375, -0.89434814453125, -0.8623199462890625, -0.830291748046875, -0.7982635498046875, -0.7662353515625, -0.7342071533203125, -0.702178955078125, -0.6701507568359375, -0.63812255859375, -0.6060943603515625, -0.574066162109375, -0.5420379638671875, -0.510009765625, -0.4779815673828125, -0.445953369140625, -0.4139251708984375, -0.38189697265625, -0.3498687744140625, -0.317840576171875, -0.2858123779296875, -0.2537841796875, -0.2217559814453125, -0.189727783203125, -0.1576995849609375, -0.12567138671875, -0.0936431884765625, -0.061614990234375, -0.0295867919921875, 0.00244140625, 0.0344696044921875, 0.066497802734375, 0.0985260009765625, 0.13055419921875, 0.1625823974609375, 0.194610595703125, 0.2266387939453125, 0.2586669921875, 0.2906951904296875, 0.322723388671875, 0.3547515869140625, 0.38677978515625, 0.4188079833984375, 0.450836181640625, 0.4828643798828125, 0.514892578125, 0.5469207763671875, 0.578948974609375, 0.6109771728515625, 0.64300537109375, 0.6750335693359375, 0.707061767578125, 0.7390899658203125, 0.7711181640625, 0.8031463623046875, 0.835174560546875, 0.8672027587890625, 0.89923095703125, 0.9312591552734375, 0.963287353515625, 0.9953155517578125, 1.02734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 2.0, 8.0, 10.0, 9.0, 19.0, 17.0, 38.0, 77.0, 150.0, 390.0, 112.0, 61.0, 34.0, 16.0, 22.0, 8.0, 5.0, 4.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022530555725097656, -0.0002191103994846344, -0.00021291524171829224, -0.00020672008395195007, -0.0002005249261856079, -0.00019432976841926575, -0.00018813461065292358, -0.00018193945288658142, -0.00017574429512023926, -0.0001695491373538971, -0.00016335397958755493, -0.00015715882182121277, -0.0001509636640548706, -0.00014476850628852844, -0.00013857334852218628, -0.00013237819075584412, -0.00012618303298950195, -0.00011998787522315979, -0.00011379271745681763, -0.00010759755969047546, -0.0001014024019241333, -9.520724415779114e-05, -8.901208639144897e-05, -8.281692862510681e-05, -7.662177085876465e-05, -7.042661309242249e-05, -6.423145532608032e-05, -5.803629755973816e-05, -5.1841139793395996e-05, -4.564598202705383e-05, -3.945082426071167e-05, -3.325566649436951e-05, -2.7060508728027344e-05, -2.086535096168518e-05, -1.4670193195343018e-05, -8.475035429000854e-06, -2.2798776626586914e-06, 3.915280103683472e-06, 1.0110437870025635e-05, 1.6305595636367798e-05, 2.250075340270996e-05, 2.8695911169052124e-05, 3.489106893539429e-05, 4.108622670173645e-05, 4.728138446807861e-05, 5.3476542234420776e-05, 5.967170000076294e-05, 6.58668577671051e-05, 7.206201553344727e-05, 7.825717329978943e-05, 8.445233106613159e-05, 9.064748883247375e-05, 9.684264659881592e-05, 0.00010303780436515808, 0.00010923296213150024, 0.00011542811989784241, 0.00012162327766418457, 0.00012781843543052673, 0.0001340135931968689, 0.00014020875096321106, 0.00014640390872955322, 0.00015259906649589539, 0.00015879422426223755, 0.0001649893820285797, 0.00017118453979492188]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 11.0, 16.0, 18.0, 25.0, 23.0, 31.0, 42.0, 65.0, 75.0, 109.0, 181.0, 264.0, 538.0, 983.0, 2062.0, 4775.0, 13587.0, 63189.0, 773865.0, 152679.0, 22947.0, 7044.0, 2895.0, 1276.0, 705.0, 386.0, 231.0, 149.0, 111.0, 73.0, 53.0, 25.0, 21.0, 27.0, 10.0, 16.0, 14.0, 8.0, 2.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.794921875, -0.771331787109375, -0.74774169921875, -0.724151611328125, -0.7005615234375, -0.676971435546875, -0.65338134765625, -0.629791259765625, -0.606201171875, -0.582611083984375, -0.55902099609375, -0.535430908203125, -0.5118408203125, -0.488250732421875, -0.46466064453125, -0.441070556640625, -0.41748046875, -0.393890380859375, -0.37030029296875, -0.346710205078125, -0.3231201171875, -0.299530029296875, -0.27593994140625, -0.252349853515625, -0.228759765625, -0.205169677734375, -0.18157958984375, -0.157989501953125, -0.1343994140625, -0.110809326171875, -0.08721923828125, -0.063629150390625, -0.0400390625, -0.016448974609375, 0.00714111328125, 0.030731201171875, 0.0543212890625, 0.077911376953125, 0.10150146484375, 0.125091552734375, 0.148681640625, 0.172271728515625, 0.19586181640625, 0.219451904296875, 0.2430419921875, 0.266632080078125, 0.29022216796875, 0.313812255859375, 0.33740234375, 0.360992431640625, 0.38458251953125, 0.408172607421875, 0.4317626953125, 0.455352783203125, 0.47894287109375, 0.502532958984375, 0.526123046875, 0.549713134765625, 0.57330322265625, 0.596893310546875, 0.6204833984375, 0.644073486328125, 0.66766357421875, 0.691253662109375, 0.71484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 8.0, 13.0, 10.0, 15.0, 12.0, 30.0, 39.0, 30.0, 61.0, 112.0, 232.0, 139.0, 61.0, 51.0, 37.0, 21.0, 23.0, 14.0, 14.0, 9.0, 7.0, 2.0, 2.0, 7.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3388671875, -0.3288421630859375, -0.318817138671875, -0.3087921142578125, -0.29876708984375, -0.2887420654296875, -0.278717041015625, -0.2686920166015625, -0.2586669921875, -0.2486419677734375, -0.238616943359375, -0.2285919189453125, -0.21856689453125, -0.2085418701171875, -0.198516845703125, -0.1884918212890625, -0.178466796875, -0.1684417724609375, -0.158416748046875, -0.1483917236328125, -0.13836669921875, -0.1283416748046875, -0.118316650390625, -0.1082916259765625, -0.0982666015625, -0.0882415771484375, -0.078216552734375, -0.0681915283203125, -0.05816650390625, -0.0481414794921875, -0.038116455078125, -0.0280914306640625, -0.01806640625, -0.0080413818359375, 0.001983642578125, 0.0120086669921875, 0.02203369140625, 0.0320587158203125, 0.042083740234375, 0.0521087646484375, 0.0621337890625, 0.0721588134765625, 0.082183837890625, 0.0922088623046875, 0.10223388671875, 0.1122589111328125, 0.122283935546875, 0.1323089599609375, 0.142333984375, 0.1523590087890625, 0.162384033203125, 0.1724090576171875, 0.18243408203125, 0.1924591064453125, 0.202484130859375, 0.2125091552734375, 0.2225341796875, 0.2325592041015625, 0.242584228515625, 0.2526092529296875, 0.26263427734375, 0.2726593017578125, 0.282684326171875, 0.2927093505859375, 0.302734375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 11.0, 18.0, 30.0, 82.0, 229.0, 366.0, 162.0, 57.0, 23.0, 7.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.68994665145874, -4.275148391723633, -3.8603501319885254, -3.445551872253418, -3.0307536125183105, -2.6159555912017822, -2.201157331466675, -1.7863590717315674, -1.37156081199646, -0.9567625522613525, -0.5419643521308899, -0.12716615200042725, 0.2876321077346802, 0.702430248260498, 1.1172285079956055, 1.532026767730713, 1.9468250274658203, 2.3616232872009277, 2.776421546936035, 3.1912198066711426, 3.60601806640625, 4.020815849304199, 4.435614585876465, 4.850412368774414, 5.26521110534668, 5.680009365081787, 6.0948076248168945, 6.509605884552002, 6.924404144287109, 7.339201927185059, 7.754000663757324, 8.168798446655273, 8.583596229553223, 8.998394012451172, 9.413192749023438, 9.827990531921387, 10.242789268493652, 10.657587051391602, 11.072385787963867, 11.487183570861816, 11.901982307434082, 12.316780090332031, 12.731578826904297, 13.146376609802246, 13.561175346374512, 13.975973129272461, 14.390771865844727, 14.805569648742676, 15.220367431640625, 15.635165214538574, 16.049962997436523, 16.46476173400879, 16.879560470581055, 17.29435920715332, 17.709156036376953, 18.12395477294922, 18.538753509521484, 18.95355224609375, 19.368349075317383, 19.78314781188965, 20.197946548461914, 20.61274528503418, 21.027542114257812, 21.442340850830078, 21.857139587402344]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 11.0, 18.0, 15.0, 25.0, 28.0, 20.0, 14.0, 34.0, 30.0, 30.0, 34.0, 36.0, 31.0, 41.0, 41.0, 32.0, 38.0, 27.0, 38.0, 46.0, 31.0, 30.0, 37.0, 36.0, 31.0, 19.0, 30.0, 28.0, 5.0, 17.0, 18.0, 12.0, 16.0, 16.0, 4.0, 2.0, 9.0, 5.0, 4.0, 2.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.528428554534912, -5.359193801879883, -5.189959526062012, -5.020724773406982, -4.851490020751953, -4.682255744934082, -4.513020992279053, -4.343786239624023, -4.174551963806152, -4.005317211151123, -3.836082696914673, -3.6668481826782227, -3.4976136684417725, -3.3283791542053223, -3.159144401550293, -2.9899098873138428, -2.8206751346588135, -2.6514406204223633, -2.482205867767334, -2.312971353530884, -2.1437368392944336, -1.9745022058486938, -1.805267572402954, -1.636033058166504, -1.4667984247207642, -1.2975637912750244, -1.1283292770385742, -0.9590946435928345, -0.7898600697517395, -0.6206254959106445, -0.4513908624649048, -0.2821563482284546, -0.11292171478271484, 0.05631287395954132, 0.22554746270179749, 0.39478206634521484, 0.5640166401863098, 0.7332512140274048, 0.9024858474731445, 1.0717203617095947, 1.2409549951553345, 1.4101896286010742, 1.5794241428375244, 1.7486587762832642, 1.917893409729004, 2.087127923965454, 2.2563624382019043, 2.4255971908569336, 2.594831705093384, 2.764066219329834, 2.9333009719848633, 3.1025354862213135, 3.2717700004577637, 3.441004753112793, 3.610239267349243, 3.7794737815856934, 3.9487085342407227, 4.117943286895752, 4.287177562713623, 4.456412315368652, 4.625647068023682, 4.794881343841553, 4.964116096496582, 5.133350372314453, 5.302585124969482]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 10.0, 11.0, 14.0, 18.0, 30.0, 49.0, 65.0, 102.0, 149.0, 267.0, 417.0, 800.0, 1568.0, 3382.0, 9402.0, 36615.0, 365435.0, 3605318.0, 137071.0, 21415.0, 6444.0, 2708.0, 1237.0, 651.0, 396.0, 246.0, 155.0, 94.0, 64.0, 44.0, 31.0, 24.0, 18.0, 8.0, 9.0, 8.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.591796875, -3.50048828125, -3.4091796875, -3.31787109375, -3.2265625, -3.13525390625, -3.0439453125, -2.95263671875, -2.861328125, -2.77001953125, -2.6787109375, -2.58740234375, -2.49609375, -2.40478515625, -2.3134765625, -2.22216796875, -2.130859375, -2.03955078125, -1.9482421875, -1.85693359375, -1.765625, -1.67431640625, -1.5830078125, -1.49169921875, -1.400390625, -1.30908203125, -1.2177734375, -1.12646484375, -1.03515625, -0.94384765625, -0.8525390625, -0.76123046875, -0.669921875, -0.57861328125, -0.4873046875, -0.39599609375, -0.3046875, -0.21337890625, -0.1220703125, -0.03076171875, 0.060546875, 0.15185546875, 0.2431640625, 0.33447265625, 0.42578125, 0.51708984375, 0.6083984375, 0.69970703125, 0.791015625, 0.88232421875, 0.9736328125, 1.06494140625, 1.15625, 1.24755859375, 1.3388671875, 1.43017578125, 1.521484375, 1.61279296875, 1.7041015625, 1.79541015625, 1.88671875, 1.97802734375, 2.0693359375, 2.16064453125, 2.251953125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 5.0, 4.0, 8.0, 14.0, 12.0, 20.0, 20.0, 21.0, 25.0, 55.0, 49.0, 62.0, 64.0, 76.0, 85.0, 70.0, 62.0, 54.0, 46.0, 40.0, 46.0, 25.0, 21.0, 19.0, 18.0, 7.0, 10.0, 6.0, 10.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.76171875, -1.7061309814453125, -1.650543212890625, -1.5949554443359375, -1.53936767578125, -1.4837799072265625, -1.428192138671875, -1.3726043701171875, -1.3170166015625, -1.2614288330078125, -1.205841064453125, -1.1502532958984375, -1.09466552734375, -1.0390777587890625, -0.983489990234375, -0.9279022216796875, -0.872314453125, -0.8167266845703125, -0.761138916015625, -0.7055511474609375, -0.64996337890625, -0.5943756103515625, -0.538787841796875, -0.4832000732421875, -0.4276123046875, -0.3720245361328125, -0.316436767578125, -0.2608489990234375, -0.20526123046875, -0.1496734619140625, -0.094085693359375, -0.0384979248046875, 0.01708984375, 0.0726776123046875, 0.128265380859375, 0.1838531494140625, 0.23944091796875, 0.2950286865234375, 0.350616455078125, 0.4062042236328125, 0.4617919921875, 0.5173797607421875, 0.572967529296875, 0.6285552978515625, 0.68414306640625, 0.7397308349609375, 0.795318603515625, 0.8509063720703125, 0.906494140625, 0.9620819091796875, 1.017669677734375, 1.0732574462890625, 1.12884521484375, 1.1844329833984375, 1.240020751953125, 1.2956085205078125, 1.3511962890625, 1.4067840576171875, 1.462371826171875, 1.5179595947265625, 1.57354736328125, 1.6291351318359375, 1.684722900390625, 1.7403106689453125, 1.7958984375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 18.0, 19.0, 24.0, 51.0, 69.0, 110.0, 226.0, 407.0, 1058.0, 2782.0, 10882.0, 78259.0, 3782767.0, 288476.0, 21510.0, 4796.0, 1538.0, 561.0, 250.0, 164.0, 90.0, 56.0, 44.0, 25.0, 18.0, 16.0, 6.0, 4.0, 7.0, 2.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6953125, -3.582305908203125, -3.46929931640625, -3.356292724609375, -3.2432861328125, -3.130279541015625, -3.01727294921875, -2.904266357421875, -2.791259765625, -2.678253173828125, -2.56524658203125, -2.452239990234375, -2.3392333984375, -2.226226806640625, -2.11322021484375, -2.000213623046875, -1.88720703125, -1.774200439453125, -1.66119384765625, -1.548187255859375, -1.4351806640625, -1.322174072265625, -1.20916748046875, -1.096160888671875, -0.983154296875, -0.870147705078125, -0.75714111328125, -0.644134521484375, -0.5311279296875, -0.418121337890625, -0.30511474609375, -0.192108154296875, -0.0791015625, 0.033905029296875, 0.14691162109375, 0.259918212890625, 0.3729248046875, 0.485931396484375, 0.59893798828125, 0.711944580078125, 0.824951171875, 0.937957763671875, 1.05096435546875, 1.163970947265625, 1.2769775390625, 1.389984130859375, 1.50299072265625, 1.615997314453125, 1.72900390625, 1.842010498046875, 1.95501708984375, 2.068023681640625, 2.1810302734375, 2.294036865234375, 2.40704345703125, 2.520050048828125, 2.633056640625, 2.746063232421875, 2.85906982421875, 2.972076416015625, 3.0850830078125, 3.198089599609375, 3.31109619140625, 3.424102783203125, 3.537109375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 5.0, 6.0, 9.0, 6.0, 18.0, 25.0, 26.0, 50.0, 48.0, 81.0, 133.0, 201.0, 364.0, 728.0, 1132.0, 479.0, 286.0, 131.0, 94.0, 61.0, 40.0, 30.0, 33.0, 16.0, 12.0, 12.0, 11.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.544921875, -0.5256195068359375, -0.506317138671875, -0.4870147705078125, -0.46771240234375, -0.4484100341796875, -0.429107666015625, -0.4098052978515625, -0.3905029296875, -0.3712005615234375, -0.351898193359375, -0.3325958251953125, -0.31329345703125, -0.2939910888671875, -0.274688720703125, -0.2553863525390625, -0.236083984375, -0.2167816162109375, -0.197479248046875, -0.1781768798828125, -0.15887451171875, -0.1395721435546875, -0.120269775390625, -0.1009674072265625, -0.0816650390625, -0.0623626708984375, -0.043060302734375, -0.0237579345703125, -0.00445556640625, 0.0148468017578125, 0.034149169921875, 0.0534515380859375, 0.07275390625, 0.0920562744140625, 0.111358642578125, 0.1306610107421875, 0.14996337890625, 0.1692657470703125, 0.188568115234375, 0.2078704833984375, 0.2271728515625, 0.2464752197265625, 0.265777587890625, 0.2850799560546875, 0.30438232421875, 0.3236846923828125, 0.342987060546875, 0.3622894287109375, 0.381591796875, 0.4008941650390625, 0.420196533203125, 0.4394989013671875, 0.45880126953125, 0.4781036376953125, 0.497406005859375, 0.5167083740234375, 0.5360107421875, 0.5553131103515625, 0.574615478515625, 0.5939178466796875, 0.61322021484375, 0.6325225830078125, 0.651824951171875, 0.6711273193359375, 0.6904296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 10.0, 9.0, 4.0, 14.0, 18.0, 26.0, 35.0, 53.0, 88.0, 156.0, 170.0, 156.0, 94.0, 55.0, 32.0, 19.0, 18.0, 15.0, 9.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.264806270599365, -4.1411027908325195, -4.017398834228516, -3.89369535446167, -3.769991874694824, -3.6462881565093994, -3.5225844383239746, -3.398880958557129, -3.275177240371704, -3.1514735221862793, -3.0277700424194336, -2.904066324234009, -2.780362844467163, -2.6566591262817383, -2.5329556465148926, -2.4092519283294678, -2.285548210144043, -2.161844491958618, -2.0381410121917725, -1.9144372940063477, -1.7907336950302124, -1.6670300960540771, -1.543326497077942, -1.4196228981018066, -1.295919418334961, -1.1722158193588257, -1.0485122203826904, -0.9248085618019104, -0.8011049032211304, -0.6774013042449951, -0.5536977052688599, -0.42999404668807983, -0.3062903881072998, -0.18258675932884216, -0.058883145451545715, 0.06482046842575073, 0.18852409720420837, 0.312227725982666, 0.43593132495880127, 0.5596349835395813, 0.6833385825157166, 0.8070421814918518, 0.9307458400726318, 1.054449439048767, 1.1781530380249023, 1.3018567562103271, 1.4255602359771729, 1.5492639541625977, 1.672967553138733, 1.7966711521148682, 1.9203747510910034, 2.0440783500671387, 2.1677820682525635, 2.2914857864379883, 2.415189266204834, 2.538892984390259, 2.6625964641571045, 2.7863001823425293, 2.910003662109375, 3.0337073802948, 3.1574108600616455, 3.2811145782470703, 3.404818058013916, 3.528521776199341, 3.6522254943847656]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 2.0, 6.0, 9.0, 12.0, 19.0, 13.0, 16.0, 25.0, 26.0, 35.0, 44.0, 37.0, 55.0, 49.0, 62.0, 55.0, 62.0, 55.0, 48.0, 62.0, 39.0, 45.0, 32.0, 36.0, 20.0, 23.0, 18.0, 13.0, 18.0, 9.0, 9.0, 5.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0225017070770264, -1.9644750356674194, -1.906448245048523, -1.848421573638916, -1.7903947830200195, -1.7323681116104126, -1.6743413209915161, -1.6163146495819092, -1.5582878589630127, -1.5002611875534058, -1.4422343969345093, -1.3842077255249023, -1.3261809349060059, -1.268154263496399, -1.2101274728775024, -1.1521008014678955, -1.094074010848999, -1.036047339439392, -0.9780205488204956, -0.9199938178062439, -0.8619670867919922, -0.8039404153823853, -0.7459136247634888, -0.6878869533538818, -0.6298602819442749, -0.5718335509300232, -0.5138068199157715, -0.4557800889015198, -0.39775335788726807, -0.33972665667533875, -0.28169992566108704, -0.22367319464683533, -0.16564643383026123, -0.10761970281600952, -0.04959297925233841, 0.008433744311332703, 0.06646047532558441, 0.12448719143867493, 0.18251392245292664, 0.24054065346717834, 0.29856738448143005, 0.35659411549568176, 0.41462084650993347, 0.4726475477218628, 0.5306742787361145, 0.5887010097503662, 0.6467277407646179, 0.7047544717788696, 0.7627812027931213, 0.820807933807373, 0.8788346648216248, 0.9368613958358765, 0.9948881268501282, 1.0529148578643799, 1.1109415292739868, 1.1689683198928833, 1.2269949913024902, 1.2850216627120972, 1.3430484533309937, 1.4010751247406006, 1.459101915359497, 1.517128586769104, 1.5751553773880005, 1.6331820487976074, 1.691208839416504]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 9.0, 16.0, 18.0, 26.0, 39.0, 60.0, 101.0, 124.0, 182.0, 339.0, 596.0, 952.0, 1824.0, 3691.0, 7796.0, 18026.0, 46948.0, 145246.0, 375740.0, 291902.0, 96456.0, 32988.0, 13046.0, 5882.0, 2894.0, 1576.0, 835.0, 458.0, 263.0, 167.0, 108.0, 73.0, 50.0, 34.0, 25.0, 21.0, 9.0, 7.0, 6.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1845703125, -0.17911338806152344, -0.17365646362304688, -0.1681995391845703, -0.16274261474609375, -0.1572856903076172, -0.15182876586914062, -0.14637184143066406, -0.1409149169921875, -0.13545799255371094, -0.13000106811523438, -0.12454414367675781, -0.11908721923828125, -0.11363029479980469, -0.10817337036132812, -0.10271644592285156, -0.097259521484375, -0.09180259704589844, -0.08634567260742188, -0.08088874816894531, -0.07543182373046875, -0.06997489929199219, -0.06451797485351562, -0.05906105041503906, -0.0536041259765625, -0.04814720153808594, -0.042690277099609375, -0.03723335266113281, -0.03177642822265625, -0.026319503784179688, -0.020862579345703125, -0.015405654907226562, -0.00994873046875, -0.0044918060302734375, 0.000965118408203125, 0.0064220428466796875, 0.01187896728515625, 0.017335891723632812, 0.022792816162109375, 0.028249740600585938, 0.0337066650390625, 0.03916358947753906, 0.044620513916015625, 0.05007743835449219, 0.05553436279296875, 0.06099128723144531, 0.06644821166992188, 0.07190513610839844, 0.077362060546875, 0.08281898498535156, 0.08827590942382812, 0.09373283386230469, 0.09918975830078125, 0.10464668273925781, 0.11010360717773438, 0.11556053161621094, 0.1210174560546875, 0.12647438049316406, 0.13193130493164062, 0.1373882293701172, 0.14284515380859375, 0.1483020782470703, 0.15375900268554688, 0.15921592712402344, 0.1646728515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 3.0, 3.0, 8.0, 8.0, 16.0, 7.0, 14.0, 21.0, 29.0, 32.0, 45.0, 46.0, 69.0, 58.0, 86.0, 73.0, 80.0, 58.0, 59.0, 51.0, 49.0, 35.0, 32.0, 23.0, 14.0, 19.0, 13.0, 10.0, 4.0, 9.0, 6.0, 1.0, 4.0, 1.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5859375, -1.5360260009765625, -1.486114501953125, -1.4362030029296875, -1.38629150390625, -1.3363800048828125, -1.286468505859375, -1.2365570068359375, -1.1866455078125, -1.1367340087890625, -1.086822509765625, -1.0369110107421875, -0.98699951171875, -0.9370880126953125, -0.887176513671875, -0.8372650146484375, -0.787353515625, -0.7374420166015625, -0.687530517578125, -0.6376190185546875, -0.58770751953125, -0.5377960205078125, -0.487884521484375, -0.4379730224609375, -0.3880615234375, -0.3381500244140625, -0.288238525390625, -0.2383270263671875, -0.18841552734375, -0.1385040283203125, -0.088592529296875, -0.0386810302734375, 0.01123046875, 0.0611419677734375, 0.111053466796875, 0.1609649658203125, 0.21087646484375, 0.2607879638671875, 0.310699462890625, 0.3606109619140625, 0.4105224609375, 0.4604339599609375, 0.510345458984375, 0.5602569580078125, 0.61016845703125, 0.6600799560546875, 0.709991455078125, 0.7599029541015625, 0.809814453125, 0.8597259521484375, 0.909637451171875, 0.9595489501953125, 1.00946044921875, 1.0593719482421875, 1.109283447265625, 1.1591949462890625, 1.2091064453125, 1.2590179443359375, 1.308929443359375, 1.3588409423828125, 1.40875244140625, 1.4586639404296875, 1.508575439453125, 1.5584869384765625, 1.6083984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 9.0, 10.0, 25.0, 23.0, 48.0, 64.0, 113.0, 156.0, 264.0, 432.0, 758.0, 1735.0, 4443.0, 15756.0, 74413.0, 370327.0, 449231.0, 100853.0, 20100.0, 5524.0, 2031.0, 942.0, 520.0, 292.0, 178.0, 108.0, 64.0, 51.0, 25.0, 19.0, 13.0, 10.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2098388671875, -0.20209312438964844, -0.19434738159179688, -0.1866016387939453, -0.17885589599609375, -0.1711101531982422, -0.16336441040039062, -0.15561866760253906, -0.1478729248046875, -0.14012718200683594, -0.13238143920898438, -0.12463569641113281, -0.11688995361328125, -0.10914421081542969, -0.10139846801757812, -0.09365272521972656, -0.085906982421875, -0.07816123962402344, -0.07041549682617188, -0.06266975402832031, -0.05492401123046875, -0.04717826843261719, -0.039432525634765625, -0.03168678283691406, -0.0239410400390625, -0.016195297241210938, -0.008449554443359375, -0.0007038116455078125, 0.00704193115234375, 0.014787673950195312, 0.022533416748046875, 0.030279159545898438, 0.03802490234375, 0.04577064514160156, 0.053516387939453125, 0.06126213073730469, 0.06900787353515625, 0.07675361633300781, 0.08449935913085938, 0.09224510192871094, 0.0999908447265625, 0.10773658752441406, 0.11548233032226562, 0.12322807312011719, 0.13097381591796875, 0.1387195587158203, 0.14646530151367188, 0.15421104431152344, 0.161956787109375, 0.16970252990722656, 0.17744827270507812, 0.1851940155029297, 0.19293975830078125, 0.2006855010986328, 0.20843124389648438, 0.21617698669433594, 0.2239227294921875, 0.23166847229003906, 0.23941421508789062, 0.2471599578857422, 0.25490570068359375, 0.2626514434814453, 0.2703971862792969, 0.27814292907714844, 0.285888671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 8.0, 11.0, 6.0, 16.0, 9.0, 9.0, 19.0, 23.0, 20.0, 24.0, 23.0, 42.0, 46.0, 47.0, 54.0, 53.0, 51.0, 45.0, 60.0, 48.0, 48.0, 47.0, 44.0, 44.0, 36.0, 34.0, 23.0, 18.0, 21.0, 14.0, 17.0, 12.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1875, -2.108673095703125, -2.02984619140625, -1.951019287109375, -1.8721923828125, -1.793365478515625, -1.71453857421875, -1.635711669921875, -1.556884765625, -1.478057861328125, -1.39923095703125, -1.320404052734375, -1.2415771484375, -1.162750244140625, -1.08392333984375, -1.005096435546875, -0.92626953125, -0.847442626953125, -0.76861572265625, -0.689788818359375, -0.6109619140625, -0.532135009765625, -0.45330810546875, -0.374481201171875, -0.295654296875, -0.216827392578125, -0.13800048828125, -0.059173583984375, 0.0196533203125, 0.098480224609375, 0.17730712890625, 0.256134033203125, 0.3349609375, 0.413787841796875, 0.49261474609375, 0.571441650390625, 0.6502685546875, 0.729095458984375, 0.80792236328125, 0.886749267578125, 0.965576171875, 1.044403076171875, 1.12322998046875, 1.202056884765625, 1.2808837890625, 1.359710693359375, 1.43853759765625, 1.517364501953125, 1.59619140625, 1.675018310546875, 1.75384521484375, 1.832672119140625, 1.9114990234375, 1.990325927734375, 2.06915283203125, 2.147979736328125, 2.226806640625, 2.305633544921875, 2.38446044921875, 2.463287353515625, 2.5421142578125, 2.620941162109375, 2.69976806640625, 2.778594970703125, 2.857421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 10.0, 17.0, 16.0, 32.0, 47.0, 84.0, 196.0, 451.0, 1117.0, 3313.0, 14133.0, 219295.0, 761021.0, 39769.0, 6082.0, 1768.0, 646.0, 254.0, 131.0, 50.0, 34.0, 29.0, 16.0, 13.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1392822265625, -0.13451766967773438, -0.12975311279296875, -0.12498855590820312, -0.1202239990234375, -0.11545944213867188, -0.11069488525390625, -0.10593032836914062, -0.101165771484375, -0.09640121459960938, -0.09163665771484375, -0.08687210083007812, -0.0821075439453125, -0.07734298706054688, -0.07257843017578125, -0.06781387329101562, -0.06304931640625, -0.058284759521484375, -0.05352020263671875, -0.048755645751953125, -0.0439910888671875, -0.039226531982421875, -0.03446197509765625, -0.029697418212890625, -0.024932861328125, -0.020168304443359375, -0.01540374755859375, -0.010639190673828125, -0.0058746337890625, -0.001110076904296875, 0.00365447998046875, 0.008419036865234375, 0.01318359375, 0.017948150634765625, 0.02271270751953125, 0.027477264404296875, 0.0322418212890625, 0.037006378173828125, 0.04177093505859375, 0.046535491943359375, 0.051300048828125, 0.056064605712890625, 0.06082916259765625, 0.06559371948242188, 0.0703582763671875, 0.07512283325195312, 0.07988739013671875, 0.08465194702148438, 0.08941650390625, 0.09418106079101562, 0.09894561767578125, 0.10371017456054688, 0.1084747314453125, 0.11323928833007812, 0.11800384521484375, 0.12276840209960938, 0.127532958984375, 0.13229751586914062, 0.13706207275390625, 0.14182662963867188, 0.1465911865234375, 0.15135574340820312, 0.15612030029296875, 0.16088485717773438, 0.1656494140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 10.0, 17.0, 13.0, 32.0, 40.0, 62.0, 72.0, 100.0, 117.0, 106.0, 116.0, 85.0, 57.0, 41.0, 27.0, 25.0, 16.0, 9.0, 14.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.628036499023438e-05, -6.448943167924881e-05, -6.269849836826324e-05, -6.090756505727768e-05, -5.9116631746292114e-05, -5.732569843530655e-05, -5.5534765124320984e-05, -5.374383181333542e-05, -5.1952898502349854e-05, -5.016196519136429e-05, -4.837103188037872e-05, -4.658009856939316e-05, -4.478916525840759e-05, -4.299823194742203e-05, -4.120729863643646e-05, -3.94163653254509e-05, -3.762543201446533e-05, -3.583449870347977e-05, -3.40435653924942e-05, -3.2252632081508636e-05, -3.046169877052307e-05, -2.8670765459537506e-05, -2.687983214855194e-05, -2.5088898837566376e-05, -2.329796552658081e-05, -2.1507032215595245e-05, -1.971609890460968e-05, -1.7925165593624115e-05, -1.613423228263855e-05, -1.4343298971652985e-05, -1.255236566066742e-05, -1.0761432349681854e-05, -8.970499038696289e-06, -7.179565727710724e-06, -5.388632416725159e-06, -3.5976991057395935e-06, -1.8067657947540283e-06, -1.5832483768463135e-08, 1.775100827217102e-06, 3.5660341382026672e-06, 5.356967449188232e-06, 7.147900760173798e-06, 8.938834071159363e-06, 1.0729767382144928e-05, 1.2520700693130493e-05, 1.4311634004116058e-05, 1.6102567315101624e-05, 1.789350062608719e-05, 1.9684433937072754e-05, 2.147536724805832e-05, 2.3266300559043884e-05, 2.505723387002945e-05, 2.6848167181015015e-05, 2.863910049200058e-05, 3.0430033802986145e-05, 3.222096711397171e-05, 3.4011900424957275e-05, 3.580283373594284e-05, 3.7593767046928406e-05, 3.938470035791397e-05, 4.1175633668899536e-05, 4.29665669798851e-05, 4.4757500290870667e-05, 4.654843360185623e-05, 4.83393669128418e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 14.0, 17.0, 38.0, 52.0, 109.0, 207.0, 477.0, 936.0, 2712.0, 10537.0, 104852.0, 831346.0, 83550.0, 9401.0, 2510.0, 919.0, 403.0, 201.0, 110.0, 53.0, 33.0, 20.0, 13.0, 13.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1844482421875, -0.17977428436279297, -0.17510032653808594, -0.1704263687133789, -0.16575241088867188, -0.16107845306396484, -0.1564044952392578, -0.15173053741455078, -0.14705657958984375, -0.14238262176513672, -0.1377086639404297, -0.13303470611572266, -0.12836074829101562, -0.1236867904663086, -0.11901283264160156, -0.11433887481689453, -0.1096649169921875, -0.10499095916748047, -0.10031700134277344, -0.0956430435180664, -0.09096908569335938, -0.08629512786865234, -0.08162117004394531, -0.07694721221923828, -0.07227325439453125, -0.06759929656982422, -0.06292533874511719, -0.058251380920410156, -0.053577423095703125, -0.048903465270996094, -0.04422950744628906, -0.03955554962158203, -0.034881591796875, -0.03020763397216797, -0.025533676147460938, -0.020859718322753906, -0.016185760498046875, -0.011511802673339844, -0.0068378448486328125, -0.0021638870239257812, 0.00251007080078125, 0.007184028625488281, 0.011857986450195312, 0.016531944274902344, 0.021205902099609375, 0.025879859924316406, 0.030553817749023438, 0.03522777557373047, 0.0399017333984375, 0.04457569122314453, 0.04924964904785156, 0.053923606872558594, 0.058597564697265625, 0.06327152252197266, 0.06794548034667969, 0.07261943817138672, 0.07729339599609375, 0.08196735382080078, 0.08664131164550781, 0.09131526947021484, 0.09598922729492188, 0.1006631851196289, 0.10533714294433594, 0.11001110076904297, 0.11468505859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 11.0, 10.0, 16.0, 24.0, 45.0, 55.0, 105.0, 146.0, 176.0, 152.0, 103.0, 57.0, 30.0, 19.0, 15.0, 8.0, 5.0, 9.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026214599609375, -0.025096893310546875, -0.02397918701171875, -0.022861480712890625, -0.0217437744140625, -0.020626068115234375, -0.01950836181640625, -0.018390655517578125, -0.01727294921875, -0.016155242919921875, -0.01503753662109375, -0.013919830322265625, -0.0128021240234375, -0.011684417724609375, -0.01056671142578125, -0.009449005126953125, -0.008331298828125, -0.007213592529296875, -0.00609588623046875, -0.004978179931640625, -0.0038604736328125, -0.002742767333984375, -0.00162506103515625, -0.000507354736328125, 0.0006103515625, 0.001728057861328125, 0.00284576416015625, 0.003963470458984375, 0.0050811767578125, 0.006198883056640625, 0.00731658935546875, 0.008434295654296875, 0.009552001953125, 0.010669708251953125, 0.01178741455078125, 0.012905120849609375, 0.0140228271484375, 0.015140533447265625, 0.01625823974609375, 0.017375946044921875, 0.01849365234375, 0.019611358642578125, 0.02072906494140625, 0.021846771240234375, 0.0229644775390625, 0.024082183837890625, 0.02519989013671875, 0.026317596435546875, 0.027435302734375, 0.028553009033203125, 0.02967071533203125, 0.030788421630859375, 0.0319061279296875, 0.033023834228515625, 0.03414154052734375, 0.035259246826171875, 0.036376953125, 0.037494659423828125, 0.03861236572265625, 0.039730072021484375, 0.0408477783203125, 0.041965484619140625, 0.04308319091796875, 0.044200897216796875, 0.045318603515625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 5.0, 12.0, 9.0, 6.0, 8.0, 20.0, 20.0, 34.0, 52.0, 94.0, 167.0, 196.0, 159.0, 82.0, 47.0, 27.0, 19.0, 11.0, 14.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.8472964763641357, -2.7590572834014893, -2.670818328857422, -2.5825791358947754, -2.494340181350708, -2.4061009883880615, -2.317862033843994, -2.2296228408813477, -2.141383647918701, -2.0531444549560547, -1.9649055004119873, -1.8766663074493408, -1.7884273529052734, -1.700188159942627, -1.61194908618927, -1.523710012435913, -1.4354710578918457, -1.3472319841384888, -1.2589929103851318, -1.1707537174224854, -1.082514762878418, -0.9942756295204163, -0.9060364961624146, -0.8177974224090576, -0.7295583486557007, -0.6413192749023438, -0.5530802011489868, -0.4648410677909851, -0.3766019940376282, -0.28836292028427124, -0.20012378692626953, -0.1118847131729126, -0.023645639419555664, 0.06459344923496246, 0.1528325378894806, 0.2410716414451599, 0.32931071519851685, 0.4175497889518738, 0.5057889223098755, 0.5940279960632324, 0.6822670698165894, 0.7705061435699463, 0.8587452173233032, 0.9469843506813049, 1.0352234840393066, 1.123462438583374, 1.2117016315460205, 1.2999407052993774, 1.3881797790527344, 1.4764188528060913, 1.5646579265594482, 1.6528971195220947, 1.741136074066162, 1.8293752670288086, 1.9176143407821655, 2.0058534145355225, 2.09409236907959, 2.1823315620422363, 2.2705705165863037, 2.35880970954895, 2.4470486640930176, 2.535287857055664, 2.6235270500183105, 2.711766004562378, 2.8000051975250244]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 4.0, 4.0, 7.0, 7.0, 12.0, 9.0, 18.0, 22.0, 24.0, 34.0, 44.0, 58.0, 58.0, 67.0, 70.0, 69.0, 69.0, 69.0, 64.0, 53.0, 43.0, 32.0, 28.0, 27.0, 17.0, 17.0, 16.0, 9.0, 6.0, 9.0, 7.0, 2.0, 5.0, 2.0, 3.0, 0.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5011661052703857, -1.4553509950637817, -1.4095358848571777, -1.3637208938598633, -1.3179057836532593, -1.2720906734466553, -1.2262755632400513, -1.1804604530334473, -1.1346454620361328, -1.0888303518295288, -1.0430152416229248, -0.9972001910209656, -0.9513851404190063, -0.9055700302124023, -0.8597549200057983, -0.8139398097991943, -0.7681246995925903, -0.7223095893859863, -0.6764945387840271, -0.6306794285774231, -0.5848643779754639, -0.5390492677688599, -0.49323415756225586, -0.44741907715797424, -0.4016039967536926, -0.355788916349411, -0.3099738359451294, -0.2641587257385254, -0.21834364533424377, -0.17252856492996216, -0.12671345472335815, -0.08089837431907654, -0.03508317470550537, 0.010731913149356842, 0.056547001004219055, 0.10236209630966187, 0.14817717671394348, 0.1939922571182251, 0.2398073673248291, 0.2856224477291107, 0.33143752813339233, 0.37725260853767395, 0.42306768894195557, 0.46888279914855957, 0.5146979093551636, 0.5605129599571228, 0.6063280701637268, 0.652143120765686, 0.69795823097229, 0.743773341178894, 0.7895883917808533, 0.8354035019874573, 0.8812185525894165, 0.9270336627960205, 0.9728487730026245, 1.0186638832092285, 1.064478874206543, 1.110293984413147, 1.156109094619751, 1.2019240856170654, 1.2477391958236694, 1.2935543060302734, 1.3393694162368774, 1.3851845264434814, 1.4309996366500854]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 5.0, 9.0, 8.0, 14.0, 30.0, 28.0, 38.0, 62.0, 97.0, 114.0, 196.0, 249.0, 444.0, 739.0, 1293.0, 2669.0, 6072.0, 16585.0, 82805.0, 857637.0, 55176.0, 13706.0, 5164.0, 2301.0, 1155.0, 726.0, 392.0, 251.0, 166.0, 116.0, 94.0, 48.0, 42.0, 32.0, 26.0, 16.0, 16.0, 11.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.94744873046875, -1.8812255859375, -1.81500244140625, -1.748779296875, -1.68255615234375, -1.6163330078125, -1.55010986328125, -1.48388671875, -1.41766357421875, -1.3514404296875, -1.28521728515625, -1.218994140625, -1.15277099609375, -1.0865478515625, -1.02032470703125, -0.9541015625, -0.88787841796875, -0.8216552734375, -0.75543212890625, -0.689208984375, -0.62298583984375, -0.5567626953125, -0.49053955078125, -0.42431640625, -0.35809326171875, -0.2918701171875, -0.22564697265625, -0.159423828125, -0.09320068359375, -0.0269775390625, 0.03924560546875, 0.10546875, 0.17169189453125, 0.2379150390625, 0.30413818359375, 0.370361328125, 0.43658447265625, 0.5028076171875, 0.56903076171875, 0.63525390625, 0.70147705078125, 0.7677001953125, 0.83392333984375, 0.900146484375, 0.96636962890625, 1.0325927734375, 1.09881591796875, 1.1650390625, 1.23126220703125, 1.2974853515625, 1.36370849609375, 1.429931640625, 1.49615478515625, 1.5623779296875, 1.62860107421875, 1.69482421875, 1.76104736328125, 1.8272705078125, 1.89349365234375, 1.959716796875, 2.02593994140625, 2.0921630859375, 2.15838623046875, 2.224609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 4.0, 4.0, 10.0, 7.0, 14.0, 21.0, 22.0, 37.0, 43.0, 50.0, 64.0, 48.0, 75.0, 81.0, 69.0, 85.0, 55.0, 51.0, 50.0, 40.0, 26.0, 17.0, 28.0, 16.0, 11.0, 12.0, 12.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.44921875, -3.353424072265625, -3.25762939453125, -3.161834716796875, -3.0660400390625, -2.970245361328125, -2.87445068359375, -2.778656005859375, -2.682861328125, -2.587066650390625, -2.49127197265625, -2.395477294921875, -2.2996826171875, -2.203887939453125, -2.10809326171875, -2.012298583984375, -1.91650390625, -1.820709228515625, -1.72491455078125, -1.629119873046875, -1.5333251953125, -1.437530517578125, -1.34173583984375, -1.245941162109375, -1.150146484375, -1.054351806640625, -0.95855712890625, -0.862762451171875, -0.7669677734375, -0.671173095703125, -0.57537841796875, -0.479583740234375, -0.3837890625, -0.287994384765625, -0.19219970703125, -0.096405029296875, -0.0006103515625, 0.095184326171875, 0.19097900390625, 0.286773681640625, 0.382568359375, 0.478363037109375, 0.57415771484375, 0.669952392578125, 0.7657470703125, 0.861541748046875, 0.95733642578125, 1.053131103515625, 1.14892578125, 1.244720458984375, 1.34051513671875, 1.436309814453125, 1.5321044921875, 1.627899169921875, 1.72369384765625, 1.819488525390625, 1.915283203125, 2.011077880859375, 2.10687255859375, 2.202667236328125, 2.2984619140625, 2.394256591796875, 2.49005126953125, 2.585845947265625, 2.681640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 6.0, 12.0, 24.0, 27.0, 50.0, 96.0, 194.0, 505.0, 1580.0, 7310.0, 88006.0, 927453.0, 18842.0, 3007.0, 803.0, 319.0, 155.0, 62.0, 31.0, 18.0, 11.0, 10.0, 4.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248046875, -3.14404296875, -3.0400390625, -2.93603515625, -2.83203125, -2.72802734375, -2.6240234375, -2.52001953125, -2.416015625, -2.31201171875, -2.2080078125, -2.10400390625, -2.0, -1.89599609375, -1.7919921875, -1.68798828125, -1.583984375, -1.47998046875, -1.3759765625, -1.27197265625, -1.16796875, -1.06396484375, -0.9599609375, -0.85595703125, -0.751953125, -0.64794921875, -0.5439453125, -0.43994140625, -0.3359375, -0.23193359375, -0.1279296875, -0.02392578125, 0.080078125, 0.18408203125, 0.2880859375, 0.39208984375, 0.49609375, 0.60009765625, 0.7041015625, 0.80810546875, 0.912109375, 1.01611328125, 1.1201171875, 1.22412109375, 1.328125, 1.43212890625, 1.5361328125, 1.64013671875, 1.744140625, 1.84814453125, 1.9521484375, 2.05615234375, 2.16015625, 2.26416015625, 2.3681640625, 2.47216796875, 2.576171875, 2.68017578125, 2.7841796875, 2.88818359375, 2.9921875, 3.09619140625, 3.2001953125, 3.30419921875, 3.408203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 8.0, 13.0, 9.0, 15.0, 24.0, 24.0, 37.0, 32.0, 41.0, 45.0, 39.0, 38.0, 49.0, 61.0, 54.0, 60.0, 54.0, 55.0, 40.0, 47.0, 46.0, 36.0, 28.0, 18.0, 22.0, 15.0, 20.0, 13.0, 9.0, 9.0, 5.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.859375, -3.751800537109375, -3.64422607421875, -3.536651611328125, -3.4290771484375, -3.321502685546875, -3.21392822265625, -3.106353759765625, -2.998779296875, -2.891204833984375, -2.78363037109375, -2.676055908203125, -2.5684814453125, -2.460906982421875, -2.35333251953125, -2.245758056640625, -2.13818359375, -2.030609130859375, -1.92303466796875, -1.815460205078125, -1.7078857421875, -1.600311279296875, -1.49273681640625, -1.385162353515625, -1.277587890625, -1.170013427734375, -1.06243896484375, -0.954864501953125, -0.8472900390625, -0.739715576171875, -0.63214111328125, -0.524566650390625, -0.4169921875, -0.309417724609375, -0.20184326171875, -0.094268798828125, 0.0133056640625, 0.120880126953125, 0.22845458984375, 0.336029052734375, 0.443603515625, 0.551177978515625, 0.65875244140625, 0.766326904296875, 0.8739013671875, 0.981475830078125, 1.08905029296875, 1.196624755859375, 1.30419921875, 1.411773681640625, 1.51934814453125, 1.626922607421875, 1.7344970703125, 1.842071533203125, 1.94964599609375, 2.057220458984375, 2.164794921875, 2.272369384765625, 2.37994384765625, 2.487518310546875, 2.5950927734375, 2.702667236328125, 2.81024169921875, 2.917816162109375, 3.025390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 2.0, 8.0, 11.0, 15.0, 15.0, 26.0, 25.0, 66.0, 66.0, 98.0, 210.0, 486.0, 1392.0, 4550.0, 20623.0, 789527.0, 209859.0, 15916.0, 3566.0, 1061.0, 475.0, 205.0, 112.0, 70.0, 37.0, 37.0, 25.0, 16.0, 10.0, 15.0, 7.0, 9.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0546875, -1.0216522216796875, -0.988616943359375, -0.9555816650390625, -0.92254638671875, -0.8895111083984375, -0.856475830078125, -0.8234405517578125, -0.7904052734375, -0.7573699951171875, -0.724334716796875, -0.6912994384765625, -0.65826416015625, -0.6252288818359375, -0.592193603515625, -0.5591583251953125, -0.526123046875, -0.4930877685546875, -0.460052490234375, -0.4270172119140625, -0.39398193359375, -0.3609466552734375, -0.327911376953125, -0.2948760986328125, -0.2618408203125, -0.2288055419921875, -0.195770263671875, -0.1627349853515625, -0.12969970703125, -0.0966644287109375, -0.063629150390625, -0.0305938720703125, 0.00244140625, 0.0354766845703125, 0.068511962890625, 0.1015472412109375, 0.13458251953125, 0.1676177978515625, 0.200653076171875, 0.2336883544921875, 0.2667236328125, 0.2997589111328125, 0.332794189453125, 0.3658294677734375, 0.39886474609375, 0.4319000244140625, 0.464935302734375, 0.4979705810546875, 0.531005859375, 0.5640411376953125, 0.597076416015625, 0.6301116943359375, 0.66314697265625, 0.6961822509765625, 0.729217529296875, 0.7622528076171875, 0.7952880859375, 0.8283233642578125, 0.861358642578125, 0.8943939208984375, 0.92742919921875, 0.9604644775390625, 0.993499755859375, 1.0265350341796875, 1.0595703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 10.0, 14.0, 36.0, 102.0, 669.0, 90.0, 24.0, 11.0, 11.0, 6.0, 10.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011903047561645508, -0.00010954122990369797, -0.00010005198419094086, -9.056273847818375e-05, -8.107349276542664e-05, -7.158424705266953e-05, -6.209500133991241e-05, -5.2605755627155304e-05, -4.311650991439819e-05, -3.362726420164108e-05, -2.4138018488883972e-05, -1.4648772776126862e-05, -5.159527063369751e-06, 4.32971864938736e-06, 1.381896436214447e-05, 2.330821007490158e-05, 3.279745578765869e-05, 4.22867015004158e-05, 5.177594721317291e-05, 6.126519292593002e-05, 7.075443863868713e-05, 8.024368435144424e-05, 8.973293006420135e-05, 9.922217577695847e-05, 0.00010871142148971558, 0.00011820066720247269, 0.0001276899129152298, 0.0001371791586279869, 0.00014666840434074402, 0.00015615765005350113, 0.00016564689576625824, 0.00017513614147901535, 0.00018462538719177246, 0.00019411463290452957, 0.00020360387861728668, 0.0002130931243300438, 0.0002225823700428009, 0.00023207161575555801, 0.00024156086146831512, 0.00025105010718107224, 0.00026053935289382935, 0.00027002859860658646, 0.00027951784431934357, 0.0002890070900321007, 0.0002984963357448578, 0.0003079855814576149, 0.000317474827170372, 0.0003269640728831291, 0.00033645331859588623, 0.00034594256430864334, 0.00035543181002140045, 0.00036492105573415756, 0.00037441030144691467, 0.0003838995471596718, 0.0003933887928724289, 0.000402878038585186, 0.0004123672842979431, 0.0004218565300107002, 0.00043134577572345734, 0.00044083502143621445, 0.00045032426714897156, 0.00045981351286172867, 0.0004693027585744858, 0.0004787920042872429, 0.00048828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 16.0, 28.0, 53.0, 109.0, 215.0, 535.0, 1502.0, 4686.0, 21203.0, 859715.0, 141652.0, 13758.0, 3226.0, 1040.0, 415.0, 187.0, 67.0, 45.0, 25.0, 17.0, 11.0, 10.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4287109375, -1.3909835815429688, -1.3532562255859375, -1.3155288696289062, -1.277801513671875, -1.2400741577148438, -1.2023468017578125, -1.1646194458007812, -1.12689208984375, -1.0891647338867188, -1.0514373779296875, -1.0137100219726562, -0.975982666015625, -0.9382553100585938, -0.9005279541015625, -0.8628005981445312, -0.8250732421875, -0.7873458862304688, -0.7496185302734375, -0.7118911743164062, -0.674163818359375, -0.6364364624023438, -0.5987091064453125, -0.5609817504882812, -0.52325439453125, -0.48552703857421875, -0.4477996826171875, -0.41007232666015625, -0.372344970703125, -0.33461761474609375, -0.2968902587890625, -0.25916290283203125, -0.221435546875, -0.18370819091796875, -0.1459808349609375, -0.10825347900390625, -0.070526123046875, -0.03279876708984375, 0.0049285888671875, 0.04265594482421875, 0.08038330078125, 0.11811065673828125, 0.1558380126953125, 0.19356536865234375, 0.231292724609375, 0.26902008056640625, 0.3067474365234375, 0.34447479248046875, 0.3822021484375, 0.41992950439453125, 0.4576568603515625, 0.49538421630859375, 0.533111572265625, 0.5708389282226562, 0.6085662841796875, 0.6462936401367188, 0.68402099609375, 0.7217483520507812, 0.7594757080078125, 0.7972030639648438, 0.834930419921875, 0.8726577758789062, 0.9103851318359375, 0.9481124877929688, 0.98583984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 7.0, 11.0, 21.0, 23.0, 71.0, 198.0, 441.0, 87.0, 36.0, 19.0, 16.0, 11.0, 11.0, 5.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.415771484375, -0.4036064147949219, -0.39144134521484375, -0.3792762756347656, -0.3671112060546875, -0.3549461364746094, -0.34278106689453125, -0.3306159973144531, -0.318450927734375, -0.3062858581542969, -0.29412078857421875, -0.2819557189941406, -0.2697906494140625, -0.2576255798339844, -0.24546051025390625, -0.23329544067382812, -0.22113037109375, -0.20896530151367188, -0.19680023193359375, -0.18463516235351562, -0.1724700927734375, -0.16030502319335938, -0.14813995361328125, -0.13597488403320312, -0.123809814453125, -0.11164474487304688, -0.09947967529296875, -0.08731460571289062, -0.0751495361328125, -0.06298446655273438, -0.05081939697265625, -0.038654327392578125, -0.0264892578125, -0.014324188232421875, -0.00215911865234375, 0.010005950927734375, 0.0221710205078125, 0.034336090087890625, 0.04650115966796875, 0.058666229248046875, 0.070831298828125, 0.08299636840820312, 0.09516143798828125, 0.10732650756835938, 0.1194915771484375, 0.13165664672851562, 0.14382171630859375, 0.15598678588867188, 0.16815185546875, 0.18031692504882812, 0.19248199462890625, 0.20464706420898438, 0.2168121337890625, 0.22897720336914062, 0.24114227294921875, 0.2533073425292969, 0.265472412109375, 0.2776374816894531, 0.28980255126953125, 0.3019676208496094, 0.3141326904296875, 0.3262977600097656, 0.33846282958984375, 0.3506278991699219, 0.36279296875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 16.0, 24.0, 60.0, 223.0, 395.0, 191.0, 42.0, 28.0, 12.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.579866409301758, -22.140300750732422, -21.700733184814453, -21.261167526245117, -20.82160186767578, -20.382036209106445, -19.94247055053711, -19.50290298461914, -19.063337326049805, -18.62377166748047, -18.1842041015625, -17.744638442993164, -17.305072784423828, -16.865507125854492, -16.425941467285156, -15.986373901367188, -15.546808242797852, -15.107242584228516, -14.667675971984863, -14.228109359741211, -13.788543701171875, -13.348978042602539, -12.909411430358887, -12.469844818115234, -12.030279159545898, -11.590713500976562, -11.15114688873291, -10.711580276489258, -10.272014617919922, -9.832448959350586, -9.392882347106934, -8.953315734863281, -8.513750076293945, -8.07418441772461, -7.634617805480957, -7.195051670074463, -6.755485534667969, -6.315919399261475, -5.8763532638549805, -5.436787128448486, -4.99722146987915, -4.557655334472656, -4.118089199066162, -3.678523063659668, -3.238956928253174, -2.7993907928466797, -2.3598246574401855, -1.9202585220336914, -1.4806923866271973, -1.0411262512207031, -0.601560115814209, -0.16199398040771484, 0.2775721549987793, 0.7171382904052734, 1.1567044258117676, 1.5962705612182617, 2.035836696624756, 2.47540283203125, 2.914968967437744, 3.3545351028442383, 3.7941012382507324, 4.233667373657227, 4.673233509063721, 5.112799644470215, 5.552365779876709]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 8.0, 9.0, 7.0, 7.0, 16.0, 10.0, 17.0, 21.0, 19.0, 23.0, 35.0, 30.0, 38.0, 28.0, 39.0, 41.0, 37.0, 49.0, 38.0, 37.0, 41.0, 38.0, 39.0, 47.0, 38.0, 30.0, 31.0, 30.0, 30.0, 19.0, 25.0, 16.0, 20.0, 14.0, 11.0, 13.0, 5.0, 10.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.190743923187256, -5.0354743003845215, -4.880205154418945, -4.724935531616211, -4.569665908813477, -4.414396286010742, -4.259126663208008, -4.103857517242432, -3.9485878944396973, -3.793318271636963, -3.6380488872528076, -3.4827795028686523, -3.327509880065918, -3.1722402572631836, -3.0169708728790283, -2.861701488494873, -2.7064318656921387, -2.5511622428894043, -2.395892858505249, -2.2406234741210938, -2.0853538513183594, -1.9300843477249146, -1.7748148441314697, -1.619545340538025, -1.46427583694458, -1.3090063333511353, -1.1537368297576904, -0.9984673261642456, -0.8431978225708008, -0.687928318977356, -0.5326588153839111, -0.3773893117904663, -0.22211933135986328, -0.06684982776641846, 0.08841967582702637, 0.2436891794204712, 0.398958683013916, 0.5542281866073608, 0.7094976902008057, 0.8647671937942505, 1.0200366973876953, 1.1753062009811401, 1.330575704574585, 1.4858452081680298, 1.6411147117614746, 1.7963842153549194, 1.9516537189483643, 2.1069231033325195, 2.262192726135254, 2.4174623489379883, 2.5727317333221436, 2.728001117706299, 2.883270740509033, 3.0385403633117676, 3.193809747695923, 3.349079132080078, 3.5043487548828125, 3.659618377685547, 3.814887762069702, 3.9701571464538574, 4.125426769256592, 4.280696392059326, 4.435965538024902, 4.591235160827637, 4.746504783630371]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 3.0, 4.0, 6.0, 6.0, 10.0, 8.0, 15.0, 18.0, 23.0, 29.0, 34.0, 64.0, 97.0, 203.0, 508.0, 1749.0, 7992.0, 91802.0, 4013111.0, 69599.0, 6551.0, 1439.0, 500.0, 183.0, 98.0, 60.0, 39.0, 22.0, 17.0, 17.0, 15.0, 19.0, 9.0, 6.0, 9.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.390625, -6.21533203125, -6.0400390625, -5.86474609375, -5.689453125, -5.51416015625, -5.3388671875, -5.16357421875, -4.98828125, -4.81298828125, -4.6376953125, -4.46240234375, -4.287109375, -4.11181640625, -3.9365234375, -3.76123046875, -3.5859375, -3.41064453125, -3.2353515625, -3.06005859375, -2.884765625, -2.70947265625, -2.5341796875, -2.35888671875, -2.18359375, -2.00830078125, -1.8330078125, -1.65771484375, -1.482421875, -1.30712890625, -1.1318359375, -0.95654296875, -0.78125, -0.60595703125, -0.4306640625, -0.25537109375, -0.080078125, 0.09521484375, 0.2705078125, 0.44580078125, 0.62109375, 0.79638671875, 0.9716796875, 1.14697265625, 1.322265625, 1.49755859375, 1.6728515625, 1.84814453125, 2.0234375, 2.19873046875, 2.3740234375, 2.54931640625, 2.724609375, 2.89990234375, 3.0751953125, 3.25048828125, 3.42578125, 3.60107421875, 3.7763671875, 3.95166015625, 4.126953125, 4.30224609375, 4.4775390625, 4.65283203125, 4.828125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 11.0, 15.0, 14.0, 14.0, 34.0, 33.0, 42.0, 50.0, 72.0, 78.0, 89.0, 92.0, 86.0, 66.0, 80.0, 46.0, 27.0, 25.0, 25.0, 22.0, 17.0, 6.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.89605712890625, -1.8370361328125, -1.77801513671875, -1.718994140625, -1.65997314453125, -1.6009521484375, -1.54193115234375, -1.48291015625, -1.42388916015625, -1.3648681640625, -1.30584716796875, -1.246826171875, -1.18780517578125, -1.1287841796875, -1.06976318359375, -1.0107421875, -0.95172119140625, -0.8927001953125, -0.83367919921875, -0.774658203125, -0.71563720703125, -0.6566162109375, -0.59759521484375, -0.53857421875, -0.47955322265625, -0.4205322265625, -0.36151123046875, -0.302490234375, -0.24346923828125, -0.1844482421875, -0.12542724609375, -0.06640625, -0.00738525390625, 0.0516357421875, 0.11065673828125, 0.169677734375, 0.22869873046875, 0.2877197265625, 0.34674072265625, 0.40576171875, 0.46478271484375, 0.5238037109375, 0.58282470703125, 0.641845703125, 0.70086669921875, 0.7598876953125, 0.81890869140625, 0.8779296875, 0.93695068359375, 0.9959716796875, 1.05499267578125, 1.114013671875, 1.17303466796875, 1.2320556640625, 1.29107666015625, 1.35009765625, 1.40911865234375, 1.4681396484375, 1.52716064453125, 1.586181640625, 1.64520263671875, 1.7042236328125, 1.76324462890625, 1.822265625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 11.0, 10.0, 21.0, 48.0, 42.0, 86.0, 149.0, 372.0, 1113.0, 4557.0, 31237.0, 2786627.0, 1337618.0, 26646.0, 3989.0, 995.0, 398.0, 139.0, 83.0, 34.0, 33.0, 17.0, 10.0, 10.0, 3.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.84765625, -4.69598388671875, -4.5443115234375, -4.39263916015625, -4.240966796875, -4.08929443359375, -3.9376220703125, -3.78594970703125, -3.63427734375, -3.48260498046875, -3.3309326171875, -3.17926025390625, -3.027587890625, -2.87591552734375, -2.7242431640625, -2.57257080078125, -2.4208984375, -2.26922607421875, -2.1175537109375, -1.96588134765625, -1.814208984375, -1.66253662109375, -1.5108642578125, -1.35919189453125, -1.20751953125, -1.05584716796875, -0.9041748046875, -0.75250244140625, -0.600830078125, -0.44915771484375, -0.2974853515625, -0.14581298828125, 0.005859375, 0.15753173828125, 0.3092041015625, 0.46087646484375, 0.612548828125, 0.76422119140625, 0.9158935546875, 1.06756591796875, 1.21923828125, 1.37091064453125, 1.5225830078125, 1.67425537109375, 1.825927734375, 1.97760009765625, 2.1292724609375, 2.28094482421875, 2.4326171875, 2.58428955078125, 2.7359619140625, 2.88763427734375, 3.039306640625, 3.19097900390625, 3.3426513671875, 3.49432373046875, 3.64599609375, 3.79766845703125, 3.9493408203125, 4.10101318359375, 4.252685546875, 4.40435791015625, 4.5560302734375, 4.70770263671875, 4.859375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 7.0, 22.0, 17.0, 23.0, 28.0, 45.0, 68.0, 84.0, 94.0, 176.0, 355.0, 597.0, 1052.0, 559.0, 310.0, 203.0, 100.0, 86.0, 61.0, 42.0, 28.0, 22.0, 20.0, 13.0, 8.0, 18.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.60546875, -0.5849685668945312, -0.5644683837890625, -0.5439682006835938, -0.523468017578125, -0.5029678344726562, -0.4824676513671875, -0.46196746826171875, -0.44146728515625, -0.42096710205078125, -0.4004669189453125, -0.37996673583984375, -0.359466552734375, -0.33896636962890625, -0.3184661865234375, -0.29796600341796875, -0.2774658203125, -0.25696563720703125, -0.2364654541015625, -0.21596527099609375, -0.195465087890625, -0.17496490478515625, -0.1544647216796875, -0.13396453857421875, -0.11346435546875, -0.09296417236328125, -0.0724639892578125, -0.05196380615234375, -0.031463623046875, -0.01096343994140625, 0.0095367431640625, 0.03003692626953125, 0.050537109375, 0.07103729248046875, 0.0915374755859375, 0.11203765869140625, 0.132537841796875, 0.15303802490234375, 0.1735382080078125, 0.19403839111328125, 0.21453857421875, 0.23503875732421875, 0.2555389404296875, 0.27603912353515625, 0.296539306640625, 0.31703948974609375, 0.3375396728515625, 0.35803985595703125, 0.3785400390625, 0.39904022216796875, 0.4195404052734375, 0.44004058837890625, 0.460540771484375, 0.48104095458984375, 0.5015411376953125, 0.5220413208007812, 0.54254150390625, 0.5630416870117188, 0.5835418701171875, 0.6040420532226562, 0.624542236328125, 0.6450424194335938, 0.6655426025390625, 0.6860427856445312, 0.70654296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 5.0, 10.0, 31.0, 35.0, 53.0, 104.0, 152.0, 170.0, 159.0, 122.0, 55.0, 49.0, 17.0, 15.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2743020057678223, -3.1289138793945312, -2.9835257530212402, -2.838137626647949, -2.692749500274658, -2.547361373901367, -2.401973247528076, -2.256585121154785, -2.111196994781494, -1.9658088684082031, -1.820420742034912, -1.675032615661621, -1.52964448928833, -1.384256362915039, -1.2388681173324585, -1.0934799909591675, -0.9480917453765869, -0.8027036190032959, -0.6573154926300049, -0.5119273066520691, -0.3665391802787781, -0.22115105390548706, -0.07576286792755127, 0.06962525844573975, 0.21501338481903076, 0.3604015111923218, 0.5057896375656128, 0.6511778235435486, 0.7965659499168396, 0.9419540762901306, 1.0873422622680664, 1.2327303886413574, 1.3781185150146484, 1.5235066413879395, 1.6688947677612305, 1.8142828941345215, 1.9596710205078125, 2.1050591468811035, 2.2504472732543945, 2.3958353996276855, 2.5412235260009766, 2.6866116523742676, 2.8319997787475586, 2.9773879051208496, 3.1227760314941406, 3.2681641578674316, 3.4135522842407227, 3.5589404106140137, 3.704328775405884, 3.849716901779175, 3.995105028152466, 4.140493392944336, 4.285881519317627, 4.431269645690918, 4.576657772064209, 4.7220458984375, 4.867434024810791, 5.012822151184082, 5.158210277557373, 5.303598403930664, 5.448986530303955, 5.594374656677246, 5.739762783050537, 5.885150909423828, 6.030539035797119]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 12.0, 12.0, 24.0, 13.0, 27.0, 17.0, 32.0, 35.0, 46.0, 44.0, 50.0, 51.0, 60.0, 60.0, 51.0, 49.0, 56.0, 52.0, 45.0, 34.0, 43.0, 27.0, 29.0, 28.0, 16.0, 20.0, 10.0, 11.0, 3.0, 4.0, 2.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.029968023300171, -1.9686391353607178, -1.907310128211975, -1.845981240272522, -1.7846523523330688, -1.7233233451843262, -1.661994457244873, -1.60066556930542, -1.5393366813659668, -1.4780077934265137, -1.416678786277771, -1.3553498983383179, -1.2940210103988647, -1.232692003250122, -1.171363115310669, -1.1100342273712158, -1.0487052202224731, -0.9873762726783752, -0.9260473847389221, -0.8647184371948242, -0.8033895492553711, -0.7420606017112732, -0.6807316541671753, -0.6194027662277222, -0.5580738186836243, -0.49674490094184875, -0.43541598320007324, -0.37408703565597534, -0.31275811791419983, -0.2514292001724243, -0.19010025262832642, -0.1287713348865509, -0.06744253635406494, -0.006113611161708832, 0.05521531403064728, 0.11654424667358398, 0.1778731644153595, 0.239202082157135, 0.3005310297012329, 0.3618599474430084, 0.42318886518478394, 0.48451778292655945, 0.545846700668335, 0.6071756482124329, 0.6685045957565308, 0.7298334836959839, 0.7911624312400818, 0.8524913787841797, 0.9138202667236328, 0.9751492142677307, 1.0364781618118286, 1.0978070497512817, 1.1591359376907349, 1.2204649448394775, 1.2817938327789307, 1.3431227207183838, 1.404451608657837, 1.46578049659729, 1.5271095037460327, 1.5884383916854858, 1.649767279624939, 1.7110962867736816, 1.7724251747131348, 1.833754062652588, 1.8950830698013306]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 5.0, 13.0, 9.0, 13.0, 23.0, 33.0, 39.0, 68.0, 75.0, 127.0, 214.0, 351.0, 536.0, 966.0, 1564.0, 2969.0, 5989.0, 14633.0, 48827.0, 261582.0, 535112.0, 127286.0, 28116.0, 9907.0, 4491.0, 2316.0, 1217.0, 705.0, 408.0, 303.0, 217.0, 113.0, 103.0, 58.0, 48.0, 26.0, 26.0, 10.0, 11.0, 8.0, 12.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.36962890625, -0.35852813720703125, -0.3474273681640625, -0.33632659912109375, -0.325225830078125, -0.31412506103515625, -0.3030242919921875, -0.29192352294921875, -0.28082275390625, -0.26972198486328125, -0.2586212158203125, -0.24752044677734375, -0.236419677734375, -0.22531890869140625, -0.2142181396484375, -0.20311737060546875, -0.1920166015625, -0.18091583251953125, -0.1698150634765625, -0.15871429443359375, -0.147613525390625, -0.13651275634765625, -0.1254119873046875, -0.11431121826171875, -0.10321044921875, -0.09210968017578125, -0.0810089111328125, -0.06990814208984375, -0.058807373046875, -0.04770660400390625, -0.0366058349609375, -0.02550506591796875, -0.014404296875, -0.00330352783203125, 0.0077972412109375, 0.01889801025390625, 0.029998779296875, 0.04109954833984375, 0.0522003173828125, 0.06330108642578125, 0.07440185546875, 0.08550262451171875, 0.0966033935546875, 0.10770416259765625, 0.118804931640625, 0.12990570068359375, 0.1410064697265625, 0.15210723876953125, 0.1632080078125, 0.17430877685546875, 0.1854095458984375, 0.19651031494140625, 0.207611083984375, 0.21871185302734375, 0.2298126220703125, 0.24091339111328125, 0.25201416015625, 0.26311492919921875, 0.2742156982421875, 0.28531646728515625, 0.296417236328125, 0.30751800537109375, 0.3186187744140625, 0.32971954345703125, 0.3408203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 11.0, 9.0, 17.0, 19.0, 16.0, 27.0, 26.0, 46.0, 49.0, 39.0, 64.0, 60.0, 65.0, 71.0, 52.0, 53.0, 42.0, 47.0, 50.0, 35.0, 35.0, 35.0, 26.0, 24.0, 16.0, 11.0, 7.0, 6.0, 10.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.6683197021484375, -1.616912841796875, -1.5655059814453125, -1.51409912109375, -1.4626922607421875, -1.411285400390625, -1.3598785400390625, -1.3084716796875, -1.2570648193359375, -1.205657958984375, -1.1542510986328125, -1.10284423828125, -1.0514373779296875, -1.000030517578125, -0.9486236572265625, -0.897216796875, -0.8458099365234375, -0.794403076171875, -0.7429962158203125, -0.69158935546875, -0.6401824951171875, -0.588775634765625, -0.5373687744140625, -0.4859619140625, -0.4345550537109375, -0.383148193359375, -0.3317413330078125, -0.28033447265625, -0.2289276123046875, -0.177520751953125, -0.1261138916015625, -0.07470703125, -0.0233001708984375, 0.028106689453125, 0.0795135498046875, 0.13092041015625, 0.1823272705078125, 0.233734130859375, 0.2851409912109375, 0.3365478515625, 0.3879547119140625, 0.439361572265625, 0.4907684326171875, 0.54217529296875, 0.5935821533203125, 0.644989013671875, 0.6963958740234375, 0.747802734375, 0.7992095947265625, 0.850616455078125, 0.9020233154296875, 0.95343017578125, 1.0048370361328125, 1.056243896484375, 1.1076507568359375, 1.1590576171875, 1.2104644775390625, 1.261871337890625, 1.3132781982421875, 1.36468505859375, 1.4160919189453125, 1.467498779296875, 1.5189056396484375, 1.5703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 1.0, 4.0, 4.0, 6.0, 12.0, 15.0, 18.0, 35.0, 28.0, 53.0, 64.0, 99.0, 116.0, 235.0, 376.0, 561.0, 940.0, 1664.0, 3374.0, 7775.0, 21335.0, 86718.0, 403508.0, 399290.0, 85691.0, 21343.0, 7624.0, 3401.0, 1670.0, 961.0, 550.0, 338.0, 229.0, 146.0, 112.0, 68.0, 46.0, 30.0, 34.0, 22.0, 13.0, 9.0, 13.0, 8.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.293701171875, -0.2839088439941406, -0.27411651611328125, -0.2643241882324219, -0.2545318603515625, -0.24473953247070312, -0.23494720458984375, -0.22515487670898438, -0.215362548828125, -0.20557022094726562, -0.19577789306640625, -0.18598556518554688, -0.1761932373046875, -0.16640090942382812, -0.15660858154296875, -0.14681625366210938, -0.13702392578125, -0.12723159790039062, -0.11743927001953125, -0.10764694213867188, -0.0978546142578125, -0.08806228637695312, -0.07826995849609375, -0.06847763061523438, -0.058685302734375, -0.048892974853515625, -0.03910064697265625, -0.029308319091796875, -0.0195159912109375, -0.009723663330078125, 6.866455078125e-05, 0.009860992431640625, 0.0196533203125, 0.029445648193359375, 0.03923797607421875, 0.049030303955078125, 0.0588226318359375, 0.06861495971679688, 0.07840728759765625, 0.08819961547851562, 0.097991943359375, 0.10778427124023438, 0.11757659912109375, 0.12736892700195312, 0.1371612548828125, 0.14695358276367188, 0.15674591064453125, 0.16653823852539062, 0.17633056640625, 0.18612289428710938, 0.19591522216796875, 0.20570755004882812, 0.2154998779296875, 0.22529220581054688, 0.23508453369140625, 0.24487686157226562, 0.254669189453125, 0.2644615173339844, 0.27425384521484375, 0.2840461730957031, 0.2938385009765625, 0.3036308288574219, 0.31342315673828125, 0.3232154846191406, 0.3330078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 15.0, 10.0, 12.0, 18.0, 22.0, 24.0, 24.0, 25.0, 31.0, 34.0, 48.0, 49.0, 53.0, 53.0, 66.0, 65.0, 59.0, 47.0, 47.0, 48.0, 48.0, 28.0, 33.0, 27.0, 18.0, 13.0, 18.0, 15.0, 13.0, 13.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.04296875, -2.93072509765625, -2.8184814453125, -2.70623779296875, -2.593994140625, -2.48175048828125, -2.3695068359375, -2.25726318359375, -2.14501953125, -2.03277587890625, -1.9205322265625, -1.80828857421875, -1.696044921875, -1.58380126953125, -1.4715576171875, -1.35931396484375, -1.2470703125, -1.13482666015625, -1.0225830078125, -0.91033935546875, -0.798095703125, -0.68585205078125, -0.5736083984375, -0.46136474609375, -0.34912109375, -0.23687744140625, -0.1246337890625, -0.01239013671875, 0.099853515625, 0.21209716796875, 0.3243408203125, 0.43658447265625, 0.548828125, 0.66107177734375, 0.7733154296875, 0.88555908203125, 0.997802734375, 1.11004638671875, 1.2222900390625, 1.33453369140625, 1.44677734375, 1.55902099609375, 1.6712646484375, 1.78350830078125, 1.895751953125, 2.00799560546875, 2.1202392578125, 2.23248291015625, 2.3447265625, 2.45697021484375, 2.5692138671875, 2.68145751953125, 2.793701171875, 2.90594482421875, 3.0181884765625, 3.13043212890625, 3.24267578125, 3.35491943359375, 3.4671630859375, 3.57940673828125, 3.691650390625, 3.80389404296875, 3.9161376953125, 4.02838134765625, 4.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 2.0, 4.0, 9.0, 10.0, 14.0, 14.0, 18.0, 31.0, 53.0, 83.0, 118.0, 229.0, 331.0, 631.0, 1293.0, 2773.0, 7003.0, 25243.0, 184313.0, 692865.0, 105731.0, 17731.0, 5347.0, 2242.0, 1048.0, 577.0, 338.0, 161.0, 101.0, 77.0, 41.0, 38.0, 27.0, 16.0, 13.0, 4.0, 6.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11956787109375, -0.11575794219970703, -0.11194801330566406, -0.1081380844116211, -0.10432815551757812, -0.10051822662353516, -0.09670829772949219, -0.09289836883544922, -0.08908843994140625, -0.08527851104736328, -0.08146858215332031, -0.07765865325927734, -0.07384872436523438, -0.0700387954711914, -0.06622886657714844, -0.06241893768310547, -0.0586090087890625, -0.05479907989501953, -0.05098915100097656, -0.047179222106933594, -0.043369293212890625, -0.039559364318847656, -0.03574943542480469, -0.03193950653076172, -0.02812957763671875, -0.02431964874267578, -0.020509719848632812, -0.016699790954589844, -0.012889862060546875, -0.009079933166503906, -0.0052700042724609375, -0.0014600753784179688, 0.002349853515625, 0.006159782409667969, 0.009969711303710938, 0.013779640197753906, 0.017589569091796875, 0.021399497985839844, 0.025209426879882812, 0.02901935577392578, 0.03282928466796875, 0.03663921356201172, 0.04044914245605469, 0.044259071350097656, 0.048069000244140625, 0.051878929138183594, 0.05568885803222656, 0.05949878692626953, 0.0633087158203125, 0.06711864471435547, 0.07092857360839844, 0.0747385025024414, 0.07854843139648438, 0.08235836029052734, 0.08616828918457031, 0.08997821807861328, 0.09378814697265625, 0.09759807586669922, 0.10140800476074219, 0.10521793365478516, 0.10902786254882812, 0.1128377914428711, 0.11664772033691406, 0.12045764923095703, 0.124267578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 7.0, 6.0, 4.0, 4.0, 15.0, 16.0, 23.0, 21.0, 32.0, 46.0, 78.0, 87.0, 78.0, 90.0, 102.0, 100.0, 62.0, 61.0, 46.0, 29.0, 26.0, 14.0, 15.0, 11.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9591064453125e-05, -4.779268056154251e-05, -4.599429666996002e-05, -4.419591277837753e-05, -4.2397528886795044e-05, -4.0599144995212555e-05, -3.8800761103630066e-05, -3.700237721204758e-05, -3.520399332046509e-05, -3.34056094288826e-05, -3.160722553730011e-05, -2.980884164571762e-05, -2.8010457754135132e-05, -2.6212073862552643e-05, -2.4413689970970154e-05, -2.2615306079387665e-05, -2.0816922187805176e-05, -1.9018538296222687e-05, -1.7220154404640198e-05, -1.542177051305771e-05, -1.362338662147522e-05, -1.182500272989273e-05, -1.0026618838310242e-05, -8.228234946727753e-06, -6.429851055145264e-06, -4.631467163562775e-06, -2.8330832719802856e-06, -1.0346993803977966e-06, 7.636845111846924e-07, 2.5620684027671814e-06, 4.36045229434967e-06, 6.1588361859321594e-06, 7.957220077514648e-06, 9.755603969097137e-06, 1.1553987860679626e-05, 1.3352371752262115e-05, 1.5150755643844604e-05, 1.6949139535427094e-05, 1.8747523427009583e-05, 2.054590731859207e-05, 2.234429121017456e-05, 2.414267510175705e-05, 2.594105899333954e-05, 2.7739442884922028e-05, 2.9537826776504517e-05, 3.1336210668087006e-05, 3.3134594559669495e-05, 3.4932978451251984e-05, 3.673136234283447e-05, 3.852974623441696e-05, 4.032813012599945e-05, 4.212651401758194e-05, 4.392489790916443e-05, 4.572328180074692e-05, 4.752166569232941e-05, 4.9320049583911896e-05, 5.1118433475494385e-05, 5.2916817367076874e-05, 5.471520125865936e-05, 5.651358515024185e-05, 5.831196904182434e-05, 6.011035293340683e-05, 6.190873682498932e-05, 6.370712071657181e-05, 6.55055046081543e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 11.0, 15.0, 14.0, 29.0, 36.0, 72.0, 101.0, 165.0, 282.0, 455.0, 873.0, 1707.0, 3650.0, 9005.0, 28942.0, 209224.0, 680277.0, 84464.0, 17407.0, 6223.0, 2622.0, 1334.0, 648.0, 368.0, 238.0, 151.0, 57.0, 64.0, 34.0, 21.0, 16.0, 7.0, 8.0, 6.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.146240234375, -0.14209842681884766, -0.1379566192626953, -0.13381481170654297, -0.12967300415039062, -0.12553119659423828, -0.12138938903808594, -0.1172475814819336, -0.11310577392578125, -0.1089639663696289, -0.10482215881347656, -0.10068035125732422, -0.09653854370117188, -0.09239673614501953, -0.08825492858886719, -0.08411312103271484, -0.0799713134765625, -0.07582950592041016, -0.07168769836425781, -0.06754589080810547, -0.06340408325195312, -0.05926227569580078, -0.05512046813964844, -0.050978660583496094, -0.04683685302734375, -0.042695045471191406, -0.03855323791503906, -0.03441143035888672, -0.030269622802734375, -0.02612781524658203, -0.021986007690429688, -0.017844200134277344, -0.013702392578125, -0.009560585021972656, -0.0054187774658203125, -0.0012769699096679688, 0.002864837646484375, 0.007006645202636719, 0.011148452758789062, 0.015290260314941406, 0.01943206787109375, 0.023573875427246094, 0.027715682983398438, 0.03185749053955078, 0.035999298095703125, 0.04014110565185547, 0.04428291320800781, 0.048424720764160156, 0.0525665283203125, 0.056708335876464844, 0.06085014343261719, 0.06499195098876953, 0.06913375854492188, 0.07327556610107422, 0.07741737365722656, 0.0815591812133789, 0.08570098876953125, 0.0898427963256836, 0.09398460388183594, 0.09812641143798828, 0.10226821899414062, 0.10641002655029297, 0.11055183410644531, 0.11469364166259766, 0.11883544921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 1.0, 3.0, 6.0, 5.0, 8.0, 24.0, 22.0, 36.0, 45.0, 88.0, 107.0, 162.0, 144.0, 108.0, 80.0, 37.0, 32.0, 13.0, 19.0, 10.0, 11.0, 7.0, 6.0, 3.0, 1.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.046905517578125, -0.04563283920288086, -0.04436016082763672, -0.04308748245239258, -0.04181480407714844, -0.0405421257019043, -0.039269447326660156, -0.037996768951416016, -0.036724090576171875, -0.035451412200927734, -0.034178733825683594, -0.03290605545043945, -0.03163337707519531, -0.030360698699951172, -0.02908802032470703, -0.02781534194946289, -0.02654266357421875, -0.02526998519897461, -0.02399730682373047, -0.022724628448486328, -0.021451950073242188, -0.020179271697998047, -0.018906593322753906, -0.017633914947509766, -0.016361236572265625, -0.015088558197021484, -0.013815879821777344, -0.012543201446533203, -0.011270523071289062, -0.009997844696044922, -0.008725166320800781, -0.007452487945556641, -0.0061798095703125, -0.004907131195068359, -0.0036344528198242188, -0.002361774444580078, -0.0010890960693359375, 0.00018358230590820312, 0.0014562606811523438, 0.0027289390563964844, 0.004001617431640625, 0.005274295806884766, 0.006546974182128906, 0.007819652557373047, 0.009092330932617188, 0.010365009307861328, 0.011637687683105469, 0.01291036605834961, 0.01418304443359375, 0.01545572280883789, 0.01672840118408203, 0.018001079559326172, 0.019273757934570312, 0.020546436309814453, 0.021819114685058594, 0.023091793060302734, 0.024364471435546875, 0.025637149810791016, 0.026909828186035156, 0.028182506561279297, 0.029455184936523438, 0.030727863311767578, 0.03200054168701172, 0.03327322006225586, 0.0345458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 1.0, 5.0, 7.0, 6.0, 11.0, 22.0, 29.0, 47.0, 82.0, 149.0, 153.0, 147.0, 125.0, 88.0, 54.0, 31.0, 18.0, 11.0, 3.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7874157428741455, -2.6876680850982666, -2.5879201889038086, -2.4881725311279297, -2.388424873352051, -2.288677215576172, -2.188929557800293, -2.089181661605835, -1.989434003829956, -1.8896863460540771, -1.7899385690689087, -1.6901907920837402, -1.5904431343078613, -1.4906954765319824, -1.390947699546814, -1.2911999225616455, -1.1914522647857666, -1.0917046070098877, -0.9919568300247192, -0.8922091126441956, -0.7924613952636719, -0.6927136778831482, -0.5929659605026245, -0.49321824312210083, -0.39347052574157715, -0.29372280836105347, -0.19397509098052979, -0.0942273736000061, 0.005520343780517578, 0.10526806116104126, 0.20501577854156494, 0.3047634959220886, 0.4045112133026123, 0.504258930683136, 0.6040066480636597, 0.7037543654441833, 0.803502082824707, 0.9032498002052307, 1.0029975175857544, 1.1027452945709229, 1.2024929523468018, 1.3022406101226807, 1.4019883871078491, 1.5017361640930176, 1.6014838218688965, 1.7012314796447754, 1.8009792566299438, 1.9007270336151123, 2.000474691390991, 2.10022234916687, 2.199970245361328, 2.299717903137207, 2.399465560913086, 2.499213218688965, 2.5989608764648438, 2.6987087726593018, 2.7984564304351807, 2.8982040882110596, 2.9979519844055176, 3.0976996421813965, 3.1974472999572754, 3.2971949577331543, 3.396942615509033, 3.496690511703491, 3.59643816947937]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 9.0, 4.0, 13.0, 14.0, 20.0, 28.0, 21.0, 24.0, 48.0, 57.0, 53.0, 61.0, 64.0, 63.0, 56.0, 74.0, 61.0, 59.0, 40.0, 41.0, 41.0, 30.0, 22.0, 22.0, 18.0, 7.0, 10.0, 8.0, 2.0, 5.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6601585149765015, -1.6081640720367432, -1.5561696290969849, -1.5041751861572266, -1.4521807432174683, -1.40018630027771, -1.3481918573379517, -1.2961974143981934, -1.244202971458435, -1.1922085285186768, -1.1402140855789185, -1.0882196426391602, -1.0362251996994019, -0.9842307567596436, -0.9322363138198853, -0.880241870880127, -0.8282474279403687, -0.7762529850006104, -0.724258542060852, -0.6722640991210938, -0.6202696561813354, -0.5682752132415771, -0.5162807703018188, -0.46428632736206055, -0.41229188442230225, -0.36029744148254395, -0.30830299854278564, -0.25630855560302734, -0.20431411266326904, -0.15231966972351074, -0.10032522678375244, -0.04833078384399414, 0.003663778305053711, 0.05565822124481201, 0.10765266418457031, 0.1596471071243286, 0.21164155006408691, 0.2636359930038452, 0.3156304359436035, 0.3676248788833618, 0.4196193218231201, 0.4716137647628784, 0.5236082077026367, 0.575602650642395, 0.6275970935821533, 0.6795915365219116, 0.7315859794616699, 0.7835804224014282, 0.8355748653411865, 0.8875693082809448, 0.9395637512207031, 0.9915581941604614, 1.0435526371002197, 1.095547080039978, 1.1475415229797363, 1.1995359659194946, 1.251530408859253, 1.3035248517990112, 1.3555192947387695, 1.4075137376785278, 1.4595081806182861, 1.5115026235580444, 1.5634970664978027, 1.615491509437561, 1.6674859523773193]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 13.0, 36.0, 40.0, 61.0, 94.0, 132.0, 231.0, 356.0, 633.0, 1265.0, 2530.0, 5990.0, 18944.0, 111448.0, 814344.0, 68303.0, 14404.0, 4999.0, 2170.0, 1063.0, 517.0, 318.0, 202.0, 147.0, 88.0, 55.0, 38.0, 26.0, 25.0, 12.0, 6.0, 10.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.308197021484375, -2.22967529296875, -2.151153564453125, -2.0726318359375, -1.994110107421875, -1.91558837890625, -1.837066650390625, -1.758544921875, -1.680023193359375, -1.60150146484375, -1.522979736328125, -1.4444580078125, -1.365936279296875, -1.28741455078125, -1.208892822265625, -1.13037109375, -1.051849365234375, -0.97332763671875, -0.894805908203125, -0.8162841796875, -0.737762451171875, -0.65924072265625, -0.580718994140625, -0.502197265625, -0.423675537109375, -0.34515380859375, -0.266632080078125, -0.1881103515625, -0.109588623046875, -0.03106689453125, 0.047454833984375, 0.1259765625, 0.204498291015625, 0.28302001953125, 0.361541748046875, 0.4400634765625, 0.518585205078125, 0.59710693359375, 0.675628662109375, 0.754150390625, 0.832672119140625, 0.91119384765625, 0.989715576171875, 1.0682373046875, 1.146759033203125, 1.22528076171875, 1.303802490234375, 1.38232421875, 1.460845947265625, 1.53936767578125, 1.617889404296875, 1.6964111328125, 1.774932861328125, 1.85345458984375, 1.931976318359375, 2.010498046875, 2.089019775390625, 2.16754150390625, 2.246063232421875, 2.3245849609375, 2.403106689453125, 2.48162841796875, 2.560150146484375, 2.638671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 7.0, 3.0, 2.0, 3.0, 12.0, 8.0, 15.0, 17.0, 29.0, 23.0, 23.0, 33.0, 69.0, 74.0, 69.0, 51.0, 97.0, 79.0, 82.0, 63.0, 52.0, 42.0, 31.0, 29.0, 24.0, 18.0, 13.0, 11.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.291015625, -3.179107666015625, -3.06719970703125, -2.955291748046875, -2.8433837890625, -2.731475830078125, -2.61956787109375, -2.507659912109375, -2.395751953125, -2.283843994140625, -2.17193603515625, -2.060028076171875, -1.9481201171875, -1.836212158203125, -1.72430419921875, -1.612396240234375, -1.50048828125, -1.388580322265625, -1.27667236328125, -1.164764404296875, -1.0528564453125, -0.940948486328125, -0.82904052734375, -0.717132568359375, -0.605224609375, -0.493316650390625, -0.38140869140625, -0.269500732421875, -0.1575927734375, -0.045684814453125, 0.06622314453125, 0.178131103515625, 0.2900390625, 0.401947021484375, 0.51385498046875, 0.625762939453125, 0.7376708984375, 0.849578857421875, 0.96148681640625, 1.073394775390625, 1.185302734375, 1.297210693359375, 1.40911865234375, 1.521026611328125, 1.6329345703125, 1.744842529296875, 1.85675048828125, 1.968658447265625, 2.08056640625, 2.192474365234375, 2.30438232421875, 2.416290283203125, 2.5281982421875, 2.640106201171875, 2.75201416015625, 2.863922119140625, 2.975830078125, 3.087738037109375, 3.19964599609375, 3.311553955078125, 3.4234619140625, 3.535369873046875, 3.64727783203125, 3.759185791015625, 3.87109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 12.0, 12.0, 21.0, 26.0, 26.0, 58.0, 66.0, 118.0, 237.0, 537.0, 2063.0, 13132.0, 751185.0, 268076.0, 10047.0, 1781.0, 559.0, 206.0, 126.0, 75.0, 53.0, 46.0, 26.0, 14.0, 16.0, 9.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.48828125, -6.3216552734375, -6.155029296875, -5.9884033203125, -5.82177734375, -5.6551513671875, -5.488525390625, -5.3218994140625, -5.1552734375, -4.9886474609375, -4.822021484375, -4.6553955078125, -4.48876953125, -4.3221435546875, -4.155517578125, -3.9888916015625, -3.822265625, -3.6556396484375, -3.489013671875, -3.3223876953125, -3.15576171875, -2.9891357421875, -2.822509765625, -2.6558837890625, -2.4892578125, -2.3226318359375, -2.156005859375, -1.9893798828125, -1.82275390625, -1.6561279296875, -1.489501953125, -1.3228759765625, -1.15625, -0.9896240234375, -0.822998046875, -0.6563720703125, -0.48974609375, -0.3231201171875, -0.156494140625, 0.0101318359375, 0.1767578125, 0.3433837890625, 0.510009765625, 0.6766357421875, 0.84326171875, 1.0098876953125, 1.176513671875, 1.3431396484375, 1.509765625, 1.6763916015625, 1.843017578125, 2.0096435546875, 2.17626953125, 2.3428955078125, 2.509521484375, 2.6761474609375, 2.8427734375, 3.0093994140625, 3.176025390625, 3.3426513671875, 3.50927734375, 3.6759033203125, 3.842529296875, 4.0091552734375, 4.17578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 6.0, 13.0, 15.0, 16.0, 21.0, 11.0, 18.0, 37.0, 42.0, 41.0, 43.0, 35.0, 64.0, 50.0, 55.0, 77.0, 56.0, 64.0, 43.0, 54.0, 46.0, 47.0, 23.0, 25.0, 29.0, 19.0, 9.0, 11.0, 9.0, 8.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4296875, -5.286163330078125, -5.14263916015625, -4.999114990234375, -4.8555908203125, -4.712066650390625, -4.56854248046875, -4.425018310546875, -4.281494140625, -4.137969970703125, -3.99444580078125, -3.850921630859375, -3.7073974609375, -3.563873291015625, -3.42034912109375, -3.276824951171875, -3.13330078125, -2.989776611328125, -2.84625244140625, -2.702728271484375, -2.5592041015625, -2.415679931640625, -2.27215576171875, -2.128631591796875, -1.985107421875, -1.841583251953125, -1.69805908203125, -1.554534912109375, -1.4110107421875, -1.267486572265625, -1.12396240234375, -0.980438232421875, -0.8369140625, -0.693389892578125, -0.54986572265625, -0.406341552734375, -0.2628173828125, -0.119293212890625, 0.02423095703125, 0.167755126953125, 0.311279296875, 0.454803466796875, 0.59832763671875, 0.741851806640625, 0.8853759765625, 1.028900146484375, 1.17242431640625, 1.315948486328125, 1.45947265625, 1.602996826171875, 1.74652099609375, 1.890045166015625, 2.0335693359375, 2.177093505859375, 2.32061767578125, 2.464141845703125, 2.607666015625, 2.751190185546875, 2.89471435546875, 3.038238525390625, 3.1817626953125, 3.325286865234375, 3.46881103515625, 3.612335205078125, 3.755859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 6.0, 13.0, 12.0, 13.0, 21.0, 44.0, 84.0, 184.0, 464.0, 2007.0, 15396.0, 326747.0, 680563.0, 19581.0, 2469.0, 549.0, 191.0, 89.0, 40.0, 33.0, 10.0, 7.0, 7.0, 3.0, 6.0, 9.0, 4.0, 2.0, 1.0], "bins": [-1.572265625, -1.538848876953125, -1.50543212890625, -1.472015380859375, -1.4385986328125, -1.405181884765625, -1.37176513671875, -1.338348388671875, -1.304931640625, -1.271514892578125, -1.23809814453125, -1.204681396484375, -1.1712646484375, -1.137847900390625, -1.10443115234375, -1.071014404296875, -1.03759765625, -1.004180908203125, -0.97076416015625, -0.937347412109375, -0.9039306640625, -0.870513916015625, -0.83709716796875, -0.803680419921875, -0.770263671875, -0.736846923828125, -0.70343017578125, -0.670013427734375, -0.6365966796875, -0.603179931640625, -0.56976318359375, -0.536346435546875, -0.5029296875, -0.469512939453125, -0.43609619140625, -0.402679443359375, -0.3692626953125, -0.335845947265625, -0.30242919921875, -0.269012451171875, -0.235595703125, -0.202178955078125, -0.16876220703125, -0.135345458984375, -0.1019287109375, -0.068511962890625, -0.03509521484375, -0.001678466796875, 0.03173828125, 0.065155029296875, 0.09857177734375, 0.131988525390625, 0.1654052734375, 0.198822021484375, 0.23223876953125, 0.265655517578125, 0.299072265625, 0.332489013671875, 0.36590576171875, 0.399322509765625, 0.4327392578125, 0.466156005859375, 0.49957275390625, 0.532989501953125, 0.56640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 3.0, 4.0, 6.0, 11.0, 14.0, 10.0, 19.0, 30.0, 28.0, 62.0, 96.0, 192.0, 196.0, 98.0, 61.0, 38.0, 38.0, 24.0, 6.0, 17.0, 8.0, 7.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.604194641113281e-05, -6.330013275146484e-05, -6.0558319091796875e-05, -5.7816505432128906e-05, -5.507469177246094e-05, -5.233287811279297e-05, -4.9591064453125e-05, -4.684925079345703e-05, -4.410743713378906e-05, -4.1365623474121094e-05, -3.8623809814453125e-05, -3.5881996154785156e-05, -3.314018249511719e-05, -3.039836883544922e-05, -2.765655517578125e-05, -2.491474151611328e-05, -2.2172927856445312e-05, -1.9431114196777344e-05, -1.6689300537109375e-05, -1.3947486877441406e-05, -1.1205673217773438e-05, -8.463859558105469e-06, -5.7220458984375e-06, -2.9802322387695312e-06, -2.384185791015625e-07, 2.5033950805664062e-06, 5.245208740234375e-06, 7.987022399902344e-06, 1.0728836059570312e-05, 1.3470649719238281e-05, 1.621246337890625e-05, 1.895427703857422e-05, 2.1696090698242188e-05, 2.4437904357910156e-05, 2.7179718017578125e-05, 2.9921531677246094e-05, 3.266334533691406e-05, 3.540515899658203e-05, 3.814697265625e-05, 4.088878631591797e-05, 4.363059997558594e-05, 4.6372413635253906e-05, 4.9114227294921875e-05, 5.1856040954589844e-05, 5.459785461425781e-05, 5.733966827392578e-05, 6.008148193359375e-05, 6.282329559326172e-05, 6.556510925292969e-05, 6.830692291259766e-05, 7.104873657226562e-05, 7.37905502319336e-05, 7.653236389160156e-05, 7.927417755126953e-05, 8.20159912109375e-05, 8.475780487060547e-05, 8.749961853027344e-05, 9.02414321899414e-05, 9.298324584960938e-05, 9.572505950927734e-05, 9.846687316894531e-05, 0.00010120868682861328, 0.00010395050048828125, 0.00010669231414794922, 0.00010943412780761719]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 7.0, 11.0, 15.0, 29.0, 50.0, 86.0, 193.0, 512.0, 1538.0, 7191.0, 54463.0, 882651.0, 88806.0, 9951.0, 2025.0, 574.0, 227.0, 100.0, 57.0, 25.0, 15.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94970703125, -0.9176101684570312, -0.8855133056640625, -0.8534164428710938, -0.821319580078125, -0.7892227172851562, -0.7571258544921875, -0.7250289916992188, -0.69293212890625, -0.6608352661132812, -0.6287384033203125, -0.5966415405273438, -0.564544677734375, -0.5324478149414062, -0.5003509521484375, -0.46825408935546875, -0.4361572265625, -0.40406036376953125, -0.3719635009765625, -0.33986663818359375, -0.307769775390625, -0.27567291259765625, -0.2435760498046875, -0.21147918701171875, -0.17938232421875, -0.14728546142578125, -0.1151885986328125, -0.08309173583984375, -0.050994873046875, -0.01889801025390625, 0.0131988525390625, 0.04529571533203125, 0.077392578125, 0.10948944091796875, 0.1415863037109375, 0.17368316650390625, 0.205780029296875, 0.23787689208984375, 0.2699737548828125, 0.30207061767578125, 0.33416748046875, 0.36626434326171875, 0.3983612060546875, 0.43045806884765625, 0.462554931640625, 0.49465179443359375, 0.5267486572265625, 0.5588455200195312, 0.5909423828125, 0.6230392456054688, 0.6551361083984375, 0.6872329711914062, 0.719329833984375, 0.7514266967773438, 0.7835235595703125, 0.8156204223632812, 0.84771728515625, 0.8798141479492188, 0.9119110107421875, 0.9440078735351562, 0.976104736328125, 1.0082015991210938, 1.0402984619140625, 1.0723953247070312, 1.1044921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 7.0, 3.0, 6.0, 6.0, 19.0, 23.0, 18.0, 39.0, 52.0, 67.0, 114.0, 268.0, 115.0, 66.0, 47.0, 31.0, 34.0, 12.0, 17.0, 13.0, 7.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31298828125, -0.3030548095703125, -0.293121337890625, -0.2831878662109375, -0.27325439453125, -0.2633209228515625, -0.253387451171875, -0.2434539794921875, -0.2335205078125, -0.2235870361328125, -0.213653564453125, -0.2037200927734375, -0.19378662109375, -0.1838531494140625, -0.173919677734375, -0.1639862060546875, -0.154052734375, -0.1441192626953125, -0.134185791015625, -0.1242523193359375, -0.11431884765625, -0.1043853759765625, -0.094451904296875, -0.0845184326171875, -0.0745849609375, -0.0646514892578125, -0.054718017578125, -0.0447845458984375, -0.03485107421875, -0.0249176025390625, -0.014984130859375, -0.0050506591796875, 0.0048828125, 0.0148162841796875, 0.024749755859375, 0.0346832275390625, 0.04461669921875, 0.0545501708984375, 0.064483642578125, 0.0744171142578125, 0.0843505859375, 0.0942840576171875, 0.104217529296875, 0.1141510009765625, 0.12408447265625, 0.1340179443359375, 0.143951416015625, 0.1538848876953125, 0.163818359375, 0.1737518310546875, 0.183685302734375, 0.1936187744140625, 0.20355224609375, 0.2134857177734375, 0.223419189453125, 0.2333526611328125, 0.2432861328125, 0.2532196044921875, 0.263153076171875, 0.2730865478515625, 0.28302001953125, 0.2929534912109375, 0.302886962890625, 0.3128204345703125, 0.32275390625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 9.0, 5.0, 24.0, 50.0, 134.0, 278.0, 271.0, 153.0, 55.0, 12.0, 9.0, 1.0, 6.0, 1.0, 2.0, 0.0, 3.0], "bins": [-21.024106979370117, -20.627666473388672, -20.231225967407227, -19.83478546142578, -19.438343048095703, -19.041902542114258, -18.645462036132812, -18.249021530151367, -17.852581024169922, -17.456140518188477, -17.05970001220703, -16.663259506225586, -16.266817092895508, -15.870377540588379, -15.473936080932617, -15.077495574951172, -14.681055068969727, -14.284614562988281, -13.88817310333252, -13.491732597351074, -13.095292091369629, -12.698851585388184, -12.302410125732422, -11.905969619750977, -11.509528160095215, -11.11308765411377, -10.716646194458008, -10.320205688476562, -9.923765182495117, -9.527324676513672, -9.13088321685791, -8.734442710876465, -8.338001251220703, -7.9415602684021, -7.545119762420654, -7.148678779602051, -6.7522382736206055, -6.355797290802002, -5.959356307983398, -5.562915802001953, -5.166475296020508, -4.770034313201904, -4.373593807220459, -3.9771528244018555, -3.58071231842041, -3.1842713356018066, -2.7878305912017822, -2.391389846801758, -1.9949493408203125, -1.598508596420288, -1.2020678520202637, -0.8056269884109497, -0.4091862440109253, -0.012745499610900879, 0.3836953639984131, 0.7801361083984375, 1.176576852798462, 1.5730175971984863, 1.9694583415985107, 2.365899085998535, 2.7623400688171387, 3.158780574798584, 3.5552215576171875, 3.951662302017212, 4.348103046417236]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 4.0, 8.0, 13.0, 13.0, 10.0, 18.0, 28.0, 15.0, 22.0, 26.0, 35.0, 27.0, 39.0, 31.0, 43.0, 44.0, 44.0, 39.0, 38.0, 48.0, 46.0, 41.0, 35.0, 45.0, 34.0, 37.0, 27.0, 23.0, 34.0, 20.0, 11.0, 14.0, 18.0, 13.0, 13.0, 7.0, 5.0, 8.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.569394111633301, -6.385113716125488, -6.200833320617676, -6.016552925109863, -5.832272529602051, -5.647992134094238, -5.463711738586426, -5.279431343078613, -5.095150947570801, -4.910870552062988, -4.726590156555176, -4.542309761047363, -4.358029365539551, -4.173748970031738, -3.989468574523926, -3.8051881790161133, -3.620907783508301, -3.4366273880004883, -3.252346992492676, -3.0680665969848633, -2.883786201477051, -2.6995058059692383, -2.515225410461426, -2.3309450149536133, -2.146664619445801, -1.9623842239379883, -1.7781038284301758, -1.5938234329223633, -1.4095430374145508, -1.2252626419067383, -1.0409822463989258, -0.8567018508911133, -0.6724214553833008, -0.4881410598754883, -0.3038606643676758, -0.11958026885986328, 0.06470012664794922, 0.24898052215576172, 0.4332609176635742, 0.6175413131713867, 0.8018217086791992, 0.9861021041870117, 1.1703824996948242, 1.3546628952026367, 1.5389432907104492, 1.7232236862182617, 1.9075040817260742, 2.0917844772338867, 2.276064872741699, 2.4603452682495117, 2.644625663757324, 2.8289060592651367, 3.013186454772949, 3.1974668502807617, 3.381747245788574, 3.5660276412963867, 3.750308036804199, 3.9345884323120117, 4.118868827819824, 4.303149223327637, 4.487429618835449, 4.671710014343262, 4.855990409851074, 5.040270805358887, 5.224551200866699]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 11.0, 6.0, 16.0, 22.0, 23.0, 34.0, 28.0, 59.0, 90.0, 130.0, 133.0, 214.0, 333.0, 560.0, 947.0, 2248.0, 6118.0, 24189.0, 248927.0, 3730464.0, 150573.0, 19479.0, 5320.0, 1981.0, 897.0, 462.0, 287.0, 193.0, 151.0, 103.0, 67.0, 60.0, 49.0, 37.0, 17.0, 16.0, 12.0, 7.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.794921875, -3.684661865234375, -3.57440185546875, -3.464141845703125, -3.3538818359375, -3.243621826171875, -3.13336181640625, -3.023101806640625, -2.912841796875, -2.802581787109375, -2.69232177734375, -2.582061767578125, -2.4718017578125, -2.361541748046875, -2.25128173828125, -2.141021728515625, -2.03076171875, -1.920501708984375, -1.81024169921875, -1.699981689453125, -1.5897216796875, -1.479461669921875, -1.36920166015625, -1.258941650390625, -1.148681640625, -1.038421630859375, -0.92816162109375, -0.817901611328125, -0.7076416015625, -0.597381591796875, -0.48712158203125, -0.376861572265625, -0.2666015625, -0.156341552734375, -0.04608154296875, 0.064178466796875, 0.1744384765625, 0.284698486328125, 0.39495849609375, 0.505218505859375, 0.615478515625, 0.725738525390625, 0.83599853515625, 0.946258544921875, 1.0565185546875, 1.166778564453125, 1.27703857421875, 1.387298583984375, 1.49755859375, 1.607818603515625, 1.71807861328125, 1.828338623046875, 1.9385986328125, 2.048858642578125, 2.15911865234375, 2.269378662109375, 2.379638671875, 2.489898681640625, 2.60015869140625, 2.710418701171875, 2.8206787109375, 2.930938720703125, 3.04119873046875, 3.151458740234375, 3.26171875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 6.0, 6.0, 9.0, 17.0, 16.0, 16.0, 37.0, 27.0, 40.0, 48.0, 68.0, 70.0, 72.0, 76.0, 94.0, 70.0, 54.0, 61.0, 58.0, 34.0, 22.0, 21.0, 14.0, 13.0, 12.0, 10.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8720703125, -1.81927490234375, -1.7664794921875, -1.71368408203125, -1.660888671875, -1.60809326171875, -1.5552978515625, -1.50250244140625, -1.44970703125, -1.39691162109375, -1.3441162109375, -1.29132080078125, -1.238525390625, -1.18572998046875, -1.1329345703125, -1.08013916015625, -1.02734375, -0.97454833984375, -0.9217529296875, -0.86895751953125, -0.816162109375, -0.76336669921875, -0.7105712890625, -0.65777587890625, -0.60498046875, -0.55218505859375, -0.4993896484375, -0.44659423828125, -0.393798828125, -0.34100341796875, -0.2882080078125, -0.23541259765625, -0.1826171875, -0.12982177734375, -0.0770263671875, -0.02423095703125, 0.028564453125, 0.08135986328125, 0.1341552734375, 0.18695068359375, 0.23974609375, 0.29254150390625, 0.3453369140625, 0.39813232421875, 0.450927734375, 0.50372314453125, 0.5565185546875, 0.60931396484375, 0.662109375, 0.71490478515625, 0.7677001953125, 0.82049560546875, 0.873291015625, 0.92608642578125, 0.9788818359375, 1.03167724609375, 1.08447265625, 1.13726806640625, 1.1900634765625, 1.24285888671875, 1.295654296875, 1.34844970703125, 1.4012451171875, 1.45404052734375, 1.5068359375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 11.0, 6.0, 13.0, 15.0, 23.0, 45.0, 79.0, 147.0, 333.0, 910.0, 4510.0, 45955.0, 3757299.0, 367265.0, 14408.0, 2212.0, 546.0, 212.0, 109.0, 51.0, 36.0, 29.0, 12.0, 9.0, 14.0, 5.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.46453857421875, -4.2767333984375, -4.08892822265625, -3.901123046875, -3.71331787109375, -3.5255126953125, -3.33770751953125, -3.14990234375, -2.96209716796875, -2.7742919921875, -2.58648681640625, -2.398681640625, -2.21087646484375, -2.0230712890625, -1.83526611328125, -1.6474609375, -1.45965576171875, -1.2718505859375, -1.08404541015625, -0.896240234375, -0.70843505859375, -0.5206298828125, -0.33282470703125, -0.14501953125, 0.04278564453125, 0.2305908203125, 0.41839599609375, 0.606201171875, 0.79400634765625, 0.9818115234375, 1.16961669921875, 1.357421875, 1.54522705078125, 1.7330322265625, 1.92083740234375, 2.108642578125, 2.29644775390625, 2.4842529296875, 2.67205810546875, 2.85986328125, 3.04766845703125, 3.2354736328125, 3.42327880859375, 3.611083984375, 3.79888916015625, 3.9866943359375, 4.17449951171875, 4.3623046875, 4.55010986328125, 4.7379150390625, 4.92572021484375, 5.113525390625, 5.30133056640625, 5.4891357421875, 5.67694091796875, 5.86474609375, 6.05255126953125, 6.2403564453125, 6.42816162109375, 6.615966796875, 6.80377197265625, 6.9915771484375, 7.17938232421875, 7.3671875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 14.0, 8.0, 12.0, 16.0, 20.0, 25.0, 29.0, 39.0, 76.0, 90.0, 131.0, 217.0, 337.0, 571.0, 763.0, 594.0, 382.0, 219.0, 153.0, 93.0, 69.0, 34.0, 44.0, 26.0, 24.0, 13.0, 16.0, 8.0, 10.0, 7.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7569046020507812, -0.7350006103515625, -0.7130966186523438, -0.691192626953125, -0.6692886352539062, -0.6473846435546875, -0.6254806518554688, -0.60357666015625, -0.5816726684570312, -0.5597686767578125, -0.5378646850585938, -0.515960693359375, -0.49405670166015625, -0.4721527099609375, -0.45024871826171875, -0.4283447265625, -0.40644073486328125, -0.3845367431640625, -0.36263275146484375, -0.340728759765625, -0.31882476806640625, -0.2969207763671875, -0.27501678466796875, -0.25311279296875, -0.23120880126953125, -0.2093048095703125, -0.18740081787109375, -0.165496826171875, -0.14359283447265625, -0.1216888427734375, -0.09978485107421875, -0.077880859375, -0.05597686767578125, -0.0340728759765625, -0.01216888427734375, 0.009735107421875, 0.03163909912109375, 0.0535430908203125, 0.07544708251953125, 0.09735107421875, 0.11925506591796875, 0.1411590576171875, 0.16306304931640625, 0.184967041015625, 0.20687103271484375, 0.2287750244140625, 0.25067901611328125, 0.2725830078125, 0.29448699951171875, 0.3163909912109375, 0.33829498291015625, 0.360198974609375, 0.38210296630859375, 0.4040069580078125, 0.42591094970703125, 0.44781494140625, 0.46971893310546875, 0.4916229248046875, 0.5135269165039062, 0.535430908203125, 0.5573348999023438, 0.5792388916015625, 0.6011428833007812, 0.623046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 13.0, 21.0, 12.0, 28.0, 33.0, 49.0, 65.0, 79.0, 102.0, 122.0, 98.0, 98.0, 88.0, 58.0, 45.0, 26.0, 30.0, 13.0, 11.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.552720069885254, -2.454667091369629, -2.356614351272583, -2.258561372756958, -2.160508632659912, -2.062455654144287, -1.9644027948379517, -1.8663499355316162, -1.7682969570159912, -1.6702440977096558, -1.5721912384033203, -1.4741382598876953, -1.3760854005813599, -1.2780325412750244, -1.179979681968689, -1.0819268226623535, -0.9838739633560181, -0.8858211040496826, -0.7877681851387024, -0.6897153258323669, -0.5916624069213867, -0.49360954761505127, -0.3955566883087158, -0.2975037693977356, -0.19945091009140015, -0.1013980284333229, -0.0033451467752456665, 0.09470772743225098, 0.1927606165409088, 0.29081350564956665, 0.3888663649559021, 0.4869192838668823, 0.5849721431732178, 0.6830250024795532, 0.7810779213905334, 0.8791307806968689, 0.9771836996078491, 1.0752365589141846, 1.17328941822052, 1.2713422775268555, 1.3693952560424805, 1.467448115348816, 1.5655009746551514, 1.6635539531707764, 1.7616068124771118, 1.8596596717834473, 1.9577125310897827, 2.055765390396118, 2.153818130493164, 2.251871109008789, 2.349923849105835, 2.44797682762146, 2.546029567718506, 2.644082546234131, 2.742135524749756, 2.8401882648468018, 2.9382412433624268, 3.0362942218780518, 3.1343469619750977, 3.2323999404907227, 3.3304526805877686, 3.4285056591033936, 3.5265583992004395, 3.6246113777160645, 3.7226643562316895]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 2.0, 4.0, 9.0, 12.0, 11.0, 19.0, 19.0, 18.0, 21.0, 25.0, 23.0, 31.0, 33.0, 38.0, 39.0, 38.0, 46.0, 42.0, 40.0, 53.0, 55.0, 39.0, 49.0, 34.0, 30.0, 36.0, 26.0, 25.0, 28.0, 23.0, 20.0, 23.0, 11.0, 11.0, 15.0, 12.0, 6.0, 5.0, 2.0, 4.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4101009368896484, -1.361124873161316, -1.312148928642273, -1.2631728649139404, -1.2141969203948975, -1.165220856666565, -1.1162447929382324, -1.0672688484191895, -1.0182929039001465, -0.9693168997764587, -0.920340895652771, -0.8713648319244385, -0.8223888874053955, -0.773412823677063, -0.7244368195533752, -0.6754608154296875, -0.626484751701355, -0.5775087475776672, -0.5285327434539795, -0.47955670952796936, -0.4305807054042816, -0.38160470128059387, -0.33262866735458374, -0.283652663230896, -0.23467665910720825, -0.1857006549835205, -0.13672463595867157, -0.08774861693382263, -0.03877261281013489, 0.010203391313552856, 0.05917942523956299, 0.10815542936325073, 0.15713131427764893, 0.20610731840133667, 0.2550833225250244, 0.30405935645103455, 0.3530353605747223, 0.40201136469841003, 0.45098739862442017, 0.4999634027481079, 0.5489394068717957, 0.5979154109954834, 0.6468914151191711, 0.6958674192428589, 0.7448434829711914, 0.7938194274902344, 0.8427954912185669, 0.8917714953422546, 0.9407474994659424, 0.9897235035896301, 1.0386995077133179, 1.0876755714416504, 1.1366515159606934, 1.1856275796890259, 1.2346036434173584, 1.2835795879364014, 1.3325555324554443, 1.3815315961837769, 1.4305075407028198, 1.4794836044311523, 1.5284595489501953, 1.5774356126785278, 1.6264116764068604, 1.6753876209259033, 1.7243636846542358]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 4.0, 6.0, 7.0, 15.0, 25.0, 38.0, 36.0, 77.0, 116.0, 211.0, 366.0, 668.0, 1528.0, 3455.0, 8631.0, 26996.0, 106096.0, 408498.0, 364885.0, 89954.0, 23184.0, 7889.0, 3066.0, 1305.0, 628.0, 340.0, 176.0, 92.0, 78.0, 49.0, 37.0, 23.0, 19.0, 13.0, 9.0, 8.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.25432586669921875, -0.2452239990234375, -0.23612213134765625, -0.227020263671875, -0.21791839599609375, -0.2088165283203125, -0.19971466064453125, -0.19061279296875, -0.18151092529296875, -0.1724090576171875, -0.16330718994140625, -0.154205322265625, -0.14510345458984375, -0.1360015869140625, -0.12689971923828125, -0.1177978515625, -0.10869598388671875, -0.0995941162109375, -0.09049224853515625, -0.081390380859375, -0.07228851318359375, -0.0631866455078125, -0.05408477783203125, -0.04498291015625, -0.03588104248046875, -0.0267791748046875, -0.01767730712890625, -0.008575439453125, 0.00052642822265625, 0.0096282958984375, 0.01873016357421875, 0.02783203125, 0.03693389892578125, 0.0460357666015625, 0.05513763427734375, 0.064239501953125, 0.07334136962890625, 0.0824432373046875, 0.09154510498046875, 0.10064697265625, 0.10974884033203125, 0.1188507080078125, 0.12795257568359375, 0.137054443359375, 0.14615631103515625, 0.1552581787109375, 0.16436004638671875, 0.1734619140625, 0.18256378173828125, 0.1916656494140625, 0.20076751708984375, 0.209869384765625, 0.21897125244140625, 0.2280731201171875, 0.23717498779296875, 0.24627685546875, 0.25537872314453125, 0.2644805908203125, 0.27358245849609375, 0.282684326171875, 0.29178619384765625, 0.3008880615234375, 0.30998992919921875, 0.319091796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 2.0, 6.0, 7.0, 4.0, 16.0, 21.0, 18.0, 21.0, 21.0, 30.0, 34.0, 39.0, 35.0, 35.0, 52.0, 48.0, 47.0, 52.0, 50.0, 48.0, 50.0, 48.0, 41.0, 44.0, 32.0, 26.0, 28.0, 22.0, 14.0, 22.0, 17.0, 17.0, 11.0, 6.0, 6.0, 7.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0390625, -1.0032958984375, -0.967529296875, -0.9317626953125, -0.89599609375, -0.8602294921875, -0.824462890625, -0.7886962890625, -0.7529296875, -0.7171630859375, -0.681396484375, -0.6456298828125, -0.60986328125, -0.5740966796875, -0.538330078125, -0.5025634765625, -0.466796875, -0.4310302734375, -0.395263671875, -0.3594970703125, -0.32373046875, -0.2879638671875, -0.252197265625, -0.2164306640625, -0.1806640625, -0.1448974609375, -0.109130859375, -0.0733642578125, -0.03759765625, -0.0018310546875, 0.033935546875, 0.0697021484375, 0.10546875, 0.1412353515625, 0.177001953125, 0.2127685546875, 0.24853515625, 0.2843017578125, 0.320068359375, 0.3558349609375, 0.3916015625, 0.4273681640625, 0.463134765625, 0.4989013671875, 0.53466796875, 0.5704345703125, 0.606201171875, 0.6419677734375, 0.677734375, 0.7135009765625, 0.749267578125, 0.7850341796875, 0.82080078125, 0.8565673828125, 0.892333984375, 0.9281005859375, 0.9638671875, 0.9996337890625, 1.035400390625, 1.0711669921875, 1.10693359375, 1.1427001953125, 1.178466796875, 1.2142333984375, 1.25]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 6.0, 7.0, 21.0, 26.0, 40.0, 52.0, 91.0, 131.0, 205.0, 357.0, 659.0, 1393.0, 3220.0, 8832.0, 33451.0, 163752.0, 492601.0, 265962.0, 56182.0, 13643.0, 4302.0, 1715.0, 730.0, 440.0, 248.0, 187.0, 97.0, 57.0, 49.0, 24.0, 24.0, 17.0, 9.0, 2.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2464599609375, -0.23785972595214844, -0.22925949096679688, -0.2206592559814453, -0.21205902099609375, -0.2034587860107422, -0.19485855102539062, -0.18625831604003906, -0.1776580810546875, -0.16905784606933594, -0.16045761108398438, -0.1518573760986328, -0.14325714111328125, -0.1346569061279297, -0.12605667114257812, -0.11745643615722656, -0.108856201171875, -0.10025596618652344, -0.09165573120117188, -0.08305549621582031, -0.07445526123046875, -0.06585502624511719, -0.057254791259765625, -0.04865455627441406, -0.0400543212890625, -0.03145408630371094, -0.022853851318359375, -0.014253616333007812, -0.00565338134765625, 0.0029468536376953125, 0.011547088623046875, 0.020147323608398438, 0.02874755859375, 0.03734779357910156, 0.045948028564453125, 0.05454826354980469, 0.06314849853515625, 0.07174873352050781, 0.08034896850585938, 0.08894920349121094, 0.0975494384765625, 0.10614967346191406, 0.11474990844726562, 0.12335014343261719, 0.13195037841796875, 0.1405506134033203, 0.14915084838867188, 0.15775108337402344, 0.166351318359375, 0.17495155334472656, 0.18355178833007812, 0.1921520233154297, 0.20075225830078125, 0.2093524932861328, 0.21795272827148438, 0.22655296325683594, 0.2351531982421875, 0.24375343322753906, 0.2523536682128906, 0.2609539031982422, 0.26955413818359375, 0.2781543731689453, 0.2867546081542969, 0.29535484313964844, 0.303955078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 5.0, 5.0, 6.0, 11.0, 15.0, 13.0, 8.0, 18.0, 9.0, 21.0, 27.0, 30.0, 35.0, 37.0, 26.0, 51.0, 37.0, 41.0, 44.0, 46.0, 58.0, 39.0, 29.0, 35.0, 45.0, 29.0, 30.0, 36.0, 28.0, 19.0, 18.0, 21.0, 16.0, 10.0, 13.0, 10.0, 12.0, 6.0, 6.0, 15.0, 5.0, 7.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.09393310546875, -2.0277099609375, -1.96148681640625, -1.895263671875, -1.82904052734375, -1.7628173828125, -1.69659423828125, -1.63037109375, -1.56414794921875, -1.4979248046875, -1.43170166015625, -1.365478515625, -1.29925537109375, -1.2330322265625, -1.16680908203125, -1.1005859375, -1.03436279296875, -0.9681396484375, -0.90191650390625, -0.835693359375, -0.76947021484375, -0.7032470703125, -0.63702392578125, -0.57080078125, -0.50457763671875, -0.4383544921875, -0.37213134765625, -0.305908203125, -0.23968505859375, -0.1734619140625, -0.10723876953125, -0.041015625, 0.02520751953125, 0.0914306640625, 0.15765380859375, 0.223876953125, 0.29010009765625, 0.3563232421875, 0.42254638671875, 0.48876953125, 0.55499267578125, 0.6212158203125, 0.68743896484375, 0.753662109375, 0.81988525390625, 0.8861083984375, 0.95233154296875, 1.0185546875, 1.08477783203125, 1.1510009765625, 1.21722412109375, 1.283447265625, 1.34967041015625, 1.4158935546875, 1.48211669921875, 1.54833984375, 1.61456298828125, 1.6807861328125, 1.74700927734375, 1.813232421875, 1.87945556640625, 1.9456787109375, 2.01190185546875, 2.078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 15.0, 28.0, 31.0, 50.0, 66.0, 106.0, 189.0, 333.0, 645.0, 1379.0, 3352.0, 10236.0, 40243.0, 230384.0, 584235.0, 138243.0, 26624.0, 7355.0, 2703.0, 1093.0, 530.0, 249.0, 147.0, 80.0, 71.0, 42.0, 30.0, 26.0, 16.0, 18.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.1258544921875, -0.1225738525390625, -0.119293212890625, -0.1160125732421875, -0.11273193359375, -0.1094512939453125, -0.106170654296875, -0.1028900146484375, -0.099609375, -0.0963287353515625, -0.093048095703125, -0.0897674560546875, -0.08648681640625, -0.0832061767578125, -0.079925537109375, -0.0766448974609375, -0.0733642578125, -0.0700836181640625, -0.066802978515625, -0.0635223388671875, -0.06024169921875, -0.0569610595703125, -0.053680419921875, -0.0503997802734375, -0.047119140625, -0.0438385009765625, -0.040557861328125, -0.0372772216796875, -0.03399658203125, -0.0307159423828125, -0.027435302734375, -0.0241546630859375, -0.0208740234375, -0.0175933837890625, -0.014312744140625, -0.0110321044921875, -0.00775146484375, -0.0044708251953125, -0.001190185546875, 0.0020904541015625, 0.00537109375, 0.0086517333984375, 0.011932373046875, 0.0152130126953125, 0.01849365234375, 0.0217742919921875, 0.025054931640625, 0.0283355712890625, 0.0316162109375, 0.0348968505859375, 0.038177490234375, 0.0414581298828125, 0.04473876953125, 0.0480194091796875, 0.051300048828125, 0.0545806884765625, 0.057861328125, 0.0611419677734375, 0.064422607421875, 0.0677032470703125, 0.07098388671875, 0.0742645263671875, 0.077545166015625, 0.0808258056640625, 0.0841064453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 15.0, 13.0, 22.0, 27.0, 46.0, 48.0, 70.0, 84.0, 96.0, 105.0, 114.0, 77.0, 56.0, 53.0, 37.0, 31.0, 24.0, 13.0, 18.0, 8.0, 4.0, 10.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.324052810668945e-05, -6.123911589384079e-05, -5.9237703680992126e-05, -5.723629146814346e-05, -5.52348792552948e-05, -5.3233467042446136e-05, -5.123205482959747e-05, -4.923064261674881e-05, -4.7229230403900146e-05, -4.522781819105148e-05, -4.322640597820282e-05, -4.1224993765354156e-05, -3.922358155250549e-05, -3.722216933965683e-05, -3.5220757126808167e-05, -3.32193449139595e-05, -3.121793270111084e-05, -2.9216520488262177e-05, -2.7215108275413513e-05, -2.521369606256485e-05, -2.3212283849716187e-05, -2.1210871636867523e-05, -1.920945942401886e-05, -1.7208047211170197e-05, -1.5206634998321533e-05, -1.320522278547287e-05, -1.1203810572624207e-05, -9.202398359775543e-06, -7.20098614692688e-06, -5.1995739340782166e-06, -3.1981617212295532e-06, -1.1967495083808899e-06, 8.046627044677734e-07, 2.8060749173164368e-06, 4.8074871301651e-06, 6.8088993430137634e-06, 8.810311555862427e-06, 1.081172376871109e-05, 1.2813135981559753e-05, 1.4814548194408417e-05, 1.681596040725708e-05, 1.8817372620105743e-05, 2.0818784832954407e-05, 2.282019704580307e-05, 2.4821609258651733e-05, 2.6823021471500397e-05, 2.882443368434906e-05, 3.0825845897197723e-05, 3.282725811004639e-05, 3.482867032289505e-05, 3.683008253574371e-05, 3.883149474859238e-05, 4.083290696144104e-05, 4.28343191742897e-05, 4.483573138713837e-05, 4.683714359998703e-05, 4.883855581283569e-05, 5.083996802568436e-05, 5.284138023853302e-05, 5.484279245138168e-05, 5.684420466423035e-05, 5.884561687707901e-05, 6.084702908992767e-05, 6.284844130277634e-05, 6.4849853515625e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 9.0, 14.0, 13.0, 9.0, 13.0, 29.0, 41.0, 50.0, 62.0, 94.0, 139.0, 194.0, 343.0, 574.0, 1056.0, 2080.0, 4543.0, 11026.0, 34572.0, 143975.0, 497216.0, 264014.0, 58813.0, 17030.0, 6421.0, 2888.0, 1402.0, 742.0, 413.0, 248.0, 155.0, 102.0, 80.0, 42.0, 27.0, 31.0, 24.0, 20.0, 12.0, 13.0, 5.0, 2.0, 8.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09637451171875, -0.09323501586914062, -0.09009552001953125, -0.08695602416992188, -0.0838165283203125, -0.08067703247070312, -0.07753753662109375, -0.07439804077148438, -0.071258544921875, -0.06811904907226562, -0.06497955322265625, -0.061840057373046875, -0.0587005615234375, -0.055561065673828125, -0.05242156982421875, -0.049282073974609375, -0.046142578125, -0.043003082275390625, -0.03986358642578125, -0.036724090576171875, -0.0335845947265625, -0.030445098876953125, -0.02730560302734375, -0.024166107177734375, -0.021026611328125, -0.017887115478515625, -0.01474761962890625, -0.011608123779296875, -0.0084686279296875, -0.005329132080078125, -0.00218963623046875, 0.000949859619140625, 0.00408935546875, 0.007228851318359375, 0.01036834716796875, 0.013507843017578125, 0.0166473388671875, 0.019786834716796875, 0.02292633056640625, 0.026065826416015625, 0.029205322265625, 0.032344818115234375, 0.03548431396484375, 0.038623809814453125, 0.0417633056640625, 0.044902801513671875, 0.04804229736328125, 0.051181793212890625, 0.0543212890625, 0.057460784912109375, 0.06060028076171875, 0.06373977661132812, 0.0668792724609375, 0.07001876831054688, 0.07315826416015625, 0.07629776000976562, 0.079437255859375, 0.08257675170898438, 0.08571624755859375, 0.08885574340820312, 0.0919952392578125, 0.09513473510742188, 0.09827423095703125, 0.10141372680664062, 0.10455322265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 6.0, 4.0, 8.0, 8.0, 12.0, 9.0, 38.0, 37.0, 44.0, 41.0, 73.0, 94.0, 83.0, 83.0, 88.0, 82.0, 63.0, 51.0, 44.0, 29.0, 17.0, 26.0, 11.0, 6.0, 12.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0306854248046875, -0.0298919677734375, -0.0290985107421875, -0.0283050537109375, -0.0275115966796875, -0.0267181396484375, -0.0259246826171875, -0.0251312255859375, -0.0243377685546875, -0.0235443115234375, -0.0227508544921875, -0.0219573974609375, -0.0211639404296875, -0.0203704833984375, -0.0195770263671875, -0.0187835693359375, -0.0179901123046875, -0.0171966552734375, -0.0164031982421875, -0.0156097412109375, -0.0148162841796875, -0.0140228271484375, -0.0132293701171875, -0.0124359130859375, -0.0116424560546875, -0.0108489990234375, -0.0100555419921875, -0.0092620849609375, -0.0084686279296875, -0.0076751708984375, -0.0068817138671875, -0.0060882568359375, -0.0052947998046875, -0.0045013427734375, -0.0037078857421875, -0.0029144287109375, -0.0021209716796875, -0.0013275146484375, -0.0005340576171875, 0.0002593994140625, 0.0010528564453125, 0.0018463134765625, 0.0026397705078125, 0.0034332275390625, 0.0042266845703125, 0.0050201416015625, 0.0058135986328125, 0.0066070556640625, 0.0074005126953125, 0.0081939697265625, 0.0089874267578125, 0.0097808837890625, 0.0105743408203125, 0.0113677978515625, 0.0121612548828125, 0.0129547119140625, 0.0137481689453125, 0.0145416259765625, 0.0153350830078125, 0.0161285400390625, 0.0169219970703125, 0.0177154541015625, 0.0185089111328125, 0.0193023681640625, 0.0200958251953125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 9.0, 10.0, 23.0, 24.0, 35.0, 46.0, 56.0, 63.0, 94.0, 97.0, 88.0, 109.0, 86.0, 60.0, 55.0, 40.0, 23.0, 20.0, 18.0, 7.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6849658489227295, -1.6311278343200684, -1.5772899389266968, -1.5234519243240356, -1.4696139097213745, -1.415776014328003, -1.3619379997253418, -1.3080999851226807, -1.2542619705200195, -1.2004239559173584, -1.1465860605239868, -1.0927480459213257, -1.0389100313186646, -0.9850720763206482, -0.9312341213226318, -0.8773961067199707, -0.8235582113265991, -0.7697202563285828, -0.7158822417259216, -0.6620442867279053, -0.6082062721252441, -0.5543683171272278, -0.5005303621292114, -0.4466923773288727, -0.39285439252853394, -0.3390164077281952, -0.28517842292785645, -0.2313404679298401, -0.17750248312950134, -0.1236644983291626, -0.06982654333114624, -0.015988558530807495, 0.0378495454788208, 0.09168752282857895, 0.1455255001783371, 0.19936347007751465, 0.2532014548778534, 0.30703943967819214, 0.3608773946762085, 0.41471537947654724, 0.468553364276886, 0.5223913192749023, 0.5762293338775635, 0.6300672888755798, 0.6839052438735962, 0.7377432584762573, 0.7915812134742737, 0.84541916847229, 0.8992571830749512, 0.9530951380729675, 1.0069330930709839, 1.060771107673645, 1.1146091222763062, 1.1684470176696777, 1.2222850322723389, 1.276123046875, 1.3299610614776611, 1.3837990760803223, 1.4376369714736938, 1.491474986076355, 1.5453130006790161, 1.5991508960723877, 1.6529889106750488, 1.70682692527771, 1.7606648206710815]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 5.0, 5.0, 11.0, 17.0, 20.0, 23.0, 24.0, 17.0, 33.0, 35.0, 43.0, 42.0, 45.0, 49.0, 48.0, 57.0, 60.0, 53.0, 52.0, 47.0, 26.0, 44.0, 30.0, 28.0, 21.0, 22.0, 35.0, 16.0, 12.0, 11.0, 12.0, 9.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9726780652999878, -0.9380478858947754, -0.903417706489563, -0.8687874674797058, -0.8341572880744934, -0.799527108669281, -0.7648968696594238, -0.7302666902542114, -0.695636510848999, -0.6610063314437866, -0.6263761520385742, -0.591745913028717, -0.5571157336235046, -0.5224855542182922, -0.48785534501075745, -0.45322513580322266, -0.41859495639801025, -0.38396477699279785, -0.34933456778526306, -0.31470435857772827, -0.28007417917251587, -0.24544398486614227, -0.21081379055976868, -0.17618359625339508, -0.14155340194702148, -0.10692320764064789, -0.07229301333427429, -0.037662819027900696, -0.0030326247215270996, 0.0315975695848465, 0.06622776389122009, 0.10085795819759369, 0.13548815250396729, 0.17011834681034088, 0.20474854111671448, 0.23937873542308807, 0.27400892972946167, 0.3086391091346741, 0.34326931834220886, 0.37789952754974365, 0.41252970695495605, 0.44715988636016846, 0.48179009556770325, 0.516420304775238, 0.5510504841804504, 0.5856806635856628, 0.62031090259552, 0.6549410820007324, 0.6895712614059448, 0.7242014408111572, 0.7588316202163696, 0.7934618592262268, 0.8280920386314392, 0.8627222180366516, 0.8973524570465088, 0.9319826364517212, 0.9666128158569336, 1.001242995262146, 1.0358731746673584, 1.0705033540725708, 1.1051335334777832, 1.1397638320922852, 1.1743940114974976, 1.20902419090271, 1.2436543703079224]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 4.0, 11.0, 4.0, 17.0, 22.0, 29.0, 49.0, 44.0, 67.0, 121.0, 173.0, 299.0, 450.0, 811.0, 1467.0, 2864.0, 5878.0, 13789.0, 36316.0, 145395.0, 630537.0, 147493.0, 36434.0, 13689.0, 6064.0, 2866.0, 1504.0, 810.0, 462.0, 311.0, 193.0, 140.0, 65.0, 61.0, 33.0, 28.0, 14.0, 10.0, 8.0, 9.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6796875, -1.6227569580078125, -1.565826416015625, -1.5088958740234375, -1.45196533203125, -1.3950347900390625, -1.338104248046875, -1.2811737060546875, -1.2242431640625, -1.1673126220703125, -1.110382080078125, -1.0534515380859375, -0.99652099609375, -0.9395904541015625, -0.882659912109375, -0.8257293701171875, -0.768798828125, -0.7118682861328125, -0.654937744140625, -0.5980072021484375, -0.54107666015625, -0.4841461181640625, -0.427215576171875, -0.3702850341796875, -0.3133544921875, -0.2564239501953125, -0.199493408203125, -0.1425628662109375, -0.08563232421875, -0.0287017822265625, 0.028228759765625, 0.0851593017578125, 0.14208984375, 0.1990203857421875, 0.255950927734375, 0.3128814697265625, 0.36981201171875, 0.4267425537109375, 0.483673095703125, 0.5406036376953125, 0.5975341796875, 0.6544647216796875, 0.711395263671875, 0.7683258056640625, 0.82525634765625, 0.8821868896484375, 0.939117431640625, 0.9960479736328125, 1.052978515625, 1.1099090576171875, 1.166839599609375, 1.2237701416015625, 1.28070068359375, 1.3376312255859375, 1.394561767578125, 1.4514923095703125, 1.5084228515625, 1.5653533935546875, 1.622283935546875, 1.6792144775390625, 1.73614501953125, 1.7930755615234375, 1.850006103515625, 1.9069366455078125, 1.9638671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 9.0, 6.0, 12.0, 19.0, 21.0, 15.0, 28.0, 28.0, 33.0, 31.0, 38.0, 57.0, 57.0, 59.0, 52.0, 58.0, 49.0, 47.0, 50.0, 49.0, 30.0, 38.0, 28.0, 29.0, 26.0, 29.0, 23.0, 11.0, 5.0, 12.0, 5.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.34765625, -2.267669677734375, -2.18768310546875, -2.107696533203125, -2.0277099609375, -1.947723388671875, -1.86773681640625, -1.787750244140625, -1.707763671875, -1.627777099609375, -1.54779052734375, -1.467803955078125, -1.3878173828125, -1.307830810546875, -1.22784423828125, -1.147857666015625, -1.06787109375, -0.987884521484375, -0.90789794921875, -0.827911376953125, -0.7479248046875, -0.667938232421875, -0.58795166015625, -0.507965087890625, -0.427978515625, -0.347991943359375, -0.26800537109375, -0.188018798828125, -0.1080322265625, -0.028045654296875, 0.05194091796875, 0.131927490234375, 0.2119140625, 0.291900634765625, 0.37188720703125, 0.451873779296875, 0.5318603515625, 0.611846923828125, 0.69183349609375, 0.771820068359375, 0.851806640625, 0.931793212890625, 1.01177978515625, 1.091766357421875, 1.1717529296875, 1.251739501953125, 1.33172607421875, 1.411712646484375, 1.49169921875, 1.571685791015625, 1.65167236328125, 1.731658935546875, 1.8116455078125, 1.891632080078125, 1.97161865234375, 2.051605224609375, 2.131591796875, 2.211578369140625, 2.29156494140625, 2.371551513671875, 2.4515380859375, 2.531524658203125, 2.61151123046875, 2.691497802734375, 2.771484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 9.0, 6.0, 12.0, 20.0, 20.0, 42.0, 70.0, 107.0, 222.0, 548.0, 1752.0, 7510.0, 42669.0, 760811.0, 208594.0, 20208.0, 4091.0, 1091.0, 363.0, 157.0, 92.0, 46.0, 40.0, 24.0, 14.0, 9.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.28125, -4.173675537109375, -4.06610107421875, -3.958526611328125, -3.8509521484375, -3.743377685546875, -3.63580322265625, -3.528228759765625, -3.420654296875, -3.313079833984375, -3.20550537109375, -3.097930908203125, -2.9903564453125, -2.882781982421875, -2.77520751953125, -2.667633056640625, -2.56005859375, -2.452484130859375, -2.34490966796875, -2.237335205078125, -2.1297607421875, -2.022186279296875, -1.91461181640625, -1.807037353515625, -1.699462890625, -1.591888427734375, -1.48431396484375, -1.376739501953125, -1.2691650390625, -1.161590576171875, -1.05401611328125, -0.946441650390625, -0.8388671875, -0.731292724609375, -0.62371826171875, -0.516143798828125, -0.4085693359375, -0.300994873046875, -0.19342041015625, -0.085845947265625, 0.021728515625, 0.129302978515625, 0.23687744140625, 0.344451904296875, 0.4520263671875, 0.559600830078125, 0.66717529296875, 0.774749755859375, 0.88232421875, 0.989898681640625, 1.09747314453125, 1.205047607421875, 1.3126220703125, 1.420196533203125, 1.52777099609375, 1.635345458984375, 1.742919921875, 1.850494384765625, 1.95806884765625, 2.065643310546875, 2.1732177734375, 2.280792236328125, 2.38836669921875, 2.495941162109375, 2.603515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 7.0, 11.0, 15.0, 24.0, 16.0, 19.0, 18.0, 15.0, 17.0, 47.0, 40.0, 41.0, 45.0, 50.0, 66.0, 60.0, 69.0, 52.0, 43.0, 46.0, 49.0, 34.0, 38.0, 32.0, 24.0, 18.0, 15.0, 11.0, 15.0, 11.0, 6.0, 4.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.74609375, -3.634857177734375, -3.52362060546875, -3.412384033203125, -3.3011474609375, -3.189910888671875, -3.07867431640625, -2.967437744140625, -2.856201171875, -2.744964599609375, -2.63372802734375, -2.522491455078125, -2.4112548828125, -2.300018310546875, -2.18878173828125, -2.077545166015625, -1.96630859375, -1.855072021484375, -1.74383544921875, -1.632598876953125, -1.5213623046875, -1.410125732421875, -1.29888916015625, -1.187652587890625, -1.076416015625, -0.965179443359375, -0.85394287109375, -0.742706298828125, -0.6314697265625, -0.520233154296875, -0.40899658203125, -0.297760009765625, -0.1865234375, -0.075286865234375, 0.03594970703125, 0.147186279296875, 0.2584228515625, 0.369659423828125, 0.48089599609375, 0.592132568359375, 0.703369140625, 0.814605712890625, 0.92584228515625, 1.037078857421875, 1.1483154296875, 1.259552001953125, 1.37078857421875, 1.482025146484375, 1.59326171875, 1.704498291015625, 1.81573486328125, 1.926971435546875, 2.0382080078125, 2.149444580078125, 2.26068115234375, 2.371917724609375, 2.483154296875, 2.594390869140625, 2.70562744140625, 2.816864013671875, 2.9281005859375, 3.039337158203125, 3.15057373046875, 3.261810302734375, 3.373046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 6.0, 4.0, 18.0, 21.0, 29.0, 45.0, 96.0, 204.0, 644.0, 2165.0, 9775.0, 61268.0, 773860.0, 174144.0, 20389.0, 4136.0, 1048.0, 349.0, 142.0, 91.0, 32.0, 24.0, 18.0, 9.0, 6.0, 4.0, 10.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90576171875, -0.8788986206054688, -0.8520355224609375, -0.8251724243164062, -0.798309326171875, -0.7714462280273438, -0.7445831298828125, -0.7177200317382812, -0.69085693359375, -0.6639938354492188, -0.6371307373046875, -0.6102676391601562, -0.583404541015625, -0.5565414428710938, -0.5296783447265625, -0.5028152465820312, -0.4759521484375, -0.44908905029296875, -0.4222259521484375, -0.39536285400390625, -0.368499755859375, -0.34163665771484375, -0.3147735595703125, -0.28791046142578125, -0.26104736328125, -0.23418426513671875, -0.2073211669921875, -0.18045806884765625, -0.153594970703125, -0.12673187255859375, -0.0998687744140625, -0.07300567626953125, -0.046142578125, -0.01927947998046875, 0.0075836181640625, 0.03444671630859375, 0.061309814453125, 0.08817291259765625, 0.1150360107421875, 0.14189910888671875, 0.16876220703125, 0.19562530517578125, 0.2224884033203125, 0.24935150146484375, 0.276214599609375, 0.30307769775390625, 0.3299407958984375, 0.35680389404296875, 0.3836669921875, 0.41053009033203125, 0.4373931884765625, 0.46425628662109375, 0.491119384765625, 0.5179824829101562, 0.5448455810546875, 0.5717086791992188, 0.59857177734375, 0.6254348754882812, 0.6522979736328125, 0.6791610717773438, 0.706024169921875, 0.7328872680664062, 0.7597503662109375, 0.7866134643554688, 0.8134765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 12.0, 7.0, 10.0, 15.0, 26.0, 29.0, 45.0, 71.0, 78.0, 189.0, 171.0, 105.0, 62.0, 48.0, 32.0, 27.0, 22.0, 18.0, 4.0, 11.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001310110092163086, -0.000127376988530159, -0.0001237429678440094, -0.0001201089471578598, -0.0001164749264717102, -0.00011284090578556061, -0.00010920688509941101, -0.00010557286441326141, -0.00010193884372711182, -9.830482304096222e-05, -9.467080235481262e-05, -9.103678166866302e-05, -8.740276098251343e-05, -8.376874029636383e-05, -8.013471961021423e-05, -7.650069892406464e-05, -7.286667823791504e-05, -6.923265755176544e-05, -6.559863686561584e-05, -6.196461617946625e-05, -5.833059549331665e-05, -5.469657480716705e-05, -5.1062554121017456e-05, -4.742853343486786e-05, -4.379451274871826e-05, -4.0160492062568665e-05, -3.652647137641907e-05, -3.289245069026947e-05, -2.9258430004119873e-05, -2.5624409317970276e-05, -2.199038863182068e-05, -1.835636794567108e-05, -1.4722347259521484e-05, -1.1088326573371887e-05, -7.45430588722229e-06, -3.820285201072693e-06, -1.862645149230957e-07, 3.4477561712265015e-06, 7.081776857376099e-06, 1.0715797543525696e-05, 1.4349818229675293e-05, 1.798383891582489e-05, 2.1617859601974487e-05, 2.5251880288124084e-05, 2.888590097427368e-05, 3.251992166042328e-05, 3.6153942346572876e-05, 3.978796303272247e-05, 4.342198371887207e-05, 4.705600440502167e-05, 5.0690025091171265e-05, 5.432404577732086e-05, 5.795806646347046e-05, 6.159208714962006e-05, 6.522610783576965e-05, 6.886012852191925e-05, 7.249414920806885e-05, 7.612816989421844e-05, 7.976219058036804e-05, 8.339621126651764e-05, 8.703023195266724e-05, 9.066425263881683e-05, 9.429827332496643e-05, 9.793229401111603e-05, 0.00010156631469726562]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 4.0, 4.0, 14.0, 20.0, 24.0, 36.0, 61.0, 103.0, 178.0, 280.0, 611.0, 1197.0, 3072.0, 8887.0, 30303.0, 149372.0, 700751.0, 115535.0, 25411.0, 7645.0, 2739.0, 1142.0, 491.0, 280.0, 153.0, 84.0, 50.0, 31.0, 26.0, 21.0, 17.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55419921875, -0.533233642578125, -0.51226806640625, -0.491302490234375, -0.4703369140625, -0.449371337890625, -0.42840576171875, -0.407440185546875, -0.386474609375, -0.365509033203125, -0.34454345703125, -0.323577880859375, -0.3026123046875, -0.281646728515625, -0.26068115234375, -0.239715576171875, -0.21875, -0.197784423828125, -0.17681884765625, -0.155853271484375, -0.1348876953125, -0.113922119140625, -0.09295654296875, -0.071990966796875, -0.051025390625, -0.030059814453125, -0.00909423828125, 0.011871337890625, 0.0328369140625, 0.053802490234375, 0.07476806640625, 0.095733642578125, 0.11669921875, 0.137664794921875, 0.15863037109375, 0.179595947265625, 0.2005615234375, 0.221527099609375, 0.24249267578125, 0.263458251953125, 0.284423828125, 0.305389404296875, 0.32635498046875, 0.347320556640625, 0.3682861328125, 0.389251708984375, 0.41021728515625, 0.431182861328125, 0.4521484375, 0.473114013671875, 0.49407958984375, 0.515045166015625, 0.5360107421875, 0.556976318359375, 0.57794189453125, 0.598907470703125, 0.619873046875, 0.640838623046875, 0.66180419921875, 0.682769775390625, 0.7037353515625, 0.724700927734375, 0.74566650390625, 0.766632080078125, 0.78759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 10.0, 10.0, 10.0, 6.0, 15.0, 23.0, 21.0, 27.0, 31.0, 44.0, 76.0, 122.0, 161.0, 132.0, 99.0, 45.0, 39.0, 24.0, 24.0, 13.0, 11.0, 12.0, 14.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.425048828125, -0.41400909423828125, -0.4029693603515625, -0.39192962646484375, -0.380889892578125, -0.36985015869140625, -0.3588104248046875, -0.34777069091796875, -0.33673095703125, -0.32569122314453125, -0.3146514892578125, -0.30361175537109375, -0.292572021484375, -0.28153228759765625, -0.2704925537109375, -0.25945281982421875, -0.2484130859375, -0.23737335205078125, -0.2263336181640625, -0.21529388427734375, -0.204254150390625, -0.19321441650390625, -0.1821746826171875, -0.17113494873046875, -0.16009521484375, -0.14905548095703125, -0.1380157470703125, -0.12697601318359375, -0.115936279296875, -0.10489654541015625, -0.0938568115234375, -0.08281707763671875, -0.07177734375, -0.06073760986328125, -0.0496978759765625, -0.03865814208984375, -0.027618408203125, -0.01657867431640625, -0.0055389404296875, 0.00550079345703125, 0.01654052734375, 0.02758026123046875, 0.0386199951171875, 0.04965972900390625, 0.060699462890625, 0.07173919677734375, 0.0827789306640625, 0.09381866455078125, 0.1048583984375, 0.11589813232421875, 0.1269378662109375, 0.13797760009765625, 0.149017333984375, 0.16005706787109375, 0.1710968017578125, 0.18213653564453125, 0.19317626953125, 0.20421600341796875, 0.2152557373046875, 0.22629547119140625, 0.237335205078125, 0.24837493896484375, 0.2594146728515625, 0.27045440673828125, 0.281494140625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 15.0, 42.0, 66.0, 129.0, 176.0, 192.0, 164.0, 96.0, 53.0, 25.0, 19.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.952287197113037, -2.713155508041382, -2.4740238189697266, -2.234891891479492, -1.9957603216171265, -1.7566286325454712, -1.5174968242645264, -1.278365135192871, -1.0392334461212158, -0.8001017570495605, -0.5609700083732605, -0.32183825969696045, -0.08270657062530518, 0.1564251184463501, 0.3955569267272949, 0.6346886157989502, 0.8738203048706055, 1.1129519939422607, 1.352083683013916, 1.5912154912948608, 1.8303471803665161, 2.069478988647461, 2.308610677719116, 2.5477423667907715, 2.7868740558624268, 3.026005744934082, 3.2651374340057373, 3.5042691230773926, 3.743401050567627, 3.982532501220703, 4.2216644287109375, 4.460796356201172, 4.699928283691406, 4.939060211181641, 5.178191661834717, 5.417323589324951, 5.656455039978027, 5.895586967468262, 6.134718894958496, 6.373850345611572, 6.612981796264648, 6.852113723754883, 7.091245174407959, 7.330377101898193, 7.5695085525512695, 7.808640480041504, 8.047772407531738, 8.286903381347656, 8.52603530883789, 8.765167236328125, 9.00429916381836, 9.243430137634277, 9.482562065124512, 9.721693992614746, 9.96082592010498, 10.199956893920898, 10.43908977508545, 10.678221702575684, 10.917353630065918, 11.156484603881836, 11.39561653137207, 11.634748458862305, 11.873880386352539, 12.113012313842773, 12.352143287658691]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 5.0, 13.0, 4.0, 18.0, 16.0, 14.0, 24.0, 31.0, 20.0, 28.0, 31.0, 35.0, 39.0, 41.0, 48.0, 37.0, 30.0, 43.0, 40.0, 42.0, 40.0, 39.0, 30.0, 38.0, 33.0, 33.0, 35.0, 26.0, 18.0, 22.0, 18.0, 18.0, 12.0, 18.0, 9.0, 10.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-6.527335166931152, -6.350761413574219, -6.174187660217285, -5.997613906860352, -5.821040630340576, -5.644466876983643, -5.467893123626709, -5.291319370269775, -5.11474609375, -4.938172340393066, -4.761598587036133, -4.585024833679199, -4.408451557159424, -4.23187780380249, -4.055304050445557, -3.878730297088623, -3.7021565437316895, -3.525582790374756, -3.3490092754364014, -3.1724355220794678, -2.9958620071411133, -2.8192882537841797, -2.642714500427246, -2.4661407470703125, -2.289567232131958, -2.1129934787750244, -1.93641996383667, -1.7598462104797363, -1.5832725763320923, -1.4066989421844482, -1.2301251888275146, -1.0535515546798706, -0.8769774436950684, -0.7004038095474243, -0.5238301157951355, -0.3472564220428467, -0.17068278789520264, 0.005890846252441406, 0.182464599609375, 0.35903823375701904, 0.5356118679046631, 0.7121855020523071, 0.888759195804596, 1.0653328895568848, 1.2419065237045288, 1.4184801578521729, 1.5950539112091064, 1.7716275453567505, 1.9482011795043945, 2.124774932861328, 2.3013484477996826, 2.477922201156616, 2.6544957160949707, 2.8310694694519043, 3.007643222808838, 3.1842169761657715, 3.360790491104126, 3.5373642444610596, 3.713937759399414, 3.8905115127563477, 4.067085266113281, 4.243659019470215, 4.420232772827148, 4.596806049346924, 4.773379802703857]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 6.0, 9.0, 7.0, 21.0, 22.0, 16.0, 45.0, 50.0, 84.0, 116.0, 184.0, 370.0, 703.0, 1854.0, 5358.0, 21717.0, 269852.0, 3773701.0, 99776.0, 13849.0, 3799.0, 1354.0, 578.0, 280.0, 147.0, 94.0, 66.0, 53.0, 36.0, 27.0, 21.0, 16.0, 17.0, 11.0, 7.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.25390625, -4.13360595703125, -4.0133056640625, -3.89300537109375, -3.772705078125, -3.65240478515625, -3.5321044921875, -3.41180419921875, -3.29150390625, -3.17120361328125, -3.0509033203125, -2.93060302734375, -2.810302734375, -2.69000244140625, -2.5697021484375, -2.44940185546875, -2.3291015625, -2.20880126953125, -2.0885009765625, -1.96820068359375, -1.847900390625, -1.72760009765625, -1.6072998046875, -1.48699951171875, -1.36669921875, -1.24639892578125, -1.1260986328125, -1.00579833984375, -0.885498046875, -0.76519775390625, -0.6448974609375, -0.52459716796875, -0.404296875, -0.28399658203125, -0.1636962890625, -0.04339599609375, 0.076904296875, 0.19720458984375, 0.3175048828125, 0.43780517578125, 0.55810546875, 0.67840576171875, 0.7987060546875, 0.91900634765625, 1.039306640625, 1.15960693359375, 1.2799072265625, 1.40020751953125, 1.5205078125, 1.64080810546875, 1.7611083984375, 1.88140869140625, 2.001708984375, 2.12200927734375, 2.2423095703125, 2.36260986328125, 2.48291015625, 2.60321044921875, 2.7235107421875, 2.84381103515625, 2.964111328125, 3.08441162109375, 3.2047119140625, 3.32501220703125, 3.4453125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 12.0, 8.0, 9.0, 16.0, 18.0, 28.0, 28.0, 33.0, 37.0, 31.0, 42.0, 56.0, 34.0, 61.0, 62.0, 71.0, 73.0, 55.0, 41.0, 40.0, 38.0, 35.0, 29.0, 18.0, 20.0, 25.0, 18.0, 14.0, 10.0, 4.0, 10.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8184661865234375, -0.784393310546875, -0.7503204345703125, -0.71624755859375, -0.6821746826171875, -0.648101806640625, -0.6140289306640625, -0.5799560546875, -0.5458831787109375, -0.511810302734375, -0.4777374267578125, -0.44366455078125, -0.4095916748046875, -0.375518798828125, -0.3414459228515625, -0.307373046875, -0.2733001708984375, -0.239227294921875, -0.2051544189453125, -0.17108154296875, -0.1370086669921875, -0.102935791015625, -0.0688629150390625, -0.0347900390625, -0.0007171630859375, 0.033355712890625, 0.0674285888671875, 0.10150146484375, 0.1355743408203125, 0.169647216796875, 0.2037200927734375, 0.23779296875, 0.2718658447265625, 0.305938720703125, 0.3400115966796875, 0.37408447265625, 0.4081573486328125, 0.442230224609375, 0.4763031005859375, 0.5103759765625, 0.5444488525390625, 0.578521728515625, 0.6125946044921875, 0.64666748046875, 0.6807403564453125, 0.714813232421875, 0.7488861083984375, 0.782958984375, 0.8170318603515625, 0.851104736328125, 0.8851776123046875, 0.91925048828125, 0.9533233642578125, 0.987396240234375, 1.0214691162109375, 1.0555419921875, 1.0896148681640625, 1.123687744140625, 1.1577606201171875, 1.19183349609375, 1.2259063720703125, 1.259979248046875, 1.2940521240234375, 1.328125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 11.0, 8.0, 7.0, 11.0, 5.0, 17.0, 27.0, 33.0, 54.0, 57.0, 82.0, 152.0, 232.0, 524.0, 1387.0, 4825.0, 22037.0, 179211.0, 3489294.0, 447359.0, 38078.0, 7330.0, 1964.0, 714.0, 309.0, 167.0, 105.0, 76.0, 42.0, 36.0, 27.0, 25.0, 14.0, 14.0, 6.0, 8.0, 4.0, 9.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84375, -2.747833251953125, -2.65191650390625, -2.555999755859375, -2.4600830078125, -2.364166259765625, -2.26824951171875, -2.172332763671875, -2.076416015625, -1.980499267578125, -1.88458251953125, -1.788665771484375, -1.6927490234375, -1.596832275390625, -1.50091552734375, -1.404998779296875, -1.30908203125, -1.213165283203125, -1.11724853515625, -1.021331787109375, -0.9254150390625, -0.829498291015625, -0.73358154296875, -0.637664794921875, -0.541748046875, -0.445831298828125, -0.34991455078125, -0.253997802734375, -0.1580810546875, -0.062164306640625, 0.03375244140625, 0.129669189453125, 0.2255859375, 0.321502685546875, 0.41741943359375, 0.513336181640625, 0.6092529296875, 0.705169677734375, 0.80108642578125, 0.897003173828125, 0.992919921875, 1.088836669921875, 1.18475341796875, 1.280670166015625, 1.3765869140625, 1.472503662109375, 1.56842041015625, 1.664337158203125, 1.76025390625, 1.856170654296875, 1.95208740234375, 2.048004150390625, 2.1439208984375, 2.239837646484375, 2.33575439453125, 2.431671142578125, 2.527587890625, 2.623504638671875, 2.71942138671875, 2.815338134765625, 2.9112548828125, 3.007171630859375, 3.10308837890625, 3.199005126953125, 3.294921875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 10.0, 8.0, 15.0, 18.0, 16.0, 27.0, 43.0, 46.0, 65.0, 77.0, 127.0, 191.0, 270.0, 416.0, 586.0, 632.0, 463.0, 317.0, 216.0, 142.0, 102.0, 63.0, 58.0, 34.0, 34.0, 26.0, 13.0, 14.0, 13.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.673828125, -0.6547012329101562, -0.6355743408203125, -0.6164474487304688, -0.597320556640625, -0.5781936645507812, -0.5590667724609375, -0.5399398803710938, -0.52081298828125, -0.5016860961914062, -0.4825592041015625, -0.46343231201171875, -0.444305419921875, -0.42517852783203125, -0.4060516357421875, -0.38692474365234375, -0.3677978515625, -0.34867095947265625, -0.3295440673828125, -0.31041717529296875, -0.291290283203125, -0.27216339111328125, -0.2530364990234375, -0.23390960693359375, -0.21478271484375, -0.19565582275390625, -0.1765289306640625, -0.15740203857421875, -0.138275146484375, -0.11914825439453125, -0.1000213623046875, -0.08089447021484375, -0.061767578125, -0.04264068603515625, -0.0235137939453125, -0.00438690185546875, 0.014739990234375, 0.03386688232421875, 0.0529937744140625, 0.07212066650390625, 0.09124755859375, 0.11037445068359375, 0.1295013427734375, 0.14862823486328125, 0.167755126953125, 0.18688201904296875, 0.2060089111328125, 0.22513580322265625, 0.2442626953125, 0.26338958740234375, 0.2825164794921875, 0.30164337158203125, 0.320770263671875, 0.33989715576171875, 0.3590240478515625, 0.37815093994140625, 0.39727783203125, 0.41640472412109375, 0.4355316162109375, 0.45465850830078125, 0.473785400390625, 0.49291229248046875, 0.5120391845703125, 0.5311660766601562, 0.55029296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 11.0, 22.0, 24.0, 39.0, 53.0, 73.0, 77.0, 107.0, 102.0, 105.0, 90.0, 75.0, 67.0, 51.0, 37.0, 24.0, 12.0, 15.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5456047058105469, -1.4555232524871826, -1.3654416799545288, -1.2753602266311646, -1.1852786540985107, -1.0951972007751465, -1.0051157474517822, -0.9150342345237732, -0.8249527215957642, -0.7348712086677551, -0.6447896957397461, -0.5547082424163818, -0.4646267294883728, -0.37454521656036377, -0.2844637632369995, -0.19438225030899048, -0.10430073738098145, -0.014219239354133606, 0.07586225867271423, 0.16594374179840088, 0.2560252547264099, 0.34610676765441895, 0.4361882209777832, 0.5262697339057922, 0.6163512468338013, 0.7064327597618103, 0.7965142726898193, 0.8865957260131836, 0.9766772389411926, 1.0667587518692017, 1.156840205192566, 1.2469217777252197, 1.337003231048584, 1.4270846843719482, 1.517166256904602, 1.6072477102279663, 1.6973292827606201, 1.7874107360839844, 1.8774921894073486, 1.967573642730713, 2.0576553344726562, 2.1477367877960205, 2.2378182411193848, 2.327899932861328, 2.4179813861846924, 2.5080628395080566, 2.598144292831421, 2.688225746154785, 2.7783071994781494, 2.8683886528015137, 2.958470106124878, 3.048551559448242, 3.1386332511901855, 3.22871470451355, 3.318796157836914, 3.4088776111602783, 3.4989590644836426, 3.589040517807007, 3.679121971130371, 3.7692036628723145, 3.8592851161956787, 3.949366569519043, 4.039447784423828, 4.1295294761657715, 4.219611167907715]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 3.0, 1.0, 14.0, 12.0, 10.0, 13.0, 16.0, 19.0, 25.0, 20.0, 32.0, 24.0, 42.0, 35.0, 34.0, 37.0, 49.0, 35.0, 45.0, 43.0, 32.0, 37.0, 40.0, 44.0, 48.0, 36.0, 26.0, 23.0, 21.0, 28.0, 21.0, 21.0, 14.0, 20.0, 19.0, 9.0, 9.0, 9.0, 4.0, 5.0, 4.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3104372024536133, -1.2676371335983276, -1.224837064743042, -1.182037115097046, -1.1392370462417603, -1.0964369773864746, -1.053636908531189, -1.0108368396759033, -0.9680368304252625, -0.9252367615699768, -0.8824367523193359, -0.8396366834640503, -0.7968366146087646, -0.7540366053581238, -0.7112365365028381, -0.6684365272521973, -0.6256364583969116, -0.582836389541626, -0.5400363802909851, -0.49723631143569946, -0.4544362723827362, -0.41163623332977295, -0.3688361644744873, -0.32603612542152405, -0.2832360863685608, -0.24043604731559753, -0.19763599336147308, -0.15483593940734863, -0.11203590035438538, -0.06923586130142212, -0.026435792446136475, 0.016364246606826782, 0.05916416645050049, 0.10196421295404434, 0.1447642594575882, 0.18756431341171265, 0.2303643524646759, 0.27316439151763916, 0.3159644603729248, 0.35876449942588806, 0.4015645384788513, 0.4443645775318146, 0.48716461658477783, 0.5299646854400635, 0.5727647542953491, 0.61556476354599, 0.6583648324012756, 0.7011648416519165, 0.7439649105072021, 0.7867649793624878, 0.8295649886131287, 0.8723650574684143, 0.9151650667190552, 0.9579651355743408, 1.0007652044296265, 1.043565273284912, 1.0863652229309082, 1.1291652917861938, 1.1719653606414795, 1.2147653102874756, 1.2575653791427612, 1.3003654479980469, 1.3431655168533325, 1.3859655857086182, 1.4287656545639038]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 5.0, 9.0, 18.0, 31.0, 26.0, 42.0, 50.0, 84.0, 120.0, 201.0, 353.0, 904.0, 2613.0, 11545.0, 219890.0, 767297.0, 37614.0, 4966.0, 1484.0, 558.0, 258.0, 150.0, 99.0, 63.0, 57.0, 33.0, 21.0, 15.0, 12.0, 6.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47509765625, -0.45465850830078125, -0.4342193603515625, -0.41378021240234375, -0.393341064453125, -0.37290191650390625, -0.3524627685546875, -0.33202362060546875, -0.31158447265625, -0.29114532470703125, -0.2707061767578125, -0.25026702880859375, -0.229827880859375, -0.20938873291015625, -0.1889495849609375, -0.16851043701171875, -0.1480712890625, -0.12763214111328125, -0.1071929931640625, -0.08675384521484375, -0.066314697265625, -0.04587554931640625, -0.0254364013671875, -0.00499725341796875, 0.01544189453125, 0.03588104248046875, 0.0563201904296875, 0.07675933837890625, 0.097198486328125, 0.11763763427734375, 0.1380767822265625, 0.15851593017578125, 0.178955078125, 0.19939422607421875, 0.2198333740234375, 0.24027252197265625, 0.260711669921875, 0.28115081787109375, 0.3015899658203125, 0.32202911376953125, 0.34246826171875, 0.36290740966796875, 0.3833465576171875, 0.40378570556640625, 0.424224853515625, 0.44466400146484375, 0.4651031494140625, 0.48554229736328125, 0.5059814453125, 0.5264205932617188, 0.5468597412109375, 0.5672988891601562, 0.587738037109375, 0.6081771850585938, 0.6286163330078125, 0.6490554809570312, 0.66949462890625, 0.6899337768554688, 0.7103729248046875, 0.7308120727539062, 0.751251220703125, 0.7716903686523438, 0.7921295166015625, 0.8125686645507812, 0.8330078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 6.0, 9.0, 16.0, 16.0, 22.0, 21.0, 29.0, 46.0, 42.0, 48.0, 59.0, 61.0, 61.0, 61.0, 54.0, 54.0, 47.0, 54.0, 52.0, 40.0, 39.0, 26.0, 29.0, 20.0, 19.0, 21.0, 15.0, 7.0, 6.0, 8.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.70703125, -1.6634521484375, -1.619873046875, -1.5762939453125, -1.53271484375, -1.4891357421875, -1.445556640625, -1.4019775390625, -1.3583984375, -1.3148193359375, -1.271240234375, -1.2276611328125, -1.18408203125, -1.1405029296875, -1.096923828125, -1.0533447265625, -1.009765625, -0.9661865234375, -0.922607421875, -0.8790283203125, -0.83544921875, -0.7918701171875, -0.748291015625, -0.7047119140625, -0.6611328125, -0.6175537109375, -0.573974609375, -0.5303955078125, -0.48681640625, -0.4432373046875, -0.399658203125, -0.3560791015625, -0.3125, -0.2689208984375, -0.225341796875, -0.1817626953125, -0.13818359375, -0.0946044921875, -0.051025390625, -0.0074462890625, 0.0361328125, 0.0797119140625, 0.123291015625, 0.1668701171875, 0.21044921875, 0.2540283203125, 0.297607421875, 0.3411865234375, 0.384765625, 0.4283447265625, 0.471923828125, 0.5155029296875, 0.55908203125, 0.6026611328125, 0.646240234375, 0.6898193359375, 0.7333984375, 0.7769775390625, 0.820556640625, 0.8641357421875, 0.90771484375, 0.9512939453125, 0.994873046875, 1.0384521484375, 1.08203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 9.0, 10.0, 7.0, 17.0, 20.0, 32.0, 47.0, 57.0, 80.0, 111.0, 158.0, 266.0, 463.0, 849.0, 1633.0, 3487.0, 10094.0, 42902.0, 256105.0, 545857.0, 147708.0, 26215.0, 6728.0, 2609.0, 1244.0, 675.0, 410.0, 248.0, 166.0, 94.0, 73.0, 35.0, 57.0, 19.0, 11.0, 12.0, 5.0, 5.0, 10.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2534294128417969, -0.24416351318359375, -0.23489761352539062, -0.2256317138671875, -0.21636581420898438, -0.20709991455078125, -0.19783401489257812, -0.188568115234375, -0.17930221557617188, -0.17003631591796875, -0.16077041625976562, -0.1515045166015625, -0.14223861694335938, -0.13297271728515625, -0.12370681762695312, -0.11444091796875, -0.10517501831054688, -0.09590911865234375, -0.08664321899414062, -0.0773773193359375, -0.06811141967773438, -0.05884552001953125, -0.049579620361328125, -0.040313720703125, -0.031047821044921875, -0.02178192138671875, -0.012516021728515625, -0.0032501220703125, 0.006015777587890625, 0.01528167724609375, 0.024547576904296875, 0.0338134765625, 0.043079376220703125, 0.05234527587890625, 0.061611175537109375, 0.0708770751953125, 0.08014297485351562, 0.08940887451171875, 0.09867477416992188, 0.107940673828125, 0.11720657348632812, 0.12647247314453125, 0.13573837280273438, 0.1450042724609375, 0.15427017211914062, 0.16353607177734375, 0.17280197143554688, 0.18206787109375, 0.19133377075195312, 0.20059967041015625, 0.20986557006835938, 0.2191314697265625, 0.22839736938476562, 0.23766326904296875, 0.24692916870117188, 0.256195068359375, 0.2654609680175781, 0.27472686767578125, 0.2839927673339844, 0.2932586669921875, 0.3025245666503906, 0.31179046630859375, 0.3210563659667969, 0.330322265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 5.0, 6.0, 10.0, 15.0, 12.0, 9.0, 31.0, 26.0, 32.0, 43.0, 44.0, 57.0, 43.0, 61.0, 41.0, 42.0, 59.0, 52.0, 65.0, 41.0, 49.0, 42.0, 33.0, 40.0, 25.0, 20.0, 22.0, 20.0, 16.0, 10.0, 5.0, 10.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.64453125, -3.545074462890625, -3.44561767578125, -3.346160888671875, -3.2467041015625, -3.147247314453125, -3.04779052734375, -2.948333740234375, -2.848876953125, -2.749420166015625, -2.64996337890625, -2.550506591796875, -2.4510498046875, -2.351593017578125, -2.25213623046875, -2.152679443359375, -2.05322265625, -1.953765869140625, -1.85430908203125, -1.754852294921875, -1.6553955078125, -1.555938720703125, -1.45648193359375, -1.357025146484375, -1.257568359375, -1.158111572265625, -1.05865478515625, -0.959197998046875, -0.8597412109375, -0.760284423828125, -0.66082763671875, -0.561370849609375, -0.4619140625, -0.362457275390625, -0.26300048828125, -0.163543701171875, -0.0640869140625, 0.035369873046875, 0.13482666015625, 0.234283447265625, 0.333740234375, 0.433197021484375, 0.53265380859375, 0.632110595703125, 0.7315673828125, 0.831024169921875, 0.93048095703125, 1.029937744140625, 1.12939453125, 1.228851318359375, 1.32830810546875, 1.427764892578125, 1.5272216796875, 1.626678466796875, 1.72613525390625, 1.825592041015625, 1.925048828125, 2.024505615234375, 2.12396240234375, 2.223419189453125, 2.3228759765625, 2.422332763671875, 2.52178955078125, 2.621246337890625, 2.720703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 5.0, 7.0, 2.0, 4.0, 8.0, 24.0, 30.0, 63.0, 130.0, 289.0, 738.0, 1888.0, 7004.0, 41825.0, 737265.0, 235658.0, 17740.0, 3798.0, 1213.0, 456.0, 193.0, 96.0, 65.0, 27.0, 13.0, 11.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21435546875, -0.20801162719726562, -0.20166778564453125, -0.19532394409179688, -0.1889801025390625, -0.18263626098632812, -0.17629241943359375, -0.16994857788085938, -0.163604736328125, -0.15726089477539062, -0.15091705322265625, -0.14457321166992188, -0.1382293701171875, -0.13188552856445312, -0.12554168701171875, -0.11919784545898438, -0.11285400390625, -0.10651016235351562, -0.10016632080078125, -0.09382247924804688, -0.0874786376953125, -0.08113479614257812, -0.07479095458984375, -0.06844711303710938, -0.062103271484375, -0.055759429931640625, -0.04941558837890625, -0.043071746826171875, -0.0367279052734375, -0.030384063720703125, -0.02404022216796875, -0.017696380615234375, -0.0113525390625, -0.005008697509765625, 0.00133514404296875, 0.007678985595703125, 0.0140228271484375, 0.020366668701171875, 0.02671051025390625, 0.033054351806640625, 0.039398193359375, 0.045742034912109375, 0.05208587646484375, 0.058429718017578125, 0.0647735595703125, 0.07111740112304688, 0.07746124267578125, 0.08380508422851562, 0.09014892578125, 0.09649276733398438, 0.10283660888671875, 0.10918045043945312, 0.1155242919921875, 0.12186813354492188, 0.12821197509765625, 0.13455581665039062, 0.140899658203125, 0.14724349975585938, 0.15358734130859375, 0.15993118286132812, 0.1662750244140625, 0.17261886596679688, 0.17896270751953125, 0.18530654907226562, 0.191650390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 5.0, 13.0, 8.0, 22.0, 19.0, 31.0, 56.0, 71.0, 92.0, 117.0, 117.0, 109.0, 96.0, 83.0, 51.0, 31.0, 24.0, 17.0, 11.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.192922592163086e-05, -5.942676216363907e-05, -5.692429840564728e-05, -5.442183464765549e-05, -5.1919370889663696e-05, -4.9416907131671906e-05, -4.6914443373680115e-05, -4.4411979615688324e-05, -4.190951585769653e-05, -3.940705209970474e-05, -3.690458834171295e-05, -3.440212458372116e-05, -3.189966082572937e-05, -2.939719706773758e-05, -2.689473330974579e-05, -2.4392269551753998e-05, -2.1889805793762207e-05, -1.9387342035770416e-05, -1.6884878277778625e-05, -1.4382414519786835e-05, -1.1879950761795044e-05, -9.377487003803253e-06, -6.875023245811462e-06, -4.372559487819672e-06, -1.8700957298278809e-06, 6.323680281639099e-07, 3.1348317861557007e-06, 5.6372955441474915e-06, 8.139759302139282e-06, 1.0642223060131073e-05, 1.3144686818122864e-05, 1.5647150576114655e-05, 1.8149614334106445e-05, 2.0652078092098236e-05, 2.3154541850090027e-05, 2.5657005608081818e-05, 2.815946936607361e-05, 3.06619331240654e-05, 3.316439688205719e-05, 3.566686064004898e-05, 3.816932439804077e-05, 4.067178815603256e-05, 4.317425191402435e-05, 4.5676715672016144e-05, 4.8179179430007935e-05, 5.0681643187999725e-05, 5.3184106945991516e-05, 5.568657070398331e-05, 5.81890344619751e-05, 6.069149821996689e-05, 6.319396197795868e-05, 6.569642573595047e-05, 6.819888949394226e-05, 7.070135325193405e-05, 7.320381700992584e-05, 7.570628076791763e-05, 7.820874452590942e-05, 8.071120828390121e-05, 8.3213672041893e-05, 8.57161357998848e-05, 8.821859955787659e-05, 9.072106331586838e-05, 9.322352707386017e-05, 9.572599083185196e-05, 9.822845458984375e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 15.0, 22.0, 28.0, 51.0, 89.0, 170.0, 272.0, 522.0, 912.0, 1582.0, 3029.0, 5911.0, 12022.0, 29141.0, 90231.0, 340112.0, 393616.0, 109150.0, 33951.0, 13763.0, 6556.0, 3344.0, 1811.0, 993.0, 541.0, 277.0, 173.0, 109.0, 66.0, 28.0, 12.0, 18.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08135986328125, -0.07882308959960938, -0.07628631591796875, -0.07374954223632812, -0.0712127685546875, -0.06867599487304688, -0.06613922119140625, -0.06360244750976562, -0.061065673828125, -0.058528900146484375, -0.05599212646484375, -0.053455352783203125, -0.0509185791015625, -0.048381805419921875, -0.04584503173828125, -0.043308258056640625, -0.040771484375, -0.038234710693359375, -0.03569793701171875, -0.033161163330078125, -0.0306243896484375, -0.028087615966796875, -0.02555084228515625, -0.023014068603515625, -0.020477294921875, -0.017940521240234375, -0.01540374755859375, -0.012866973876953125, -0.0103302001953125, -0.007793426513671875, -0.00525665283203125, -0.002719879150390625, -0.00018310546875, 0.002353668212890625, 0.00489044189453125, 0.007427215576171875, 0.0099639892578125, 0.012500762939453125, 0.01503753662109375, 0.017574310302734375, 0.020111083984375, 0.022647857666015625, 0.02518463134765625, 0.027721405029296875, 0.0302581787109375, 0.032794952392578125, 0.03533172607421875, 0.037868499755859375, 0.0404052734375, 0.042942047119140625, 0.04547882080078125, 0.048015594482421875, 0.0505523681640625, 0.053089141845703125, 0.05562591552734375, 0.058162689208984375, 0.060699462890625, 0.06323623657226562, 0.06577301025390625, 0.06830978393554688, 0.0708465576171875, 0.07338333129882812, 0.07592010498046875, 0.07845687866210938, 0.08099365234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 8.0, 11.0, 21.0, 30.0, 42.0, 60.0, 94.0, 125.0, 152.0, 123.0, 110.0, 53.0, 35.0, 37.0, 22.0, 7.0, 11.0, 10.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.036590576171875, -0.035463809967041016, -0.03433704376220703, -0.03321027755737305, -0.03208351135253906, -0.030956745147705078, -0.029829978942871094, -0.02870321273803711, -0.027576446533203125, -0.02644968032836914, -0.025322914123535156, -0.024196147918701172, -0.023069381713867188, -0.021942615509033203, -0.02081584930419922, -0.019689083099365234, -0.01856231689453125, -0.017435550689697266, -0.01630878448486328, -0.015182018280029297, -0.014055252075195312, -0.012928485870361328, -0.011801719665527344, -0.01067495346069336, -0.009548187255859375, -0.00842142105102539, -0.007294654846191406, -0.006167888641357422, -0.0050411224365234375, -0.003914356231689453, -0.0027875900268554688, -0.0016608238220214844, -0.0005340576171875, 0.0005927085876464844, 0.0017194747924804688, 0.002846240997314453, 0.0039730072021484375, 0.005099773406982422, 0.006226539611816406, 0.007353305816650391, 0.008480072021484375, 0.00960683822631836, 0.010733604431152344, 0.011860370635986328, 0.012987136840820312, 0.014113903045654297, 0.015240669250488281, 0.016367435455322266, 0.01749420166015625, 0.018620967864990234, 0.01974773406982422, 0.020874500274658203, 0.022001266479492188, 0.023128032684326172, 0.024254798889160156, 0.02538156509399414, 0.026508331298828125, 0.02763509750366211, 0.028761863708496094, 0.029888629913330078, 0.031015396118164062, 0.03214216232299805, 0.03326892852783203, 0.034395694732666016, 0.0355224609375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 20.0, 24.0, 22.0, 51.0, 66.0, 71.0, 82.0, 101.0, 103.0, 96.0, 95.0, 64.0, 56.0, 47.0, 33.0, 17.0, 21.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0808062553405762, -1.0233845710754395, -0.9659629464149475, -0.9085413217544556, -0.8511196970939636, -0.7936980724334717, -0.736276388168335, -0.678854763507843, -0.6214331388473511, -0.5640115141868591, -0.5065898299217224, -0.44916820526123047, -0.3917465806007385, -0.3343249261379242, -0.27690327167510986, -0.21948164701461792, -0.1620599627494812, -0.10463832318782806, -0.04721667617559433, 0.010204970836639404, 0.06762661039829254, 0.12504824995994568, 0.18246990442276, 0.23989152908325195, 0.2973131835460663, 0.3547348380088806, 0.41215646266937256, 0.4695781171321869, 0.5269997715950012, 0.5844213962554932, 0.6418430805206299, 0.699264645576477, 0.7566863298416138, 0.8141079545021057, 0.8715296387672424, 0.9289512634277344, 0.9863728880882263, 1.0437945127487183, 1.101216197013855, 1.1586377620697021, 1.2160594463348389, 1.2734811305999756, 1.3309026956558228, 1.3883243799209595, 1.4457460641860962, 1.5031676292419434, 1.56058931350708, 1.6180109977722168, 1.6754326820373535, 1.7328543663024902, 1.7902759313583374, 1.8476976156234741, 1.9051192998886108, 1.962540864944458, 2.0199625492095947, 2.0773842334747314, 2.134805679321289, 2.192227363586426, 2.2496490478515625, 2.307070732116699, 2.364492177963257, 2.4219138622283936, 2.4793355464935303, 2.536757230758667, 2.5941789150238037]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 8.0, 16.0, 14.0, 13.0, 21.0, 25.0, 32.0, 42.0, 39.0, 55.0, 43.0, 51.0, 55.0, 67.0, 53.0, 58.0, 58.0, 52.0, 49.0, 33.0, 35.0, 31.0, 37.0, 21.0, 27.0, 16.0, 10.0, 12.0, 3.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3500936031341553, -1.3102937936782837, -1.2704938650131226, -1.230694055557251, -1.1908942461013794, -1.1510944366455078, -1.1112945079803467, -1.071494698524475, -1.0316948890686035, -0.9918950200080872, -0.9520952105522156, -0.9122953414916992, -0.8724955320358276, -0.8326956629753113, -0.7928957939147949, -0.7530959844589233, -0.713296115398407, -0.6734962463378906, -0.633696436882019, -0.5938965678215027, -0.5540967583656311, -0.5142968893051147, -0.4744970500469208, -0.4346972107887268, -0.39489737153053284, -0.35509753227233887, -0.3152976930141449, -0.2754978537559509, -0.23569799959659576, -0.1958981603384018, -0.15609830617904663, -0.11629846692085266, -0.07649862766265869, -0.03669878467917442, 0.003101058304309845, 0.04290090501308441, 0.08270074427127838, 0.12250058352947235, 0.16230043768882751, 0.20210027694702148, 0.24190011620521545, 0.2816999554634094, 0.3214997947216034, 0.36129963397979736, 0.4010995030403137, 0.4408993124961853, 0.48069918155670166, 0.5204989910125732, 0.5602988600730896, 0.600098729133606, 0.6398985385894775, 0.6796984076499939, 0.7194982171058655, 0.7592980861663818, 0.7990978956222534, 0.8388977646827698, 0.8786976337432861, 0.9184975028038025, 0.9582973122596741, 0.9980971813201904, 1.037896990776062, 1.0776968002319336, 1.1174967288970947, 1.1572965383529663, 1.197096347808838]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 4.0, 8.0, 16.0, 28.0, 46.0, 50.0, 87.0, 141.0, 222.0, 403.0, 721.0, 1463.0, 2760.0, 5858.0, 12809.0, 33046.0, 104302.0, 421887.0, 332861.0, 82939.0, 27581.0, 10859.0, 5055.0, 2532.0, 1291.0, 647.0, 374.0, 215.0, 133.0, 59.0, 53.0, 37.0, 19.0, 14.0, 17.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.9732666015625, -1.909423828125, -1.8455810546875, -1.78173828125, -1.7178955078125, -1.654052734375, -1.5902099609375, -1.5263671875, -1.4625244140625, -1.398681640625, -1.3348388671875, -1.27099609375, -1.2071533203125, -1.143310546875, -1.0794677734375, -1.015625, -0.9517822265625, -0.887939453125, -0.8240966796875, -0.76025390625, -0.6964111328125, -0.632568359375, -0.5687255859375, -0.5048828125, -0.4410400390625, -0.377197265625, -0.3133544921875, -0.24951171875, -0.1856689453125, -0.121826171875, -0.0579833984375, 0.005859375, 0.0697021484375, 0.133544921875, 0.1973876953125, 0.26123046875, 0.3250732421875, 0.388916015625, 0.4527587890625, 0.5166015625, 0.5804443359375, 0.644287109375, 0.7081298828125, 0.77197265625, 0.8358154296875, 0.899658203125, 0.9635009765625, 1.02734375, 1.0911865234375, 1.155029296875, 1.2188720703125, 1.28271484375, 1.3465576171875, 1.410400390625, 1.4742431640625, 1.5380859375, 1.6019287109375, 1.665771484375, 1.7296142578125, 1.79345703125, 1.8572998046875, 1.921142578125, 1.9849853515625, 2.048828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 10.0, 18.0, 15.0, 21.0, 14.0, 31.0, 38.0, 35.0, 30.0, 34.0, 35.0, 42.0, 56.0, 48.0, 57.0, 51.0, 50.0, 50.0, 39.0, 39.0, 35.0, 27.0, 35.0, 31.0, 28.0, 24.0, 15.0, 10.0, 15.0, 13.0, 9.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.90234375, -1.8438720703125, -1.785400390625, -1.7269287109375, -1.66845703125, -1.6099853515625, -1.551513671875, -1.4930419921875, -1.4345703125, -1.3760986328125, -1.317626953125, -1.2591552734375, -1.20068359375, -1.1422119140625, -1.083740234375, -1.0252685546875, -0.966796875, -0.9083251953125, -0.849853515625, -0.7913818359375, -0.73291015625, -0.6744384765625, -0.615966796875, -0.5574951171875, -0.4990234375, -0.4405517578125, -0.382080078125, -0.3236083984375, -0.26513671875, -0.2066650390625, -0.148193359375, -0.0897216796875, -0.03125, 0.0272216796875, 0.085693359375, 0.1441650390625, 0.20263671875, 0.2611083984375, 0.319580078125, 0.3780517578125, 0.4365234375, 0.4949951171875, 0.553466796875, 0.6119384765625, 0.67041015625, 0.7288818359375, 0.787353515625, 0.8458251953125, 0.904296875, 0.9627685546875, 1.021240234375, 1.0797119140625, 1.13818359375, 1.1966552734375, 1.255126953125, 1.3135986328125, 1.3720703125, 1.4305419921875, 1.489013671875, 1.5474853515625, 1.60595703125, 1.6644287109375, 1.722900390625, 1.7813720703125, 1.83984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 11.0, 15.0, 31.0, 28.0, 37.0, 67.0, 90.0, 129.0, 194.0, 351.0, 582.0, 1036.0, 1824.0, 3382.0, 6636.0, 13280.0, 29826.0, 74041.0, 218096.0, 425043.0, 166631.0, 59080.0, 24607.0, 11236.0, 5474.0, 2933.0, 1572.0, 879.0, 526.0, 319.0, 219.0, 125.0, 76.0, 63.0, 36.0, 32.0, 16.0, 11.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7001953125, -1.6521453857421875, -1.604095458984375, -1.5560455322265625, -1.50799560546875, -1.4599456787109375, -1.411895751953125, -1.3638458251953125, -1.3157958984375, -1.2677459716796875, -1.219696044921875, -1.1716461181640625, -1.12359619140625, -1.0755462646484375, -1.027496337890625, -0.9794464111328125, -0.931396484375, -0.8833465576171875, -0.835296630859375, -0.7872467041015625, -0.73919677734375, -0.6911468505859375, -0.643096923828125, -0.5950469970703125, -0.5469970703125, -0.4989471435546875, -0.450897216796875, -0.4028472900390625, -0.35479736328125, -0.3067474365234375, -0.258697509765625, -0.2106475830078125, -0.16259765625, -0.1145477294921875, -0.066497802734375, -0.0184478759765625, 0.02960205078125, 0.0776519775390625, 0.125701904296875, 0.1737518310546875, 0.2218017578125, 0.2698516845703125, 0.317901611328125, 0.3659515380859375, 0.41400146484375, 0.4620513916015625, 0.510101318359375, 0.5581512451171875, 0.606201171875, 0.6542510986328125, 0.702301025390625, 0.7503509521484375, 0.79840087890625, 0.8464508056640625, 0.894500732421875, 0.9425506591796875, 0.9906005859375, 1.0386505126953125, 1.086700439453125, 1.1347503662109375, 1.18280029296875, 1.2308502197265625, 1.278900146484375, 1.3269500732421875, 1.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 6.0, 5.0, 2.0, 12.0, 7.0, 11.0, 15.0, 14.0, 23.0, 28.0, 19.0, 30.0, 25.0, 36.0, 30.0, 31.0, 39.0, 41.0, 40.0, 46.0, 50.0, 56.0, 36.0, 52.0, 48.0, 42.0, 34.0, 30.0, 26.0, 25.0, 20.0, 20.0, 15.0, 12.0, 12.0, 8.0, 7.0, 11.0, 3.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0], "bins": [-2.8359375, -2.759490966796875, -2.68304443359375, -2.606597900390625, -2.5301513671875, -2.453704833984375, -2.37725830078125, -2.300811767578125, -2.224365234375, -2.147918701171875, -2.07147216796875, -1.995025634765625, -1.9185791015625, -1.842132568359375, -1.76568603515625, -1.689239501953125, -1.61279296875, -1.536346435546875, -1.45989990234375, -1.383453369140625, -1.3070068359375, -1.230560302734375, -1.15411376953125, -1.077667236328125, -1.001220703125, -0.924774169921875, -0.84832763671875, -0.771881103515625, -0.6954345703125, -0.618988037109375, -0.54254150390625, -0.466094970703125, -0.3896484375, -0.313201904296875, -0.23675537109375, -0.160308837890625, -0.0838623046875, -0.007415771484375, 0.06903076171875, 0.145477294921875, 0.221923828125, 0.298370361328125, 0.37481689453125, 0.451263427734375, 0.5277099609375, 0.604156494140625, 0.68060302734375, 0.757049560546875, 0.83349609375, 0.909942626953125, 0.98638916015625, 1.062835693359375, 1.1392822265625, 1.215728759765625, 1.29217529296875, 1.368621826171875, 1.445068359375, 1.521514892578125, 1.59796142578125, 1.674407958984375, 1.7508544921875, 1.827301025390625, 1.90374755859375, 1.980194091796875, 2.056640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 3.0, 8.0, 14.0, 23.0, 30.0, 31.0, 60.0, 111.0, 145.0, 258.0, 412.0, 548.0, 1043.0, 1696.0, 2798.0, 4905.0, 8576.0, 15474.0, 28666.0, 53365.0, 100313.0, 192965.0, 312652.0, 151032.0, 79202.0, 42182.0, 22788.0, 12500.0, 6848.0, 3914.0, 2297.0, 1383.0, 873.0, 523.0, 310.0, 191.0, 133.0, 89.0, 65.0, 27.0, 32.0, 24.0, 12.0, 5.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.271484375, -0.26357269287109375, -0.2556610107421875, -0.24774932861328125, -0.239837646484375, -0.23192596435546875, -0.2240142822265625, -0.21610260009765625, -0.20819091796875, -0.20027923583984375, -0.1923675537109375, -0.18445587158203125, -0.176544189453125, -0.16863250732421875, -0.1607208251953125, -0.15280914306640625, -0.1448974609375, -0.13698577880859375, -0.1290740966796875, -0.12116241455078125, -0.113250732421875, -0.10533905029296875, -0.0974273681640625, -0.08951568603515625, -0.08160400390625, -0.07369232177734375, -0.0657806396484375, -0.05786895751953125, -0.049957275390625, -0.04204559326171875, -0.0341339111328125, -0.02622222900390625, -0.018310546875, -0.01039886474609375, -0.0024871826171875, 0.00542449951171875, 0.013336181640625, 0.02124786376953125, 0.0291595458984375, 0.03707122802734375, 0.04498291015625, 0.05289459228515625, 0.0608062744140625, 0.06871795654296875, 0.076629638671875, 0.08454132080078125, 0.0924530029296875, 0.10036468505859375, 0.1082763671875, 0.11618804931640625, 0.1240997314453125, 0.13201141357421875, 0.139923095703125, 0.14783477783203125, 0.1557464599609375, 0.16365814208984375, 0.17156982421875, 0.17948150634765625, 0.1873931884765625, 0.19530487060546875, 0.203216552734375, 0.21112823486328125, 0.2190399169921875, 0.22695159912109375, 0.23486328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 8.0, 8.0, 22.0, 26.0, 21.0, 31.0, 31.0, 41.0, 46.0, 61.0, 67.0, 100.0, 116.0, 68.0, 62.0, 53.0, 42.0, 32.0, 28.0, 29.0, 18.0, 12.0, 16.0, 5.0, 11.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.00012564659118652344, -0.00012251641601324081, -0.00011938624083995819, -0.00011625606566667557, -0.00011312589049339294, -0.00010999571532011032, -0.0001068655401468277, -0.00010373536497354507, -0.00010060518980026245, -9.747501462697983e-05, -9.43448394536972e-05, -9.121466428041458e-05, -8.808448910713196e-05, -8.495431393384933e-05, -8.182413876056671e-05, -7.869396358728409e-05, -7.556378841400146e-05, -7.243361324071884e-05, -6.930343806743622e-05, -6.61732628941536e-05, -6.304308772087097e-05, -5.991291254758835e-05, -5.6782737374305725e-05, -5.36525622010231e-05, -5.052238702774048e-05, -4.7392211854457855e-05, -4.426203668117523e-05, -4.113186150789261e-05, -3.8001686334609985e-05, -3.487151116132736e-05, -3.174133598804474e-05, -2.8611160814762115e-05, -2.5480985641479492e-05, -2.235081046819687e-05, -1.9220635294914246e-05, -1.6090460121631622e-05, -1.2960284948348999e-05, -9.830109775066376e-06, -6.6999346017837524e-06, -3.569759428501129e-06, -4.3958425521850586e-07, 2.6905909180641174e-06, 5.820766091346741e-06, 8.950941264629364e-06, 1.2081116437911987e-05, 1.521129161119461e-05, 1.8341466784477234e-05, 2.1471641957759857e-05, 2.460181713104248e-05, 2.7731992304325104e-05, 3.086216747760773e-05, 3.399234265089035e-05, 3.7122517824172974e-05, 4.02526929974556e-05, 4.338286817073822e-05, 4.6513043344020844e-05, 4.964321851730347e-05, 5.277339369058609e-05, 5.590356886386871e-05, 5.903374403715134e-05, 6.216391921043396e-05, 6.529409438371658e-05, 6.84242695569992e-05, 7.155444473028183e-05, 7.468461990356445e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 10.0, 7.0, 12.0, 15.0, 24.0, 33.0, 46.0, 82.0, 108.0, 157.0, 202.0, 355.0, 536.0, 876.0, 1399.0, 2320.0, 4059.0, 7350.0, 14228.0, 28981.0, 62387.0, 139447.0, 351544.0, 235351.0, 103814.0, 46820.0, 22561.0, 11237.0, 5835.0, 3473.0, 1944.0, 1170.0, 754.0, 467.0, 344.0, 202.0, 121.0, 88.0, 52.0, 48.0, 36.0, 26.0, 14.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.393310546875, -0.3820152282714844, -0.37071990966796875, -0.3594245910644531, -0.3481292724609375, -0.3368339538574219, -0.32553863525390625, -0.3142433166503906, -0.302947998046875, -0.2916526794433594, -0.28035736083984375, -0.2690620422363281, -0.2577667236328125, -0.24647140502929688, -0.23517608642578125, -0.22388076782226562, -0.21258544921875, -0.20129013061523438, -0.18999481201171875, -0.17869949340820312, -0.1674041748046875, -0.15610885620117188, -0.14481353759765625, -0.13351821899414062, -0.122222900390625, -0.11092758178710938, -0.09963226318359375, -0.08833694458007812, -0.0770416259765625, -0.06574630737304688, -0.05445098876953125, -0.043155670166015625, -0.0318603515625, -0.020565032958984375, -0.00926971435546875, 0.002025604248046875, 0.0133209228515625, 0.024616241455078125, 0.03591156005859375, 0.047206878662109375, 0.058502197265625, 0.06979751586914062, 0.08109283447265625, 0.09238815307617188, 0.1036834716796875, 0.11497879028320312, 0.12627410888671875, 0.13756942749023438, 0.14886474609375, 0.16016006469726562, 0.17145538330078125, 0.18275070190429688, 0.1940460205078125, 0.20534133911132812, 0.21663665771484375, 0.22793197631835938, 0.239227294921875, 0.2505226135253906, 0.26181793212890625, 0.2731132507324219, 0.2844085693359375, 0.2957038879394531, 0.30699920654296875, 0.3182945251464844, 0.32958984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 2.0, 11.0, 10.0, 10.0, 15.0, 18.0, 22.0, 31.0, 33.0, 36.0, 42.0, 50.0, 72.0, 96.0, 93.0, 82.0, 51.0, 52.0, 49.0, 36.0, 29.0, 29.0, 28.0, 22.0, 15.0, 17.0, 9.0, 10.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.2469940185546875, -0.238616943359375, -0.2302398681640625, -0.22186279296875, -0.2134857177734375, -0.205108642578125, -0.1967315673828125, -0.1883544921875, -0.1799774169921875, -0.171600341796875, -0.1632232666015625, -0.15484619140625, -0.1464691162109375, -0.138092041015625, -0.1297149658203125, -0.121337890625, -0.1129608154296875, -0.104583740234375, -0.0962066650390625, -0.08782958984375, -0.0794525146484375, -0.071075439453125, -0.0626983642578125, -0.0543212890625, -0.0459442138671875, -0.037567138671875, -0.0291900634765625, -0.02081298828125, -0.0124359130859375, -0.004058837890625, 0.0043182373046875, 0.0126953125, 0.0210723876953125, 0.029449462890625, 0.0378265380859375, 0.04620361328125, 0.0545806884765625, 0.062957763671875, 0.0713348388671875, 0.0797119140625, 0.0880889892578125, 0.096466064453125, 0.1048431396484375, 0.11322021484375, 0.1215972900390625, 0.129974365234375, 0.1383514404296875, 0.146728515625, 0.1551055908203125, 0.163482666015625, 0.1718597412109375, 0.18023681640625, 0.1886138916015625, 0.196990966796875, 0.2053680419921875, 0.2137451171875, 0.2221221923828125, 0.230499267578125, 0.2388763427734375, 0.24725341796875, 0.2556304931640625, 0.264007568359375, 0.2723846435546875, 0.28076171875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 13.0, 13.0, 28.0, 29.0, 78.0, 78.0, 95.0, 138.0, 93.0, 126.0, 104.0, 70.0, 48.0, 36.0, 17.0, 10.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.894886016845703, -4.7289509773254395, -4.563016414642334, -4.39708137512207, -4.231146812438965, -4.065211772918701, -3.8992769718170166, -3.733342170715332, -3.5674073696136475, -3.401472568511963, -3.2355377674102783, -3.0696029663085938, -2.90366792678833, -2.7377333641052246, -2.571798324584961, -2.4058635234832764, -2.239928722381592, -2.0739939212799072, -1.9080591201782227, -1.7421241998672485, -1.576189398765564, -1.4102545976638794, -1.2443196773529053, -1.0783848762512207, -0.9124500751495361, -0.7465152740478516, -0.5805804133415222, -0.41464558243751526, -0.2487107515335083, -0.08277595043182373, 0.08315891027450562, 0.24909377098083496, 0.41502904891967773, 0.5809638500213623, 0.7468987107276917, 0.912833571434021, 1.0787683725357056, 1.2447031736373901, 1.4106380939483643, 1.5765728950500488, 1.7425076961517334, 1.908442497253418, 2.0743772983551025, 2.240312099456787, 2.406247138977051, 2.5721817016601562, 2.73811674118042, 2.9040515422821045, 3.069986343383789, 3.2359211444854736, 3.401855945587158, 3.5677907466888428, 3.7337255477905273, 3.899660587310791, 4.0655951499938965, 4.23153018951416, 4.397464752197266, 4.563399791717529, 4.729334354400635, 4.895269393920898, 5.061203956604004, 5.227138996124268, 5.393073558807373, 5.559008598327637, 5.7249436378479]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 7.0, 3.0, 6.0, 7.0, 8.0, 12.0, 15.0, 15.0, 17.0, 23.0, 16.0, 20.0, 14.0, 19.0, 28.0, 31.0, 39.0, 40.0, 29.0, 37.0, 44.0, 30.0, 37.0, 52.0, 32.0, 41.0, 35.0, 31.0, 30.0, 25.0, 28.0, 26.0, 24.0, 25.0, 22.0, 21.0, 17.0, 16.0, 17.0, 10.0, 17.0, 9.0, 5.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.084555625915527, -3.9525306224823, -3.8205056190490723, -3.6884806156158447, -3.556455612182617, -3.4244308471679688, -3.292405843734741, -3.1603808403015137, -3.028355836868286, -2.8963308334350586, -2.764305830001831, -2.6322808265686035, -2.500256061553955, -2.3682308197021484, -2.2362060546875, -2.1041810512542725, -1.972156047821045, -1.8401310443878174, -1.7081060409545898, -1.5760811567306519, -1.4440561532974243, -1.3120311498641968, -1.1800062656402588, -1.0479812622070312, -0.9159562587738037, -0.7839312553405762, -0.6519063115119934, -0.5198813676834106, -0.3878563642501831, -0.25583136081695557, -0.1238064169883728, 0.008218526840209961, 0.1402430534362793, 0.27226802706718445, 0.4042930006980896, 0.5363179445266724, 0.6683429479598999, 0.8003679513931274, 0.9323928952217102, 1.064417839050293, 1.1964428424835205, 1.328467845916748, 1.4604928493499756, 1.5925177335739136, 1.7245427370071411, 1.8565677404403687, 1.9885926246643066, 2.120617628097534, 2.2526426315307617, 2.3846676349639893, 2.516692638397217, 2.6487176418304443, 2.780742645263672, 2.9127674102783203, 3.044792413711548, 3.1768174171447754, 3.308842420578003, 3.4408674240112305, 3.572892427444458, 3.7049174308776855, 3.836942195892334, 3.9689674377441406, 4.100992202758789, 4.2330169677734375, 4.365042209625244]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 6.0, 12.0, 9.0, 12.0, 21.0, 31.0, 37.0, 42.0, 68.0, 77.0, 113.0, 129.0, 164.0, 212.0, 235.0, 313.0, 372.0, 431.0, 512.0, 587.0, 785.0, 1167.0, 1040670.0, 929.0, 670.0, 561.0, 449.0, 399.0, 323.0, 243.0, 193.0, 190.0, 122.0, 121.0, 97.0, 75.0, 55.0, 33.0, 28.0, 29.0, 19.0, 19.0, 9.0, 9.0, 7.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-4.427000045776367, -4.280395984649658, -4.133791923522949, -3.9871878623962402, -3.8405838012695312, -3.6939797401428223, -3.5473756790161133, -3.4007716178894043, -3.2541675567626953, -3.1075634956359863, -2.9609594345092773, -2.8143553733825684, -2.6677513122558594, -2.5211472511291504, -2.3745431900024414, -2.2279391288757324, -2.0813350677490234, -1.9347310066223145, -1.7881269454956055, -1.6415228843688965, -1.4949188232421875, -1.3483147621154785, -1.2017107009887695, -1.0551066398620605, -0.9085025787353516, -0.7618985176086426, -0.6152944564819336, -0.4686903953552246, -0.3220863342285156, -0.17548227310180664, -0.028878211975097656, 0.11772584915161133, 0.2643303871154785, 0.4109344482421875, 0.5575385093688965, 0.7041425704956055, 0.8507466316223145, 0.9973506927490234, 1.1439547538757324, 1.2905588150024414, 1.4371628761291504, 1.5837669372558594, 1.7303709983825684, 1.8769750595092773, 2.0235791206359863, 2.1701831817626953, 2.3167872428894043, 2.4633913040161133, 2.6099953651428223, 2.7565994262695312, 2.9032034873962402, 3.049807548522949, 3.196411609649658, 3.343015670776367, 3.489619731903076, 3.636223793029785, 3.782827854156494, 3.929431915283203, 4.076035976409912, 4.222640037536621, 4.36924409866333, 4.515848159790039, 4.662452220916748, 4.809056282043457, 4.955660343170166]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 9.0, 8.0, 11.0, 15.0, 35.0, 80.0, 155.0, 393.0, 1144.0, 3213.0, 9693.0, 51413792.0, 31560.0, 7211.0, 2556.0, 858.0, 317.0, 132.0, 63.0, 26.0, 21.0, 10.0, 7.0, 8.0, 5.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.18787384033203, -20.453519821166992, -19.719165802001953, -18.984811782836914, -18.250457763671875, -17.516103744506836, -16.781749725341797, -16.047395706176758, -15.313041687011719, -14.57868766784668, -13.84433364868164, -13.109979629516602, -12.375625610351562, -11.641271591186523, -10.906917572021484, -10.172563552856445, -9.438210487365723, -8.703856468200684, -7.9695024490356445, -7.2351484298706055, -6.500794410705566, -5.766440391540527, -5.0320868492126465, -4.297732830047607, -3.5633788108825684, -2.8290247917175293, -2.0946707725524902, -1.3603169918060303, -0.6259629726409912, 0.10839104652404785, 0.8427448272705078, 1.5770988464355469, 2.311452865600586, 3.045806884765625, 3.780160903930664, 4.514514923095703, 5.248868942260742, 5.983222961425781, 6.717576503753662, 7.451930522918701, 8.186285018920898, 8.920639038085938, 9.654993057250977, 10.389347076416016, 11.123701095581055, 11.858055114746094, 12.592409133911133, 13.326763153076172, 14.061116218566895, 14.795470237731934, 15.529824256896973, 16.264177322387695, 16.998531341552734, 17.732885360717773, 18.467239379882812, 19.20159339904785, 19.93594741821289, 20.67030143737793, 21.40465545654297, 22.139009475708008, 22.873363494873047, 23.607717514038086, 24.342071533203125, 25.076425552368164, 25.810779571533203]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 14.0, 6.0, 27.0, 35.0, 66.0, 69.0, 86.0, 151.0, 186.0, 302.0, 484.0, 759.0, 1212.0, 2023.0, 3615.0, 6101.0, 10912.0, 19809.0, 36960.0, 68946.0, 125730.0, 217430.0, 346115.0, 597760.0, 3375342.0, 621559.0, 349673.0, 222420.0, 127958.0, 70477.0, 37910.0, 20382.0, 11366.0, 6269.0, 3647.0, 2022.0, 1304.0, 796.0, 509.0, 339.0, 196.0, 129.0, 111.0, 83.0, 45.0, 31.0, 28.0, 15.0, 9.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.810546875, -0.7848281860351562, -0.7591094970703125, -0.7333908081054688, -0.707672119140625, -0.6819534301757812, -0.6562347412109375, -0.6305160522460938, -0.60479736328125, -0.5790786743164062, -0.5533599853515625, -0.5276412963867188, -0.501922607421875, -0.47620391845703125, -0.4504852294921875, -0.42476654052734375, -0.3990478515625, -0.37332916259765625, -0.3476104736328125, -0.32189178466796875, -0.296173095703125, -0.27045440673828125, -0.2447357177734375, -0.21901702880859375, -0.19329833984375, -0.16757965087890625, -0.1418609619140625, -0.11614227294921875, -0.090423583984375, -0.06470489501953125, -0.0389862060546875, -0.01326751708984375, 0.012451171875, 0.03816986083984375, 0.0638885498046875, 0.08960723876953125, 0.115325927734375, 0.14104461669921875, 0.1667633056640625, 0.19248199462890625, 0.21820068359375, 0.24391937255859375, 0.2696380615234375, 0.29535675048828125, 0.321075439453125, 0.34679412841796875, 0.3725128173828125, 0.39823150634765625, 0.4239501953125, 0.44966888427734375, 0.4753875732421875, 0.5011062622070312, 0.526824951171875, 0.5525436401367188, 0.5782623291015625, 0.6039810180664062, 0.62969970703125, 0.6554183959960938, 0.6811370849609375, 0.7068557739257812, 0.732574462890625, 0.7582931518554688, 0.7840118408203125, 0.8097305297851562, 0.83544921875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 9.0, 3.0, 5.0, 9.0, 18.0, 14.0, 16.0, 20.0, 15.0, 32.0, 33.0, 34.0, 51.0, 27.0, 46.0, 50.0, 35.0, 75.0, 956.0, 110.0, 48.0, 38.0, 48.0, 36.0, 26.0, 42.0, 33.0, 28.0, 14.0, 31.0, 22.0, 12.0, 18.0, 9.0, 7.0, 11.0, 7.0, 6.0, 4.0, 8.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9296875, -12.5203857421875, -12.111083984375, -11.7017822265625, -11.29248046875, -10.8831787109375, -10.473876953125, -10.0645751953125, -9.6552734375, -9.2459716796875, -8.836669921875, -8.4273681640625, -8.01806640625, -7.6087646484375, -7.199462890625, -6.7901611328125, -6.380859375, -5.9715576171875, -5.562255859375, -5.1529541015625, -4.74365234375, -4.3343505859375, -3.925048828125, -3.5157470703125, -3.1064453125, -2.6971435546875, -2.287841796875, -1.8785400390625, -1.46923828125, -1.0599365234375, -0.650634765625, -0.2413330078125, 0.16796875, 0.5772705078125, 0.986572265625, 1.3958740234375, 1.80517578125, 2.2144775390625, 2.623779296875, 3.0330810546875, 3.4423828125, 3.8516845703125, 4.260986328125, 4.6702880859375, 5.07958984375, 5.4888916015625, 5.898193359375, 6.3074951171875, 6.716796875, 7.1260986328125, 7.535400390625, 7.9447021484375, 8.35400390625, 8.7633056640625, 9.172607421875, 9.5819091796875, 9.9912109375, 10.4005126953125, 10.809814453125, 11.2191162109375, 11.62841796875, 12.0377197265625, 12.447021484375, 12.8563232421875, 13.265625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 2.0, 6.0, 7.0, 15.0, 15.0, 26.0, 38.0, 63.0, 111.0, 217.0, 471.0, 1082.0, 2590.0, 7117.0, 18970.0, 51129.0, 129822.0, 289793.0, 530696.0, 3646687.0, 845763.0, 419395.0, 207161.0, 87072.0, 33396.0, 12120.0, 4436.0, 1755.0, 774.0, 326.0, 160.0, 92.0, 58.0, 26.0, 16.0, 16.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.1201171875, -1.09393310546875, -1.0677490234375, -1.04156494140625, -1.015380859375, -0.98919677734375, -0.9630126953125, -0.93682861328125, -0.91064453125, -0.88446044921875, -0.8582763671875, -0.83209228515625, -0.805908203125, -0.77972412109375, -0.7535400390625, -0.72735595703125, -0.701171875, -0.67498779296875, -0.6488037109375, -0.62261962890625, -0.596435546875, -0.57025146484375, -0.5440673828125, -0.51788330078125, -0.49169921875, -0.46551513671875, -0.4393310546875, -0.41314697265625, -0.386962890625, -0.36077880859375, -0.3345947265625, -0.30841064453125, -0.2822265625, -0.25604248046875, -0.2298583984375, -0.20367431640625, -0.177490234375, -0.15130615234375, -0.1251220703125, -0.09893798828125, -0.07275390625, -0.04656982421875, -0.0203857421875, 0.00579833984375, 0.031982421875, 0.05816650390625, 0.0843505859375, 0.11053466796875, 0.13671875, 0.16290283203125, 0.1890869140625, 0.21527099609375, 0.241455078125, 0.26763916015625, 0.2938232421875, 0.32000732421875, 0.34619140625, 0.37237548828125, 0.3985595703125, 0.42474365234375, 0.450927734375, 0.47711181640625, 0.5032958984375, 0.52947998046875, 0.5556640625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 14.0, 14.0, 20.0, 23.0, 23.0, 33.0, 31.0, 34.0, 41.0, 47.0, 49.0, 46.0, 56.0, 729.0, 399.0, 42.0, 54.0, 48.0, 54.0, 42.0, 34.0, 34.0, 23.0, 24.0, 15.0, 23.0, 14.0, 17.0, 13.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.359375, -9.926025390625, -9.49267578125, -9.059326171875, -8.6259765625, -8.192626953125, -7.75927734375, -7.325927734375, -6.892578125, -6.459228515625, -6.02587890625, -5.592529296875, -5.1591796875, -4.725830078125, -4.29248046875, -3.859130859375, -3.42578125, -2.992431640625, -2.55908203125, -2.125732421875, -1.6923828125, -1.259033203125, -0.82568359375, -0.392333984375, 0.041015625, 0.474365234375, 0.90771484375, 1.341064453125, 1.7744140625, 2.207763671875, 2.64111328125, 3.074462890625, 3.5078125, 3.941162109375, 4.37451171875, 4.807861328125, 5.2412109375, 5.674560546875, 6.10791015625, 6.541259765625, 6.974609375, 7.407958984375, 7.84130859375, 8.274658203125, 8.7080078125, 9.141357421875, 9.57470703125, 10.008056640625, 10.44140625, 10.874755859375, 11.30810546875, 11.741455078125, 12.1748046875, 12.608154296875, 13.04150390625, 13.474853515625, 13.908203125, 14.341552734375, 14.77490234375, 15.208251953125, 15.6416015625, 16.074951171875, 16.50830078125, 16.941650390625, 17.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 8.0, 10.0, 13.0, 25.0, 43.0, 63.0, 90.0, 163.0, 203.0, 336.0, 553.0, 822.0, 1378.0, 2734.0, 5518.0, 14007.0, 44053.0, 204353.0, 4574113.0, 1228844.0, 155472.0, 36119.0, 11836.0, 4856.0, 2367.0, 1269.0, 780.0, 485.0, 311.0, 207.0, 133.0, 81.0, 50.0, 37.0, 26.0, 23.0, 5.0, 17.0, 6.0, 5.0, 8.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5712890625, -1.5129241943359375, -1.454559326171875, -1.3961944580078125, -1.33782958984375, -1.2794647216796875, -1.221099853515625, -1.1627349853515625, -1.1043701171875, -1.0460052490234375, -0.987640380859375, -0.9292755126953125, -0.87091064453125, -0.8125457763671875, -0.754180908203125, -0.6958160400390625, -0.637451171875, -0.5790863037109375, -0.520721435546875, -0.4623565673828125, -0.40399169921875, -0.3456268310546875, -0.287261962890625, -0.2288970947265625, -0.1705322265625, -0.1121673583984375, -0.053802490234375, 0.0045623779296875, 0.06292724609375, 0.1212921142578125, 0.179656982421875, 0.2380218505859375, 0.29638671875, 0.3547515869140625, 0.413116455078125, 0.4714813232421875, 0.52984619140625, 0.5882110595703125, 0.646575927734375, 0.7049407958984375, 0.7633056640625, 0.8216705322265625, 0.880035400390625, 0.9384002685546875, 0.99676513671875, 1.0551300048828125, 1.113494873046875, 1.1718597412109375, 1.230224609375, 1.2885894775390625, 1.346954345703125, 1.4053192138671875, 1.46368408203125, 1.5220489501953125, 1.580413818359375, 1.6387786865234375, 1.6971435546875, 1.7555084228515625, 1.813873291015625, 1.8722381591796875, 1.93060302734375, 1.9889678955078125, 2.047332763671875, 2.1056976318359375, 2.1640625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 7.0, 8.0, 7.0, 9.0, 6.0, 10.0, 9.0, 24.0, 27.0, 28.0, 33.0, 41.0, 36.0, 54.0, 56.0, 43.0, 40.0, 150.0, 986.0, 61.0, 49.0, 37.0, 49.0, 40.0, 35.0, 26.0, 29.0, 27.0, 28.0, 13.0, 19.0, 13.0, 5.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5078125, -12.07861328125, -11.6494140625, -11.22021484375, -10.791015625, -10.36181640625, -9.9326171875, -9.50341796875, -9.07421875, -8.64501953125, -8.2158203125, -7.78662109375, -7.357421875, -6.92822265625, -6.4990234375, -6.06982421875, -5.640625, -5.21142578125, -4.7822265625, -4.35302734375, -3.923828125, -3.49462890625, -3.0654296875, -2.63623046875, -2.20703125, -1.77783203125, -1.3486328125, -0.91943359375, -0.490234375, -0.06103515625, 0.3681640625, 0.79736328125, 1.2265625, 1.65576171875, 2.0849609375, 2.51416015625, 2.943359375, 3.37255859375, 3.8017578125, 4.23095703125, 4.66015625, 5.08935546875, 5.5185546875, 5.94775390625, 6.376953125, 6.80615234375, 7.2353515625, 7.66455078125, 8.09375, 8.52294921875, 8.9521484375, 9.38134765625, 9.810546875, 10.23974609375, 10.6689453125, 11.09814453125, 11.52734375, 11.95654296875, 12.3857421875, 12.81494140625, 13.244140625, 13.67333984375, 14.1025390625, 14.53173828125, 14.9609375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 10.0, 27.0, 58.0, 290.0, 361.0, 179.0, 45.0, 18.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.83673858642578, -38.67256164550781, -37.508384704589844, -36.34421157836914, -35.18003463745117, -34.0158576965332, -32.8516845703125, -31.68750762939453, -30.523330688476562, -29.359153747558594, -28.194978713989258, -27.030803680419922, -25.866626739501953, -24.702449798583984, -23.53827476501465, -22.374099731445312, -21.209922790527344, -20.045745849609375, -18.88157081604004, -17.717395782470703, -16.553218841552734, -15.389042854309082, -14.22486686706543, -13.060690879821777, -11.896514892578125, -10.732338905334473, -9.56816291809082, -8.403986930847168, -7.239810943603516, -6.075634956359863, -4.911458969116211, -3.7472829818725586, -2.583110809326172, -1.4189348220825195, -0.2547588348388672, 0.9094171524047852, 2.0735931396484375, 3.23776912689209, 4.401945114135742, 5.5661211013793945, 6.730297088623047, 7.894473075866699, 9.058649063110352, 10.222825050354004, 11.387001037597656, 12.551177024841309, 13.715353012084961, 14.879528999328613, 16.043704986572266, 17.207881927490234, 18.37205696105957, 19.536231994628906, 20.700408935546875, 21.864585876464844, 23.02876091003418, 24.192935943603516, 25.357112884521484, 26.521289825439453, 27.68546485900879, 28.849639892578125, 30.013816833496094, 31.177993774414062, 32.34217071533203, 33.506343841552734, 34.6705207824707]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 11.0, 13.0, 10.0, 19.0, 16.0, 39.0, 56.0, 54.0, 71.0, 96.0, 88.0, 103.0, 81.0, 83.0, 62.0, 45.0, 30.0, 33.0, 24.0, 17.0, 11.0, 14.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.75379180908203, -34.51516342163086, -33.27653121948242, -32.03790283203125, -30.799270629882812, -29.56064224243164, -28.322011947631836, -27.08338165283203, -25.844751358032227, -24.606121063232422, -23.367490768432617, -22.128860473632812, -20.89023208618164, -19.651599884033203, -18.41297149658203, -17.174341201782227, -15.935710906982422, -14.697080612182617, -13.458450317382812, -12.219820976257324, -10.98119068145752, -9.742560386657715, -8.503931045532227, -7.265300750732422, -6.026670455932617, -4.7880401611328125, -3.549410343170166, -2.3107802867889404, -1.0721502304077148, 0.16648006439208984, 1.4051098823547363, 2.643739700317383, 3.882373809814453, 5.121004104614258, 6.359633922576904, 7.598263740539551, 8.836894035339355, 10.07552433013916, 11.314153671264648, 12.552783966064453, 13.791414260864258, 15.030044555664062, 16.268674850463867, 17.507305145263672, 18.745933532714844, 19.98456573486328, 21.223194122314453, 22.461824417114258, 23.700454711914062, 24.939085006713867, 26.177715301513672, 27.416345596313477, 28.65497589111328, 29.893604278564453, 31.132234573364258, 32.37086486816406, 33.6094970703125, 34.84812545776367, 36.08675765991211, 37.32538604736328, 38.56401824951172, 39.80264663696289, 41.04127883911133, 42.2799072265625, 43.51853561401367]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 10.0, 20.0, 892.0, 1817.0, 2797.0, 6540.0, 39773.0, 3110763.0, 1000234.0, 25372.0, 3689.0, 1995.0, 295.0, 26.0, 18.0, 10.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.1486968994140625, -0.142730712890625, -0.1367645263671875, -0.13079833984375, -0.1248321533203125, -0.118865966796875, -0.1128997802734375, -0.10693359375, -0.1009674072265625, -0.095001220703125, -0.0890350341796875, -0.08306884765625, -0.0771026611328125, -0.071136474609375, -0.0651702880859375, -0.0592041015625, -0.0532379150390625, -0.047271728515625, -0.0413055419921875, -0.03533935546875, -0.0293731689453125, -0.023406982421875, -0.0174407958984375, -0.011474609375, -0.0055084228515625, 0.000457763671875, 0.0064239501953125, 0.01239013671875, 0.0183563232421875, 0.024322509765625, 0.0302886962890625, 0.0362548828125, 0.0422210693359375, 0.048187255859375, 0.0541534423828125, 0.06011962890625, 0.0660858154296875, 0.072052001953125, 0.0780181884765625, 0.083984375, 0.0899505615234375, 0.095916748046875, 0.1018829345703125, 0.10784912109375, 0.1138153076171875, 0.119781494140625, 0.1257476806640625, 0.1317138671875, 0.1376800537109375, 0.143646240234375, 0.1496124267578125, 0.15557861328125, 0.1615447998046875, 0.167510986328125, 0.1734771728515625, 0.179443359375, 0.1854095458984375, 0.191375732421875, 0.1973419189453125, 0.20330810546875, 0.2092742919921875, 0.215240478515625, 0.2212066650390625, 0.2271728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 9.0, 12.0, 18.0, 35.0, 41.0, 81.0, 147.0, 339.0, 132.0, 71.0, 40.0, 18.0, 16.0, 9.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1600341796875, -0.15440750122070312, -0.14878082275390625, -0.14315414428710938, -0.1375274658203125, -0.13190078735351562, -0.12627410888671875, -0.12064743041992188, -0.115020751953125, -0.10939407348632812, -0.10376739501953125, -0.09814071655273438, -0.0925140380859375, -0.08688735961914062, -0.08126068115234375, -0.07563400268554688, -0.07000732421875, -0.06438064575195312, -0.05875396728515625, -0.053127288818359375, -0.0475006103515625, -0.041873931884765625, -0.03624725341796875, -0.030620574951171875, -0.024993896484375, -0.019367218017578125, -0.01374053955078125, -0.008113861083984375, -0.0024871826171875, 0.003139495849609375, 0.00876617431640625, 0.014392852783203125, 0.02001953125, 0.025646209716796875, 0.03127288818359375, 0.036899566650390625, 0.0425262451171875, 0.048152923583984375, 0.05377960205078125, 0.059406280517578125, 0.065032958984375, 0.07065963745117188, 0.07628631591796875, 0.08191299438476562, 0.0875396728515625, 0.09316635131835938, 0.09879302978515625, 0.10441970825195312, 0.11004638671875, 0.11567306518554688, 0.12129974365234375, 0.12692642211914062, 0.1325531005859375, 0.13817977905273438, 0.14380645751953125, 0.14943313598632812, 0.155059814453125, 0.16068649291992188, 0.16631317138671875, 0.17193984985351562, 0.1775665283203125, 0.18319320678710938, 0.18881988525390625, 0.19444656372070312, 0.2000732421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 23.0, 32.0, 35.0, 48.0, 132.0, 408.0, 3295.0, 4181872.0, 7511.0, 567.0, 160.0, 70.0, 44.0, 22.0, 21.0, 8.0, 6.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31005859375, -0.29569244384765625, -0.2813262939453125, -0.26696014404296875, -0.252593994140625, -0.23822784423828125, -0.2238616943359375, -0.20949554443359375, -0.19512939453125, -0.18076324462890625, -0.1663970947265625, -0.15203094482421875, -0.137664794921875, -0.12329864501953125, -0.1089324951171875, -0.09456634521484375, -0.0802001953125, -0.06583404541015625, -0.0514678955078125, -0.03710174560546875, -0.022735595703125, -0.00836944580078125, 0.0059967041015625, 0.02036285400390625, 0.03472900390625, 0.04909515380859375, 0.0634613037109375, 0.07782745361328125, 0.092193603515625, 0.10655975341796875, 0.1209259033203125, 0.13529205322265625, 0.149658203125, 0.16402435302734375, 0.1783905029296875, 0.19275665283203125, 0.207122802734375, 0.22148895263671875, 0.2358551025390625, 0.25022125244140625, 0.26458740234375, 0.27895355224609375, 0.2933197021484375, 0.30768585205078125, 0.322052001953125, 0.33641815185546875, 0.3507843017578125, 0.36515045166015625, 0.3795166015625, 0.39388275146484375, 0.4082489013671875, 0.42261505126953125, 0.436981201171875, 0.45134735107421875, 0.4657135009765625, 0.48007965087890625, 0.49444580078125, 0.5088119506835938, 0.5231781005859375, 0.5375442504882812, 0.551910400390625, 0.5662765502929688, 0.5806427001953125, 0.5950088500976562, 0.609375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 10.0, 18.0, 28.0, 34.0, 28.0, 102.0, 217.0, 567.0, 1280.0, 960.0, 470.0, 168.0, 69.0, 41.0, 28.0, 23.0, 13.0, 7.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06317138671875, -0.060128211975097656, -0.05708503723144531, -0.05404186248779297, -0.050998687744140625, -0.04795551300048828, -0.04491233825683594, -0.041869163513183594, -0.03882598876953125, -0.035782814025878906, -0.03273963928222656, -0.02969646453857422, -0.026653289794921875, -0.02361011505126953, -0.020566940307617188, -0.017523765563964844, -0.0144805908203125, -0.011437416076660156, -0.008394241333007812, -0.005351066589355469, -0.002307891845703125, 0.0007352828979492188, 0.0037784576416015625, 0.006821632385253906, 0.00986480712890625, 0.012907981872558594, 0.015951156616210938, 0.01899433135986328, 0.022037506103515625, 0.02508068084716797, 0.028123855590820312, 0.031167030334472656, 0.034210205078125, 0.037253379821777344, 0.04029655456542969, 0.04333972930908203, 0.046382904052734375, 0.04942607879638672, 0.05246925354003906, 0.055512428283691406, 0.05855560302734375, 0.061598777770996094, 0.06464195251464844, 0.06768512725830078, 0.07072830200195312, 0.07377147674560547, 0.07681465148925781, 0.07985782623291016, 0.0829010009765625, 0.08594417572021484, 0.08898735046386719, 0.09203052520751953, 0.09507369995117188, 0.09811687469482422, 0.10116004943847656, 0.1042032241821289, 0.10724639892578125, 0.1102895736694336, 0.11333274841308594, 0.11637592315673828, 0.11941909790039062, 0.12246227264404297, 0.1255054473876953, 0.12854862213134766, 0.131591796875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 25.0, 848.0, 142.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.639014720916748, -2.5812911987304688, -2.5235679149627686, -2.4658443927764893, -2.40812087059021, -2.3503975868225098, -2.2926740646362305, -2.234950542449951, -2.177227258682251, -2.1195037364959717, -2.0617804527282715, -2.004056930541992, -1.9463335275650024, -1.8886101245880127, -1.8308866024017334, -1.7731631994247437, -1.7154396772384644, -1.6577162742614746, -1.5999927520751953, -1.5422693490982056, -1.4845459461212158, -1.4268224239349365, -1.3690990209579468, -1.311375617980957, -1.2536520957946777, -1.195928692817688, -1.1382051706314087, -1.080481767654419, -1.0227583646774292, -0.9650349020957947, -0.9073114395141602, -0.8495880365371704, -0.7918646335601807, -0.7341411709785461, -0.6764177680015564, -0.6186943054199219, -0.5609709024429321, -0.5032474398612976, -0.4455239772796631, -0.38780054450035095, -0.3300771117210388, -0.2723536789417267, -0.21463023126125336, -0.15690678358078003, -0.0991833508014679, -0.04145991802215576, 0.01626354455947876, 0.0739869773387909, 0.13171041011810303, 0.18943384289741516, 0.2471572905778885, 0.3048807382583618, 0.36260417103767395, 0.4203276038169861, 0.4780510663986206, 0.5357744693756104, 0.5934979319572449, 0.6512213945388794, 0.7089447975158691, 0.7666682600975037, 0.8243917226791382, 0.8821151256561279, 0.9398385882377625, 0.997562050819397, 1.0552854537963867]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 10.0, 9.0, 12.0, 19.0, 17.0, 24.0, 20.0, 34.0, 28.0, 43.0, 38.0, 39.0, 48.0, 46.0, 41.0, 46.0, 47.0, 53.0, 44.0, 44.0, 46.0, 51.0, 37.0, 23.0, 34.0, 20.0, 20.0, 18.0, 15.0, 14.0, 14.0, 12.0, 12.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1742118000984192, -0.16894155740737915, -0.1636713296175003, -0.15840108692646027, -0.15313085913658142, -0.14786061644554138, -0.14259037375450134, -0.1373201459646225, -0.13204991817474365, -0.1267796754837036, -0.12150944769382477, -0.11623920500278473, -0.11096897721290588, -0.10569873452186584, -0.1004284992814064, -0.09515826404094696, -0.08988802134990692, -0.08461778610944748, -0.07934755086898804, -0.074077308177948, -0.06880708038806915, -0.06353683769702911, -0.05826660245656967, -0.05299636721611023, -0.04772613197565079, -0.042455896735191345, -0.0371856614947319, -0.03191542252898216, -0.02664518728852272, -0.021374952048063278, -0.016104713082313538, -0.010834477841854095, -0.005564242601394653, -0.00029400642961263657, 0.00497622974216938, 0.010246466845273972, 0.015516702085733414, 0.020786937326192856, 0.026057176291942596, 0.03132741153240204, 0.03659764677286148, 0.04186788201332092, 0.047138117253780365, 0.052408356219530106, 0.05767859145998955, 0.06294882297515869, 0.06821906566619873, 0.07348930090665817, 0.07875953614711761, 0.08402977138757706, 0.0893000066280365, 0.09457024931907654, 0.09984047710895538, 0.10511071979999542, 0.11038095504045486, 0.1156511902809143, 0.12092142552137375, 0.1261916607618332, 0.13146190345287323, 0.13673213124275208, 0.14200237393379211, 0.14727260172367096, 0.152542844414711, 0.15781307220458984, 0.16308331489562988]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 20.0, 6.0, 13.0, 13.0, 28.0, 33.0, 42.0, 61.0, 70.0, 110.0, 183.0, 232.0, 443.0, 848.0, 1980.0, 5429.0, 26903.0, 918887.0, 78919.0, 8975.0, 2687.0, 1090.0, 566.0, 355.0, 203.0, 119.0, 91.0, 63.0, 42.0, 26.0, 28.0, 14.0, 15.0, 11.0, 9.0, 8.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.935546875, -0.9029388427734375, -0.870330810546875, -0.8377227783203125, -0.80511474609375, -0.7725067138671875, -0.739898681640625, -0.7072906494140625, -0.6746826171875, -0.6420745849609375, -0.609466552734375, -0.5768585205078125, -0.54425048828125, -0.5116424560546875, -0.479034423828125, -0.4464263916015625, -0.413818359375, -0.3812103271484375, -0.348602294921875, -0.3159942626953125, -0.28338623046875, -0.2507781982421875, -0.218170166015625, -0.1855621337890625, -0.1529541015625, -0.1203460693359375, -0.087738037109375, -0.0551300048828125, -0.02252197265625, 0.0100860595703125, 0.042694091796875, 0.0753021240234375, 0.10791015625, 0.1405181884765625, 0.173126220703125, 0.2057342529296875, 0.23834228515625, 0.2709503173828125, 0.303558349609375, 0.3361663818359375, 0.3687744140625, 0.4013824462890625, 0.433990478515625, 0.4665985107421875, 0.49920654296875, 0.5318145751953125, 0.564422607421875, 0.5970306396484375, 0.629638671875, 0.6622467041015625, 0.694854736328125, 0.7274627685546875, 0.76007080078125, 0.7926788330078125, 0.825286865234375, 0.8578948974609375, 0.8905029296875, 0.9231109619140625, 0.955718994140625, 0.9883270263671875, 1.02093505859375, 1.0535430908203125, 1.086151123046875, 1.1187591552734375, 1.1513671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 6.0, 15.0, 16.0, 33.0, 45.0, 71.0, 148.0, 349.0, 130.0, 74.0, 43.0, 16.0, 13.0, 9.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16455078125, -0.1587677001953125, -0.152984619140625, -0.1472015380859375, -0.14141845703125, -0.1356353759765625, -0.129852294921875, -0.1240692138671875, -0.1182861328125, -0.1125030517578125, -0.106719970703125, -0.1009368896484375, -0.09515380859375, -0.0893707275390625, -0.083587646484375, -0.0778045654296875, -0.072021484375, -0.0662384033203125, -0.060455322265625, -0.0546722412109375, -0.04888916015625, -0.0431060791015625, -0.037322998046875, -0.0315399169921875, -0.0257568359375, -0.0199737548828125, -0.014190673828125, -0.0084075927734375, -0.00262451171875, 0.0031585693359375, 0.008941650390625, 0.0147247314453125, 0.0205078125, 0.0262908935546875, 0.032073974609375, 0.0378570556640625, 0.04364013671875, 0.0494232177734375, 0.055206298828125, 0.0609893798828125, 0.0667724609375, 0.0725555419921875, 0.078338623046875, 0.0841217041015625, 0.08990478515625, 0.0956878662109375, 0.101470947265625, 0.1072540283203125, 0.113037109375, 0.1188201904296875, 0.124603271484375, 0.1303863525390625, 0.13616943359375, 0.1419525146484375, 0.147735595703125, 0.1535186767578125, 0.1593017578125, 0.1650848388671875, 0.170867919921875, 0.1766510009765625, 0.18243408203125, 0.1882171630859375, 0.194000244140625, 0.1997833251953125, 0.20556640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 10.0, 5.0, 9.0, 10.0, 11.0, 19.0, 25.0, 19.0, 24.0, 42.0, 58.0, 60.0, 74.0, 99.0, 129.0, 158.0, 298.0, 502.0, 1082.0, 3567.0, 17496.0, 118066.0, 580559.0, 276644.0, 39093.0, 6949.0, 1672.0, 678.0, 325.0, 215.0, 143.0, 117.0, 79.0, 64.0, 55.0, 32.0, 36.0, 26.0, 23.0, 11.0, 16.0, 7.0, 15.0, 7.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.2249755859375, -0.2176513671875, -0.2103271484375, -0.2030029296875, -0.1956787109375, -0.1883544921875, -0.1810302734375, -0.1737060546875, -0.1663818359375, -0.1590576171875, -0.1517333984375, -0.1444091796875, -0.1370849609375, -0.1297607421875, -0.1224365234375, -0.1151123046875, -0.1077880859375, -0.1004638671875, -0.0931396484375, -0.0858154296875, -0.0784912109375, -0.0711669921875, -0.0638427734375, -0.0565185546875, -0.0491943359375, -0.0418701171875, -0.0345458984375, -0.0272216796875, -0.0198974609375, -0.0125732421875, -0.0052490234375, 0.0020751953125, 0.0093994140625, 0.0167236328125, 0.0240478515625, 0.0313720703125, 0.0386962890625, 0.0460205078125, 0.0533447265625, 0.0606689453125, 0.0679931640625, 0.0753173828125, 0.0826416015625, 0.0899658203125, 0.0972900390625, 0.1046142578125, 0.1119384765625, 0.1192626953125, 0.1265869140625, 0.1339111328125, 0.1412353515625, 0.1485595703125, 0.1558837890625, 0.1632080078125, 0.1705322265625, 0.1778564453125, 0.1851806640625, 0.1925048828125, 0.1998291015625, 0.2071533203125, 0.2144775390625, 0.2218017578125, 0.2291259765625, 0.2364501953125, 0.2437744140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 3.0, 1.0, 7.0, 3.0, 9.0, 15.0, 13.0, 21.0, 20.0, 20.0, 15.0, 34.0, 25.0, 34.0, 28.0, 39.0, 34.0, 41.0, 40.0, 38.0, 28.0, 36.0, 57.0, 38.0, 39.0, 25.0, 37.0, 31.0, 29.0, 38.0, 32.0, 33.0, 25.0, 18.0, 17.0, 11.0, 16.0, 12.0, 7.0, 9.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1937255859375, -0.18821144104003906, -0.18269729614257812, -0.1771831512451172, -0.17166900634765625, -0.1661548614501953, -0.16064071655273438, -0.15512657165527344, -0.1496124267578125, -0.14409828186035156, -0.13858413696289062, -0.1330699920654297, -0.12755584716796875, -0.12204170227050781, -0.11652755737304688, -0.11101341247558594, -0.105499267578125, -0.09998512268066406, -0.09447097778320312, -0.08895683288574219, -0.08344268798828125, -0.07792854309082031, -0.07241439819335938, -0.06690025329589844, -0.0613861083984375, -0.05587196350097656, -0.050357818603515625, -0.04484367370605469, -0.03932952880859375, -0.03381538391113281, -0.028301239013671875, -0.022787094116210938, -0.01727294921875, -0.011758804321289062, -0.006244659423828125, -0.0007305145263671875, 0.00478363037109375, 0.010297775268554688, 0.015811920166015625, 0.021326065063476562, 0.0268402099609375, 0.03235435485839844, 0.037868499755859375, 0.04338264465332031, 0.04889678955078125, 0.05441093444824219, 0.059925079345703125, 0.06543922424316406, 0.070953369140625, 0.07646751403808594, 0.08198165893554688, 0.08749580383300781, 0.09300994873046875, 0.09852409362792969, 0.10403823852539062, 0.10955238342285156, 0.1150665283203125, 0.12058067321777344, 0.12609481811523438, 0.1316089630126953, 0.13712310791015625, 0.1426372528076172, 0.14815139770507812, 0.15366554260253906, 0.1591796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 8.0, 13.0, 12.0, 13.0, 31.0, 31.0, 40.0, 74.0, 95.0, 155.0, 246.0, 317.0, 531.0, 806.0, 1286.0, 2280.0, 4024.0, 7766.0, 16500.0, 40266.0, 116127.0, 370705.0, 320975.0, 99847.0, 35391.0, 14918.0, 7134.0, 3678.0, 1959.0, 1146.0, 740.0, 448.0, 312.0, 202.0, 141.0, 82.0, 56.0, 53.0, 42.0, 34.0, 8.0, 14.0, 11.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.06536865234375, -0.06325531005859375, -0.0611419677734375, -0.05902862548828125, -0.056915283203125, -0.05480194091796875, -0.0526885986328125, -0.05057525634765625, -0.0484619140625, -0.04634857177734375, -0.0442352294921875, -0.04212188720703125, -0.040008544921875, -0.03789520263671875, -0.0357818603515625, -0.03366851806640625, -0.03155517578125, -0.02944183349609375, -0.0273284912109375, -0.02521514892578125, -0.023101806640625, -0.02098846435546875, -0.0188751220703125, -0.01676177978515625, -0.0146484375, -0.01253509521484375, -0.0104217529296875, -0.00830841064453125, -0.006195068359375, -0.00408172607421875, -0.0019683837890625, 0.00014495849609375, 0.00225830078125, 0.00437164306640625, 0.0064849853515625, 0.00859832763671875, 0.010711669921875, 0.01282501220703125, 0.0149383544921875, 0.01705169677734375, 0.0191650390625, 0.02127838134765625, 0.0233917236328125, 0.02550506591796875, 0.027618408203125, 0.02973175048828125, 0.0318450927734375, 0.03395843505859375, 0.03607177734375, 0.03818511962890625, 0.0402984619140625, 0.04241180419921875, 0.044525146484375, 0.04663848876953125, 0.0487518310546875, 0.05086517333984375, 0.052978515625, 0.05509185791015625, 0.0572052001953125, 0.05931854248046875, 0.061431884765625, 0.06354522705078125, 0.0656585693359375, 0.06777191162109375, 0.06988525390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 5.0, 6.0, 8.0, 9.0, 14.0, 24.0, 19.0, 33.0, 37.0, 52.0, 54.0, 63.0, 92.0, 67.0, 110.0, 81.0, 82.0, 54.0, 43.0, 37.0, 14.0, 29.0, 15.0, 10.0, 4.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1622905731201172e-05, -1.1298805475234985e-05, -1.0974705219268799e-05, -1.0650604963302612e-05, -1.0326504707336426e-05, -1.000240445137024e-05, -9.678304195404053e-06, -9.354203939437866e-06, -9.03010368347168e-06, -8.706003427505493e-06, -8.381903171539307e-06, -8.05780291557312e-06, -7.733702659606934e-06, -7.409602403640747e-06, -7.0855021476745605e-06, -6.761401891708374e-06, -6.4373016357421875e-06, -6.113201379776001e-06, -5.7891011238098145e-06, -5.465000867843628e-06, -5.140900611877441e-06, -4.816800355911255e-06, -4.492700099945068e-06, -4.168599843978882e-06, -3.844499588012695e-06, -3.520399332046509e-06, -3.1962990760803223e-06, -2.8721988201141357e-06, -2.5480985641479492e-06, -2.2239983081817627e-06, -1.8998980522155762e-06, -1.5757977962493896e-06, -1.2516975402832031e-06, -9.275972843170166e-07, -6.034970283508301e-07, -2.7939677238464355e-07, 4.470348358154297e-08, 3.688037395477295e-07, 6.92903995513916e-07, 1.0170042514801025e-06, 1.341104507446289e-06, 1.6652047634124756e-06, 1.989305019378662e-06, 2.3134052753448486e-06, 2.637505531311035e-06, 2.9616057872772217e-06, 3.285706043243408e-06, 3.6098062992095947e-06, 3.933906555175781e-06, 4.258006811141968e-06, 4.582107067108154e-06, 4.906207323074341e-06, 5.230307579040527e-06, 5.554407835006714e-06, 5.8785080909729e-06, 6.202608346939087e-06, 6.5267086029052734e-06, 6.85080885887146e-06, 7.1749091148376465e-06, 7.499009370803833e-06, 7.82310962677002e-06, 8.147209882736206e-06, 8.471310138702393e-06, 8.795410394668579e-06, 9.119510650634766e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 11.0, 11.0, 13.0, 26.0, 21.0, 31.0, 55.0, 106.0, 131.0, 220.0, 399.0, 779.0, 1422.0, 2902.0, 6949.0, 20941.0, 82015.0, 404445.0, 410161.0, 83400.0, 21181.0, 7127.0, 2952.0, 1452.0, 725.0, 402.0, 242.0, 154.0, 85.0, 51.0, 45.0, 33.0, 20.0, 12.0, 7.0, 7.0, 7.0, 3.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09063720703125, -0.08804798126220703, -0.08545875549316406, -0.0828695297241211, -0.08028030395507812, -0.07769107818603516, -0.07510185241699219, -0.07251262664794922, -0.06992340087890625, -0.06733417510986328, -0.06474494934082031, -0.062155723571777344, -0.059566497802734375, -0.056977272033691406, -0.05438804626464844, -0.05179882049560547, -0.0492095947265625, -0.04662036895751953, -0.04403114318847656, -0.041441917419433594, -0.038852691650390625, -0.036263465881347656, -0.03367424011230469, -0.03108501434326172, -0.02849578857421875, -0.02590656280517578, -0.023317337036132812, -0.020728111267089844, -0.018138885498046875, -0.015549659729003906, -0.012960433959960938, -0.010371208190917969, -0.007781982421875, -0.005192756652832031, -0.0026035308837890625, -1.430511474609375e-05, 0.002574920654296875, 0.005164146423339844, 0.0077533721923828125, 0.010342597961425781, 0.01293182373046875, 0.015521049499511719, 0.018110275268554688, 0.020699501037597656, 0.023288726806640625, 0.025877952575683594, 0.028467178344726562, 0.03105640411376953, 0.0336456298828125, 0.03623485565185547, 0.03882408142089844, 0.041413307189941406, 0.044002532958984375, 0.046591758728027344, 0.04918098449707031, 0.05177021026611328, 0.05435943603515625, 0.05694866180419922, 0.05953788757324219, 0.062127113342285156, 0.06471633911132812, 0.0673055648803711, 0.06989479064941406, 0.07248401641845703, 0.0750732421875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 11.0, 12.0, 16.0, 21.0, 28.0, 39.0, 35.0, 39.0, 55.0, 54.0, 62.0, 69.0, 88.0, 80.0, 60.0, 50.0, 46.0, 34.0, 38.0, 28.0, 26.0, 19.0, 11.0, 9.0, 7.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0458984375, -0.04403400421142578, -0.04216957092285156, -0.040305137634277344, -0.038440704345703125, -0.036576271057128906, -0.03471183776855469, -0.03284740447998047, -0.03098297119140625, -0.02911853790283203, -0.027254104614257812, -0.025389671325683594, -0.023525238037109375, -0.021660804748535156, -0.019796371459960938, -0.01793193817138672, -0.0160675048828125, -0.014203071594238281, -0.012338638305664062, -0.010474205017089844, -0.008609771728515625, -0.006745338439941406, -0.0048809051513671875, -0.0030164718627929688, -0.00115203857421875, 0.0007123947143554688, 0.0025768280029296875, 0.004441261291503906, 0.006305694580078125, 0.008170127868652344, 0.010034561157226562, 0.011898994445800781, 0.013763427734375, 0.01562786102294922, 0.017492294311523438, 0.019356727600097656, 0.021221160888671875, 0.023085594177246094, 0.024950027465820312, 0.02681446075439453, 0.02867889404296875, 0.03054332733154297, 0.03240776062011719, 0.034272193908691406, 0.036136627197265625, 0.038001060485839844, 0.03986549377441406, 0.04172992706298828, 0.0435943603515625, 0.04545879364013672, 0.04732322692871094, 0.049187660217285156, 0.051052093505859375, 0.052916526794433594, 0.05478096008300781, 0.05664539337158203, 0.05850982666015625, 0.06037425994873047, 0.06223869323730469, 0.0641031265258789, 0.06596755981445312, 0.06783199310302734, 0.06969642639160156, 0.07156085968017578, 0.07342529296875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 10.0, 29.0, 60.0, 167.0, 390.0, 261.0, 68.0, 17.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.976993560791016, -4.872744560241699, -4.768496036529541, -4.664247035980225, -4.559998512268066, -4.45574951171875, -4.351500988006592, -4.247251987457275, -4.143003463745117, -4.038754463195801, -3.9345059394836426, -3.8302571773529053, -3.726008415222168, -3.6217594146728516, -3.5175106525421143, -3.413261890411377, -3.3090128898620605, -3.2047641277313232, -3.100515365600586, -2.9962666034698486, -2.8920178413391113, -2.787768840789795, -2.6835200786590576, -2.5792713165283203, -2.475022554397583, -2.3707737922668457, -2.2665250301361084, -2.162276268005371, -2.0580272674560547, -1.953778624534607, -1.84952974319458, -1.7452809810638428, -1.6410322189331055, -1.5367834568023682, -1.4325346946716309, -1.328285813331604, -1.2240370512008667, -1.1197882890701294, -1.0155394077301025, -0.9112906455993652, -0.8070418834686279, -0.7027931213378906, -0.5985442996025085, -0.49429550766944885, -0.39004671573638916, -0.28579795360565186, -0.18154913187026978, -0.0773003101348877, 0.02694845199584961, 0.1311972439289093, 0.235446035861969, 0.3396948277950287, 0.4439436197280884, 0.5481923818588257, 0.6524412035942078, 0.7566900253295898, 0.8609387874603271, 0.9651875495910645, 1.0694363117218018, 1.1736851930618286, 1.277933955192566, 1.3821827173233032, 1.48643159866333, 1.5906803607940674, 1.6949291229248047]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 7.0, 17.0, 22.0, 26.0, 25.0, 46.0, 32.0, 39.0, 42.0, 48.0, 53.0, 54.0, 62.0, 46.0, 51.0, 56.0, 43.0, 51.0, 42.0, 33.0, 34.0, 34.0, 36.0, 21.0, 25.0, 14.0, 18.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8114482164382935, -1.7571368217468262, -1.7028255462646484, -1.6485141515731812, -1.5942028760910034, -1.5398914813995361, -1.4855802059173584, -1.4312688112258911, -1.3769574165344238, -1.3226460218429565, -1.2683347463607788, -1.2140233516693115, -1.1597120761871338, -1.1054006814956665, -1.0510892868041992, -0.9967780113220215, -0.9424667358398438, -0.8881554007530212, -0.8338440656661987, -0.7795326709747314, -0.7252213954925537, -0.6709100008010864, -0.6165986657142639, -0.5622873306274414, -0.5079759955406189, -0.4536646604537964, -0.3993533253669739, -0.345041960477829, -0.29073062539100647, -0.23641929030418396, -0.18210792541503906, -0.12779659032821655, -0.0734853744506836, -0.019174031913280487, 0.03513731062412262, 0.08944866061210632, 0.14375999569892883, 0.19807133078575134, 0.25238269567489624, 0.30669403076171875, 0.36100536584854126, 0.41531670093536377, 0.4696280360221863, 0.5239393711090088, 0.5782507658004761, 0.6325620412826538, 0.6868734359741211, 0.7411847710609436, 0.7954961061477661, 0.8498074412345886, 0.9041187763214111, 0.9584301710128784, 1.0127414464950562, 1.0670528411865234, 1.1213641166687012, 1.1756755113601685, 1.2299869060516357, 1.284298300743103, 1.3386095762252808, 1.392920970916748, 1.4472322463989258, 1.501543641090393, 1.5558550357818604, 1.610166311264038, 1.6644775867462158]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 7.0, 2.0, 1.0, 8.0, 14.0, 15.0, 22.0, 36.0, 56.0, 164.0, 915.0, 1450033.0, 2741716.0, 927.0, 178.0, 75.0, 44.0, 21.0, 17.0, 9.0, 9.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.908203125, -0.87188720703125, -0.8355712890625, -0.79925537109375, -0.762939453125, -0.72662353515625, -0.6903076171875, -0.65399169921875, -0.61767578125, -0.58135986328125, -0.5450439453125, -0.50872802734375, -0.472412109375, -0.43609619140625, -0.3997802734375, -0.36346435546875, -0.3271484375, -0.29083251953125, -0.2545166015625, -0.21820068359375, -0.181884765625, -0.14556884765625, -0.1092529296875, -0.07293701171875, -0.03662109375, -0.00030517578125, 0.0360107421875, 0.07232666015625, 0.108642578125, 0.14495849609375, 0.1812744140625, 0.21759033203125, 0.25390625, 0.29022216796875, 0.3265380859375, 0.36285400390625, 0.399169921875, 0.43548583984375, 0.4718017578125, 0.50811767578125, 0.54443359375, 0.58074951171875, 0.6170654296875, 0.65338134765625, 0.689697265625, 0.72601318359375, 0.7623291015625, 0.79864501953125, 0.8349609375, 0.87127685546875, 0.9075927734375, 0.94390869140625, 0.980224609375, 1.01654052734375, 1.0528564453125, 1.08917236328125, 1.12548828125, 1.16180419921875, 1.1981201171875, 1.23443603515625, 1.270751953125, 1.30706787109375, 1.3433837890625, 1.37969970703125, 1.416015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 16.0, 24.0, 33.0, 49.0, 105.0, 147.0, 187.0, 160.0, 97.0, 59.0, 37.0, 15.0, 19.0, 6.0, 15.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1231689453125, -0.11816215515136719, -0.11315536499023438, -0.10814857482910156, -0.10314178466796875, -0.09813499450683594, -0.09312820434570312, -0.08812141418457031, -0.0831146240234375, -0.07810783386230469, -0.07310104370117188, -0.06809425354003906, -0.06308746337890625, -0.05808067321777344, -0.053073883056640625, -0.04806709289550781, -0.043060302734375, -0.03805351257324219, -0.033046722412109375, -0.028039932250976562, -0.02303314208984375, -0.018026351928710938, -0.013019561767578125, -0.008012771606445312, -0.0030059814453125, 0.0020008087158203125, 0.007007598876953125, 0.012014389038085938, 0.01702117919921875, 0.022027969360351562, 0.027034759521484375, 0.03204154968261719, 0.03704833984375, 0.04205513000488281, 0.047061920166015625, 0.05206871032714844, 0.05707550048828125, 0.06208229064941406, 0.06708908081054688, 0.07209587097167969, 0.0771026611328125, 0.08210945129394531, 0.08711624145507812, 0.09212303161621094, 0.09712982177734375, 0.10213661193847656, 0.10714340209960938, 0.11215019226074219, 0.117156982421875, 0.12216377258300781, 0.12717056274414062, 0.13217735290527344, 0.13718414306640625, 0.14219093322753906, 0.14719772338867188, 0.1522045135498047, 0.1572113037109375, 0.1622180938720703, 0.16722488403320312, 0.17223167419433594, 0.17723846435546875, 0.18224525451660156, 0.18725204467773438, 0.1922588348388672, 0.197265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 11.0, 13.0, 18.0, 25.0, 30.0, 37.0, 54.0, 75.0, 161.0, 299.0, 1011.0, 4042.0, 24739.0, 423824.0, 3622569.0, 102968.0, 11047.0, 2188.0, 612.0, 235.0, 118.0, 63.0, 27.0, 25.0, 14.0, 11.0, 14.0, 8.0, 3.0, 4.0, 6.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.439453125, -0.42930030822753906, -0.4191474914550781, -0.4089946746826172, -0.39884185791015625, -0.3886890411376953, -0.3785362243652344, -0.36838340759277344, -0.3582305908203125, -0.34807777404785156, -0.3379249572753906, -0.3277721405029297, -0.31761932373046875, -0.3074665069580078, -0.2973136901855469, -0.28716087341308594, -0.277008056640625, -0.26685523986816406, -0.2567024230957031, -0.2465496063232422, -0.23639678955078125, -0.2262439727783203, -0.21609115600585938, -0.20593833923339844, -0.1957855224609375, -0.18563270568847656, -0.17547988891601562, -0.1653270721435547, -0.15517425537109375, -0.1450214385986328, -0.13486862182617188, -0.12471580505371094, -0.11456298828125, -0.10441017150878906, -0.09425735473632812, -0.08410453796386719, -0.07395172119140625, -0.06379890441894531, -0.053646087646484375, -0.04349327087402344, -0.0333404541015625, -0.023187637329101562, -0.013034820556640625, -0.0028820037841796875, 0.00727081298828125, 0.017423629760742188, 0.027576446533203125, 0.03772926330566406, 0.047882080078125, 0.05803489685058594, 0.06818771362304688, 0.07834053039550781, 0.08849334716796875, 0.09864616394042969, 0.10879898071289062, 0.11895179748535156, 0.1291046142578125, 0.13925743103027344, 0.14941024780273438, 0.1595630645751953, 0.16971588134765625, 0.1798686981201172, 0.19002151489257812, 0.20017433166503906, 0.2103271484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 1.0, 5.0, 5.0, 7.0, 8.0, 14.0, 13.0, 11.0, 22.0, 34.0, 21.0, 42.0, 53.0, 62.0, 102.0, 144.0, 209.0, 411.0, 739.0, 946.0, 510.0, 295.0, 165.0, 76.0, 61.0, 33.0, 19.0, 15.0, 10.0, 6.0, 5.0, 8.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1312255859375, -0.1279773712158203, -0.12472915649414062, -0.12148094177246094, -0.11823272705078125, -0.11498451232910156, -0.11173629760742188, -0.10848808288574219, -0.1052398681640625, -0.10199165344238281, -0.09874343872070312, -0.09549522399902344, -0.09224700927734375, -0.08899879455566406, -0.08575057983398438, -0.08250236511230469, -0.079254150390625, -0.07600593566894531, -0.07275772094726562, -0.06950950622558594, -0.06626129150390625, -0.06301307678222656, -0.059764862060546875, -0.05651664733886719, -0.0532684326171875, -0.05002021789550781, -0.046772003173828125, -0.04352378845214844, -0.04027557373046875, -0.03702735900878906, -0.033779144287109375, -0.030530929565429688, -0.02728271484375, -0.024034500122070312, -0.020786285400390625, -0.017538070678710938, -0.01428985595703125, -0.011041641235351562, -0.007793426513671875, -0.0045452117919921875, -0.0012969970703125, 0.0019512176513671875, 0.005199432373046875, 0.008447647094726562, 0.01169586181640625, 0.014944076538085938, 0.018192291259765625, 0.021440505981445312, 0.024688720703125, 0.027936935424804688, 0.031185150146484375, 0.03443336486816406, 0.03768157958984375, 0.04092979431152344, 0.044178009033203125, 0.04742622375488281, 0.0506744384765625, 0.05392265319824219, 0.057170867919921875, 0.06041908264160156, 0.06366729736328125, 0.06691551208496094, 0.07016372680664062, 0.07341194152832031, 0.07666015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 697.0, 310.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.005799770355225, -3.782850980758667, -3.5599021911621094, -3.3369534015655518, -3.114004611968994, -2.8910558223724365, -2.668107032775879, -2.4451582431793213, -2.2222094535827637, -1.999260663986206, -1.7763118743896484, -1.5533630847930908, -1.3304142951965332, -1.1074655055999756, -0.884516716003418, -0.6615679264068604, -0.43861913681030273, -0.21567034721374512, 0.0072784423828125, 0.23022723197937012, 0.45317602157592773, 0.6761248111724854, 0.899073600769043, 1.1220223903656006, 1.3449711799621582, 1.5679199695587158, 1.7908687591552734, 2.013817548751831, 2.2367663383483887, 2.4597151279449463, 2.682663917541504, 2.9056127071380615, 3.1285619735717773, 3.351510763168335, 3.5744595527648926, 3.79740834236145, 4.020357131958008, 4.2433061599731445, 4.466254711151123, 4.689203262329102, 4.912152290344238, 5.135101318359375, 5.3580498695373535, 5.580998420715332, 5.803947448730469, 6.0268964767456055, 6.249845027923584, 6.4727935791015625, 6.695742607116699, 6.918691635131836, 7.1416401863098145, 7.364588737487793, 7.58753776550293, 7.810486793518066, 8.033435821533203, 8.256383895874023, 8.47933292388916, 8.702281951904297, 8.925230026245117, 9.148179054260254, 9.37112808227539, 9.594077110290527, 9.817026138305664, 10.039974212646484, 10.262923240661621]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 8.0, 12.0, 11.0, 15.0, 19.0, 32.0, 45.0, 34.0, 52.0, 55.0, 60.0, 60.0, 64.0, 52.0, 56.0, 53.0, 52.0, 49.0, 42.0, 47.0, 38.0, 37.0, 34.0, 16.0, 15.0, 11.0, 7.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4416899085044861, -0.42432186007499695, -0.4069538116455078, -0.3895857632160187, -0.37221771478652954, -0.3548496663570404, -0.33748161792755127, -0.32011356949806213, -0.302745521068573, -0.28537747263908386, -0.2680094242095947, -0.2506413757801056, -0.23327332735061646, -0.21590527892112732, -0.19853723049163818, -0.18116918206214905, -0.1638011336326599, -0.14643308520317078, -0.12906503677368164, -0.1116969883441925, -0.09432893991470337, -0.07696089148521423, -0.0595928430557251, -0.04222479462623596, -0.024856746196746826, -0.00748869776725769, 0.009879350662231445, 0.02724739909172058, 0.04461544752120972, 0.06198349595069885, 0.07935154438018799, 0.09671959280967712, 0.11408764123916626, 0.1314556896686554, 0.14882373809814453, 0.16619178652763367, 0.1835598349571228, 0.20092788338661194, 0.21829593181610107, 0.2356639802455902, 0.25303202867507935, 0.2704000771045685, 0.2877681255340576, 0.30513617396354675, 0.3225042223930359, 0.339872270822525, 0.35724031925201416, 0.3746083676815033, 0.39197641611099243, 0.40934446454048157, 0.4267125129699707, 0.44408056139945984, 0.461448609828949, 0.4788166582584381, 0.49618470668792725, 0.5135527849197388, 0.5309208035469055, 0.5482888221740723, 0.5656569004058838, 0.5830249786376953, 0.6003929972648621, 0.6177610158920288, 0.6351290941238403, 0.6524971723556519, 0.6698651909828186]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 9.0, 9.0, 12.0, 8.0, 26.0, 26.0, 35.0, 63.0, 78.0, 147.0, 199.0, 373.0, 739.0, 1745.0, 5872.0, 30044.0, 298410.0, 639332.0, 57376.0, 9481.0, 2513.0, 938.0, 424.0, 260.0, 139.0, 103.0, 61.0, 40.0, 29.0, 17.0, 7.0, 12.0, 14.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287841796875, -0.27724456787109375, -0.2666473388671875, -0.25605010986328125, -0.245452880859375, -0.23485565185546875, -0.2242584228515625, -0.21366119384765625, -0.20306396484375, -0.19246673583984375, -0.1818695068359375, -0.17127227783203125, -0.160675048828125, -0.15007781982421875, -0.1394805908203125, -0.12888336181640625, -0.1182861328125, -0.10768890380859375, -0.0970916748046875, -0.08649444580078125, -0.075897216796875, -0.06529998779296875, -0.0547027587890625, -0.04410552978515625, -0.03350830078125, -0.02291107177734375, -0.0123138427734375, -0.00171661376953125, 0.008880615234375, 0.01947784423828125, 0.0300750732421875, 0.04067230224609375, 0.05126953125, 0.06186676025390625, 0.0724639892578125, 0.08306121826171875, 0.093658447265625, 0.10425567626953125, 0.1148529052734375, 0.12545013427734375, 0.13604736328125, 0.14664459228515625, 0.1572418212890625, 0.16783905029296875, 0.178436279296875, 0.18903350830078125, 0.1996307373046875, 0.21022796630859375, 0.2208251953125, 0.23142242431640625, 0.2420196533203125, 0.25261688232421875, 0.263214111328125, 0.27381134033203125, 0.2844085693359375, 0.29500579833984375, 0.30560302734375, 0.31620025634765625, 0.3267974853515625, 0.33739471435546875, 0.347991943359375, 0.35858917236328125, 0.3691864013671875, 0.37978363037109375, 0.390380859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 7.0, 10.0, 7.0, 22.0, 29.0, 29.0, 49.0, 91.0, 119.0, 169.0, 158.0, 117.0, 66.0, 43.0, 21.0, 19.0, 20.0, 9.0, 9.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11322021484375, -0.10846805572509766, -0.10371589660644531, -0.09896373748779297, -0.09421157836914062, -0.08945941925048828, -0.08470726013183594, -0.0799551010131836, -0.07520294189453125, -0.0704507827758789, -0.06569862365722656, -0.06094646453857422, -0.056194305419921875, -0.05144214630126953, -0.04668998718261719, -0.041937828063964844, -0.0371856689453125, -0.032433509826660156, -0.027681350708007812, -0.02292919158935547, -0.018177032470703125, -0.013424873352050781, -0.008672714233398438, -0.003920555114746094, 0.00083160400390625, 0.005583763122558594, 0.010335922241210938, 0.015088081359863281, 0.019840240478515625, 0.02459239959716797, 0.029344558715820312, 0.034096717834472656, 0.038848876953125, 0.043601036071777344, 0.04835319519042969, 0.05310535430908203, 0.057857513427734375, 0.06260967254638672, 0.06736183166503906, 0.0721139907836914, 0.07686614990234375, 0.0816183090209961, 0.08637046813964844, 0.09112262725830078, 0.09587478637695312, 0.10062694549560547, 0.10537910461425781, 0.11013126373291016, 0.1148834228515625, 0.11963558197021484, 0.12438774108886719, 0.12913990020751953, 0.13389205932617188, 0.13864421844482422, 0.14339637756347656, 0.1481485366821289, 0.15290069580078125, 0.1576528549194336, 0.16240501403808594, 0.16715717315673828, 0.17190933227539062, 0.17666149139404297, 0.1814136505126953, 0.18616580963134766, 0.19091796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 7.0, 6.0, 8.0, 18.0, 13.0, 15.0, 14.0, 20.0, 20.0, 29.0, 23.0, 36.0, 34.0, 43.0, 45.0, 55.0, 127.0, 554.0, 9230.0, 890338.0, 145033.0, 2181.0, 295.0, 84.0, 58.0, 43.0, 22.0, 31.0, 33.0, 18.0, 22.0, 22.0, 13.0, 13.0, 11.0, 11.0, 6.0, 5.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8560028076171875, -0.826263427734375, -0.7965240478515625, -0.76678466796875, -0.7370452880859375, -0.707305908203125, -0.6775665283203125, -0.6478271484375, -0.6180877685546875, -0.588348388671875, -0.5586090087890625, -0.52886962890625, -0.4991302490234375, -0.469390869140625, -0.4396514892578125, -0.409912109375, -0.3801727294921875, -0.350433349609375, -0.3206939697265625, -0.29095458984375, -0.2612152099609375, -0.231475830078125, -0.2017364501953125, -0.1719970703125, -0.1422576904296875, -0.112518310546875, -0.0827789306640625, -0.05303955078125, -0.0233001708984375, 0.006439208984375, 0.0361785888671875, 0.06591796875, 0.0956573486328125, 0.125396728515625, 0.1551361083984375, 0.18487548828125, 0.2146148681640625, 0.244354248046875, 0.2740936279296875, 0.3038330078125, 0.3335723876953125, 0.363311767578125, 0.3930511474609375, 0.42279052734375, 0.4525299072265625, 0.482269287109375, 0.5120086669921875, 0.541748046875, 0.5714874267578125, 0.601226806640625, 0.6309661865234375, 0.66070556640625, 0.6904449462890625, 0.720184326171875, 0.7499237060546875, 0.7796630859375, 0.8094024658203125, 0.839141845703125, 0.8688812255859375, 0.89862060546875, 0.9283599853515625, 0.958099365234375, 0.9878387451171875, 1.017578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 12.0, 10.0, 18.0, 14.0, 16.0, 19.0, 23.0, 24.0, 30.0, 41.0, 30.0, 43.0, 38.0, 38.0, 33.0, 46.0, 43.0, 43.0, 48.0, 41.0, 39.0, 36.0, 56.0, 30.0, 26.0, 27.0, 27.0, 28.0, 26.0, 12.0, 12.0, 13.0, 16.0, 7.0, 2.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.160888671875, -0.15545082092285156, -0.15001296997070312, -0.1445751190185547, -0.13913726806640625, -0.1336994171142578, -0.12826156616210938, -0.12282371520996094, -0.1173858642578125, -0.11194801330566406, -0.10651016235351562, -0.10107231140136719, -0.09563446044921875, -0.09019660949707031, -0.08475875854492188, -0.07932090759277344, -0.073883056640625, -0.06844520568847656, -0.06300735473632812, -0.05756950378417969, -0.05213165283203125, -0.04669380187988281, -0.041255950927734375, -0.03581809997558594, -0.0303802490234375, -0.024942398071289062, -0.019504547119140625, -0.014066696166992188, -0.00862884521484375, -0.0031909942626953125, 0.002246856689453125, 0.0076847076416015625, 0.01312255859375, 0.018560409545898438, 0.023998260498046875, 0.029436111450195312, 0.03487396240234375, 0.04031181335449219, 0.045749664306640625, 0.05118751525878906, 0.0566253662109375, 0.06206321716308594, 0.06750106811523438, 0.07293891906738281, 0.07837677001953125, 0.08381462097167969, 0.08925247192382812, 0.09469032287597656, 0.100128173828125, 0.10556602478027344, 0.11100387573242188, 0.11644172668457031, 0.12187957763671875, 0.1273174285888672, 0.13275527954101562, 0.13819313049316406, 0.1436309814453125, 0.14906883239746094, 0.15450668334960938, 0.1599445343017578, 0.16538238525390625, 0.1708202362060547, 0.17625808715820312, 0.18169593811035156, 0.1871337890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 11.0, 12.0, 17.0, 27.0, 32.0, 52.0, 91.0, 163.0, 271.0, 475.0, 923.0, 1896.0, 4327.0, 11128.0, 36516.0, 182085.0, 632592.0, 132465.0, 29001.0, 9235.0, 3681.0, 1720.0, 826.0, 431.0, 205.0, 116.0, 88.0, 40.0, 36.0, 22.0, 22.0, 11.0, 13.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1361083984375, -0.1322650909423828, -0.12842178344726562, -0.12457847595214844, -0.12073516845703125, -0.11689186096191406, -0.11304855346679688, -0.10920524597167969, -0.1053619384765625, -0.10151863098144531, -0.09767532348632812, -0.09383201599121094, -0.08998870849609375, -0.08614540100097656, -0.08230209350585938, -0.07845878601074219, -0.074615478515625, -0.07077217102050781, -0.06692886352539062, -0.06308555603027344, -0.05924224853515625, -0.05539894104003906, -0.051555633544921875, -0.04771232604980469, -0.0438690185546875, -0.04002571105957031, -0.036182403564453125, -0.03233909606933594, -0.02849578857421875, -0.024652481079101562, -0.020809173583984375, -0.016965866088867188, -0.01312255859375, -0.009279251098632812, -0.005435943603515625, -0.0015926361083984375, 0.00225067138671875, 0.0060939788818359375, 0.009937286376953125, 0.013780593872070312, 0.0176239013671875, 0.021467208862304688, 0.025310516357421875, 0.029153823852539062, 0.03299713134765625, 0.03684043884277344, 0.040683746337890625, 0.04452705383300781, 0.048370361328125, 0.05221366882324219, 0.056056976318359375, 0.05990028381347656, 0.06374359130859375, 0.06758689880371094, 0.07143020629882812, 0.07527351379394531, 0.0791168212890625, 0.08296012878417969, 0.08680343627929688, 0.09064674377441406, 0.09449005126953125, 0.09833335876464844, 0.10217666625976562, 0.10601997375488281, 0.10986328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 9.0, 10.0, 9.0, 12.0, 13.0, 11.0, 22.0, 22.0, 36.0, 43.0, 57.0, 48.0, 78.0, 66.0, 86.0, 62.0, 80.0, 83.0, 51.0, 45.0, 27.0, 40.0, 12.0, 13.0, 19.0, 9.0, 10.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.046627044677734e-06, -7.783062756061554e-06, -7.5194984674453735e-06, -7.255934178829193e-06, -6.992369890213013e-06, -6.728805601596832e-06, -6.465241312980652e-06, -6.2016770243644714e-06, -5.938112735748291e-06, -5.674548447132111e-06, -5.41098415851593e-06, -5.14741986989975e-06, -4.883855581283569e-06, -4.620291292667389e-06, -4.3567270040512085e-06, -4.093162715435028e-06, -3.829598426818848e-06, -3.5660341382026672e-06, -3.302469849586487e-06, -3.0389055609703064e-06, -2.775341272354126e-06, -2.5117769837379456e-06, -2.248212695121765e-06, -1.9846484065055847e-06, -1.7210841178894043e-06, -1.4575198292732239e-06, -1.1939555406570435e-06, -9.30391252040863e-07, -6.668269634246826e-07, -4.032626748085022e-07, -1.3969838619232178e-07, 1.2386590242385864e-07, 3.8743019104003906e-07, 6.509944796562195e-07, 9.145587682723999e-07, 1.1781230568885803e-06, 1.4416873455047607e-06, 1.7052516341209412e-06, 1.9688159227371216e-06, 2.232380211353302e-06, 2.4959444999694824e-06, 2.759508788585663e-06, 3.0230730772018433e-06, 3.2866373658180237e-06, 3.550201654434204e-06, 3.8137659430503845e-06, 4.077330231666565e-06, 4.340894520282745e-06, 4.604458808898926e-06, 4.868023097515106e-06, 5.131587386131287e-06, 5.395151674747467e-06, 5.6587159633636475e-06, 5.922280251979828e-06, 6.185844540596008e-06, 6.449408829212189e-06, 6.712973117828369e-06, 6.9765374064445496e-06, 7.24010169506073e-06, 7.50366598367691e-06, 7.76723027229309e-06, 8.030794560909271e-06, 8.294358849525452e-06, 8.557923138141632e-06, 8.821487426757812e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 4.0, 6.0, 8.0, 13.0, 14.0, 15.0, 30.0, 27.0, 41.0, 68.0, 104.0, 264.0, 1770.0, 162067.0, 878428.0, 4883.0, 382.0, 146.0, 62.0, 44.0, 37.0, 28.0, 24.0, 18.0, 18.0, 14.0, 7.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3330078125, -0.3219642639160156, -0.31092071533203125, -0.2998771667480469, -0.2888336181640625, -0.2777900695800781, -0.26674652099609375, -0.2557029724121094, -0.244659423828125, -0.23361587524414062, -0.22257232666015625, -0.21152877807617188, -0.2004852294921875, -0.18944168090820312, -0.17839813232421875, -0.16735458374023438, -0.15631103515625, -0.14526748657226562, -0.13422393798828125, -0.12318038940429688, -0.1121368408203125, -0.10109329223632812, -0.09004974365234375, -0.07900619506835938, -0.067962646484375, -0.056919097900390625, -0.04587554931640625, -0.034832000732421875, -0.0237884521484375, -0.012744903564453125, -0.00170135498046875, 0.009342193603515625, 0.0203857421875, 0.031429290771484375, 0.04247283935546875, 0.053516387939453125, 0.0645599365234375, 0.07560348510742188, 0.08664703369140625, 0.09769058227539062, 0.108734130859375, 0.11977767944335938, 0.13082122802734375, 0.14186477661132812, 0.1529083251953125, 0.16395187377929688, 0.17499542236328125, 0.18603897094726562, 0.19708251953125, 0.20812606811523438, 0.21916961669921875, 0.23021316528320312, 0.2412567138671875, 0.2523002624511719, 0.26334381103515625, 0.2743873596191406, 0.285430908203125, 0.2964744567871094, 0.30751800537109375, 0.3185615539550781, 0.3296051025390625, 0.3406486511230469, 0.35169219970703125, 0.3627357482910156, 0.373779296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 5.0, 10.0, 14.0, 16.0, 19.0, 23.0, 26.0, 36.0, 46.0, 71.0, 59.0, 99.0, 85.0, 86.0, 76.0, 67.0, 46.0, 31.0, 34.0, 23.0, 23.0, 20.0, 16.0, 17.0, 11.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060638427734375, -0.05871772766113281, -0.056797027587890625, -0.05487632751464844, -0.05295562744140625, -0.05103492736816406, -0.049114227294921875, -0.04719352722167969, -0.0452728271484375, -0.04335212707519531, -0.041431427001953125, -0.03951072692871094, -0.03759002685546875, -0.03566932678222656, -0.033748626708984375, -0.03182792663574219, -0.0299072265625, -0.027986526489257812, -0.026065826416015625, -0.024145126342773438, -0.02222442626953125, -0.020303726196289062, -0.018383026123046875, -0.016462326049804688, -0.0145416259765625, -0.012620925903320312, -0.010700225830078125, -0.008779525756835938, -0.00685882568359375, -0.0049381256103515625, -0.003017425537109375, -0.0010967254638671875, 0.000823974609375, 0.0027446746826171875, 0.004665374755859375, 0.0065860748291015625, 0.00850677490234375, 0.010427474975585938, 0.012348175048828125, 0.014268875122070312, 0.0161895751953125, 0.018110275268554688, 0.020030975341796875, 0.021951675415039062, 0.02387237548828125, 0.025793075561523438, 0.027713775634765625, 0.029634475708007812, 0.03155517578125, 0.03347587585449219, 0.035396575927734375, 0.03731727600097656, 0.03923797607421875, 0.04115867614746094, 0.043079376220703125, 0.04500007629394531, 0.0469207763671875, 0.04884147644042969, 0.050762176513671875, 0.05268287658691406, 0.05460357666015625, 0.05652427673339844, 0.058444976806640625, 0.06036567687988281, 0.062286376953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 25.0, 444.0, 489.0, 44.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.230231285095215, -8.071907997131348, -7.913585662841797, -7.755262851715088, -7.596940040588379, -7.438616752624512, -7.280294418334961, -7.121971130371094, -6.963648319244385, -6.805325508117676, -6.647002696990967, -6.488679885864258, -6.330357074737549, -6.17203426361084, -6.013710975646973, -5.855388164520264, -5.697065353393555, -5.538742542266846, -5.380419731140137, -5.222096920013428, -5.063774108886719, -4.905450820922852, -4.747128486633301, -4.588805198669434, -4.430482864379883, -4.272160053253174, -4.113837242126465, -3.955514430999756, -3.7971913814544678, -3.638868570327759, -3.48054575920105, -3.3222227096557617, -3.163900136947632, -3.005577325820923, -2.847254514694214, -2.688931465148926, -2.530608654022217, -2.372285842895508, -2.213963031768799, -2.05564022064209, -1.8973172903060913, -1.7389944791793823, -1.5806715488433838, -1.4223487377166748, -1.2640259265899658, -1.1057029962539673, -0.9473801851272583, -0.7890572547912598, -0.6307344436645508, -0.472411572933197, -0.31408873200416565, -0.15576589107513428, 0.0025569796562194824, 0.16087985038757324, 0.3192026615142822, 0.47752559185028076, 0.6358484029769897, 0.7941712737083435, 0.9524941444396973, 1.1108169555664062, 1.2691397666931152, 1.4274626970291138, 1.5857855081558228, 1.7441084384918213, 1.9024312496185303]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 5.0, 5.0, 5.0, 7.0, 8.0, 12.0, 11.0, 15.0, 11.0, 24.0, 28.0, 16.0, 40.0, 45.0, 43.0, 42.0, 34.0, 35.0, 50.0, 51.0, 39.0, 41.0, 41.0, 45.0, 41.0, 34.0, 29.0, 29.0, 30.0, 30.0, 26.0, 21.0, 20.0, 21.0, 15.0, 15.0, 11.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8964300751686096, -0.8689583539962769, -0.8414866328239441, -0.8140149116516113, -0.7865432500839233, -0.7590715289115906, -0.7315998077392578, -0.704128086566925, -0.6766563653945923, -0.6491846442222595, -0.6217129230499268, -0.5942412614822388, -0.566769540309906, -0.5392978191375732, -0.5118260979652405, -0.4843543767929077, -0.45688268542289734, -0.4294109642505646, -0.4019392728805542, -0.37446755170822144, -0.34699583053588867, -0.3195241093635559, -0.29205241799354553, -0.26458069682121277, -0.2371089905500412, -0.20963728427886963, -0.18216556310653687, -0.1546938568353653, -0.12722215056419373, -0.09975042939186096, -0.07227872312068939, -0.04480700194835663, -0.01733529567718506, 0.010136416181921959, 0.037608128041028976, 0.06507983803749084, 0.09255155175924301, 0.12002326548099518, 0.14749497175216675, 0.1749666929244995, 0.20243839919567108, 0.22991010546684265, 0.2573818266391754, 0.2848535180091858, 0.31232523918151855, 0.3397969603538513, 0.3672686815261841, 0.39474040269851685, 0.4222120940685272, 0.44968381524086, 0.47715550661087036, 0.5046272277832031, 0.5320989489555359, 0.5595706701278687, 0.5870423316955566, 0.6145141124725342, 0.6419857740402222, 0.6694574952125549, 0.6969292163848877, 0.7244008779525757, 0.7518725991249084, 0.7793443202972412, 0.806816041469574, 0.8342877626419067, 0.8617594838142395]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 14.0, 22.0, 27.0, 37.0, 70.0, 90.0, 196.0, 368.0, 915.0, 3181.0, 14448.0, 261187.0, 3862930.0, 43225.0, 4818.0, 1323.0, 565.0, 319.0, 175.0, 115.0, 68.0, 37.0, 32.0, 19.0, 17.0, 15.0, 14.0, 7.0, 6.0, 4.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.27197265625, -0.2616233825683594, -0.25127410888671875, -0.24092483520507812, -0.2305755615234375, -0.22022628784179688, -0.20987701416015625, -0.19952774047851562, -0.189178466796875, -0.17882919311523438, -0.16847991943359375, -0.15813064575195312, -0.1477813720703125, -0.13743209838867188, -0.12708282470703125, -0.11673355102539062, -0.10638427734375, -0.09603500366210938, -0.08568572998046875, -0.07533645629882812, -0.0649871826171875, -0.054637908935546875, -0.04428863525390625, -0.033939361572265625, -0.023590087890625, -0.013240814208984375, -0.00289154052734375, 0.007457733154296875, 0.0178070068359375, 0.028156280517578125, 0.03850555419921875, 0.048854827880859375, 0.0592041015625, 0.06955337524414062, 0.07990264892578125, 0.09025192260742188, 0.1006011962890625, 0.11095046997070312, 0.12129974365234375, 0.13164901733398438, 0.141998291015625, 0.15234756469726562, 0.16269683837890625, 0.17304611206054688, 0.1833953857421875, 0.19374465942382812, 0.20409393310546875, 0.21444320678710938, 0.22479248046875, 0.23514175415039062, 0.24549102783203125, 0.2558403015136719, 0.2661895751953125, 0.2765388488769531, 0.28688812255859375, 0.2972373962402344, 0.307586669921875, 0.3179359436035156, 0.32828521728515625, 0.3386344909667969, 0.3489837646484375, 0.3593330383300781, 0.36968231201171875, 0.3800315856933594, 0.390380859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 14.0, 16.0, 17.0, 22.0, 37.0, 60.0, 98.0, 158.0, 184.0, 155.0, 74.0, 76.0, 24.0, 20.0, 18.0, 16.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11505126953125, -0.11033344268798828, -0.10561561584472656, -0.10089778900146484, -0.09617996215820312, -0.0914621353149414, -0.08674430847167969, -0.08202648162841797, -0.07730865478515625, -0.07259082794189453, -0.06787300109863281, -0.0631551742553711, -0.058437347412109375, -0.053719520568847656, -0.04900169372558594, -0.04428386688232422, -0.0395660400390625, -0.03484821319580078, -0.030130386352539062, -0.025412559509277344, -0.020694732666015625, -0.015976905822753906, -0.011259078979492188, -0.006541252136230469, -0.00182342529296875, 0.0028944015502929688, 0.0076122283935546875, 0.012330055236816406, 0.017047882080078125, 0.021765708923339844, 0.026483535766601562, 0.03120136260986328, 0.035919189453125, 0.04063701629638672, 0.04535484313964844, 0.050072669982910156, 0.054790496826171875, 0.059508323669433594, 0.06422615051269531, 0.06894397735595703, 0.07366180419921875, 0.07837963104248047, 0.08309745788574219, 0.0878152847290039, 0.09253311157226562, 0.09725093841552734, 0.10196876525878906, 0.10668659210205078, 0.1114044189453125, 0.11612224578857422, 0.12084007263183594, 0.12555789947509766, 0.13027572631835938, 0.1349935531616211, 0.1397113800048828, 0.14442920684814453, 0.14914703369140625, 0.15386486053466797, 0.1585826873779297, 0.1633005142211914, 0.16801834106445312, 0.17273616790771484, 0.17745399475097656, 0.18217182159423828, 0.1868896484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 23.0, 50.0, 115.0, 342.0, 1097.0, 11155.0, 1627359.0, 2539088.0, 13303.0, 1140.0, 306.0, 140.0, 58.0, 33.0, 29.0, 6.0, 5.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4560279846191406, -0.43915557861328125, -0.4222831726074219, -0.4054107666015625, -0.3885383605957031, -0.37166595458984375, -0.3547935485839844, -0.337921142578125, -0.3210487365722656, -0.30417633056640625, -0.2873039245605469, -0.2704315185546875, -0.2535591125488281, -0.23668670654296875, -0.21981430053710938, -0.20294189453125, -0.18606948852539062, -0.16919708251953125, -0.15232467651367188, -0.1354522705078125, -0.11857986450195312, -0.10170745849609375, -0.08483505249023438, -0.067962646484375, -0.051090240478515625, -0.03421783447265625, -0.017345428466796875, -0.0004730224609375, 0.016399383544921875, 0.03327178955078125, 0.050144195556640625, 0.0670166015625, 0.08388900756835938, 0.10076141357421875, 0.11763381958007812, 0.1345062255859375, 0.15137863159179688, 0.16825103759765625, 0.18512344360351562, 0.201995849609375, 0.21886825561523438, 0.23574066162109375, 0.2526130676269531, 0.2694854736328125, 0.2863578796386719, 0.30323028564453125, 0.3201026916503906, 0.33697509765625, 0.3538475036621094, 0.37071990966796875, 0.3875923156738281, 0.4044647216796875, 0.4213371276855469, 0.43820953369140625, 0.4550819396972656, 0.471954345703125, 0.4888267517089844, 0.5056991577148438, 0.5225715637207031, 0.5394439697265625, 0.5563163757324219, 0.5731887817382812, 0.5900611877441406, 0.60693359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 12.0, 8.0, 21.0, 41.0, 86.0, 158.0, 406.0, 752.0, 1302.0, 648.0, 283.0, 147.0, 96.0, 47.0, 31.0, 16.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.188446044921875, -0.18243408203125, -0.176422119140625, -0.17041015625, -0.164398193359375, -0.15838623046875, -0.152374267578125, -0.1463623046875, -0.140350341796875, -0.13433837890625, -0.128326416015625, -0.122314453125, -0.116302490234375, -0.11029052734375, -0.104278564453125, -0.0982666015625, -0.092254638671875, -0.08624267578125, -0.080230712890625, -0.07421875, -0.068206787109375, -0.06219482421875, -0.056182861328125, -0.0501708984375, -0.044158935546875, -0.03814697265625, -0.032135009765625, -0.026123046875, -0.020111083984375, -0.01409912109375, -0.008087158203125, -0.0020751953125, 0.003936767578125, 0.00994873046875, 0.015960693359375, 0.02197265625, 0.027984619140625, 0.03399658203125, 0.040008544921875, 0.0460205078125, 0.052032470703125, 0.05804443359375, 0.064056396484375, 0.070068359375, 0.076080322265625, 0.08209228515625, 0.088104248046875, 0.0941162109375, 0.100128173828125, 0.10614013671875, 0.112152099609375, 0.1181640625, 0.124176025390625, 0.13018798828125, 0.136199951171875, 0.1422119140625, 0.148223876953125, 0.15423583984375, 0.160247802734375, 0.166259765625, 0.172271728515625, 0.17828369140625, 0.184295654296875, 0.1903076171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 841.0, 172.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.509147644042969, -13.248595237731934, -12.988042831420898, -12.727490425109863, -12.466938018798828, -12.20638656616211, -11.945834159851074, -11.685281753540039, -11.424729347229004, -11.164176940917969, -10.903624534606934, -10.643072128295898, -10.38252067565918, -10.121968269348145, -9.86141586303711, -9.600863456726074, -9.340311050415039, -9.079758644104004, -8.819206237792969, -8.558653831481934, -8.298101425170898, -8.03754997253418, -7.7769975662231445, -7.516445159912109, -7.255892753601074, -6.995340347290039, -6.734787940979004, -6.474236011505127, -6.213683605194092, -5.953131198883057, -5.69257926940918, -5.4320268630981445, -5.171474933624268, -4.910922527313232, -4.6503705978393555, -4.38981819152832, -4.129265785217285, -3.86871337890625, -3.608161211013794, -3.347609043121338, -3.0870566368103027, -2.8265042304992676, -2.5659520626068115, -2.3053998947143555, -2.0448474884033203, -1.7842952013015747, -1.523742914199829, -1.2631906270980835, -1.002638339996338, -0.7420860528945923, -0.4815337657928467, -0.22098147869110107, 0.03957080841064453, 0.30012309551239014, 0.5606753826141357, 0.8212276697158813, 1.081779956817627, 1.3423322439193726, 1.6028845310211182, 1.8634368181228638, 2.1239891052246094, 2.3845415115356445, 2.6450936794281006, 2.9056458473205566, 3.166198253631592]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 14.0, 11.0, 20.0, 15.0, 24.0, 37.0, 39.0, 52.0, 50.0, 57.0, 70.0, 69.0, 76.0, 51.0, 63.0, 53.0, 55.0, 55.0, 39.0, 31.0, 28.0, 17.0, 16.0, 19.0, 15.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0], "bins": [-0.7734193801879883, -0.7562493681907654, -0.7390792965888977, -0.7219092845916748, -0.7047392725944519, -0.687569260597229, -0.6703991889953613, -0.6532291769981384, -0.6360591650009155, -0.6188891530036926, -0.601719081401825, -0.584549069404602, -0.5673790574073792, -0.5502090454101562, -0.5330389738082886, -0.5158689618110657, -0.498698890209198, -0.4815288484096527, -0.4643588364124298, -0.4471887946128845, -0.4300187826156616, -0.41284874081611633, -0.39567869901657104, -0.37850868701934814, -0.36133864521980286, -0.34416860342025757, -0.32699859142303467, -0.3098285496234894, -0.2926585078239441, -0.2754884958267212, -0.2583184540271759, -0.2411484271287918, -0.2239784598350525, -0.2068084329366684, -0.1896384060382843, -0.172468364238739, -0.15529833734035492, -0.13812831044197083, -0.12095827609300613, -0.10378824174404144, -0.08661821484565735, -0.06944818794727325, -0.05227815359830856, -0.03510812297463417, -0.017938092350959778, -0.0007680654525756836, 0.016401968896389008, 0.0335720032453537, 0.05074203014373779, 0.06791205704212189, 0.08508209139108658, 0.10225212574005127, 0.11942215263843536, 0.13659217953681946, 0.15376222133636475, 0.17093224823474884, 0.18810227513313293, 0.20527230203151703, 0.22244232892990112, 0.2396123707294464, 0.2567824125289917, 0.2739524245262146, 0.2911224663257599, 0.3082925081253052, 0.3254625201225281]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 8.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 8.0, 16.0, 25.0, 31.0, 33.0, 41.0, 70.0, 92.0, 137.0, 169.0, 268.0, 496.0, 953.0, 2153.0, 6210.0, 24996.0, 215567.0, 707223.0, 70408.0, 12782.0, 3628.0, 1432.0, 624.0, 366.0, 217.0, 155.0, 107.0, 66.0, 45.0, 40.0, 32.0, 30.0, 15.0, 18.0, 13.0, 9.0, 7.0, 9.0, 5.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4086418151855469, -0.39418792724609375, -0.3797340393066406, -0.3652801513671875, -0.3508262634277344, -0.33637237548828125, -0.3219184875488281, -0.307464599609375, -0.2930107116699219, -0.27855682373046875, -0.2641029357910156, -0.2496490478515625, -0.23519515991210938, -0.22074127197265625, -0.20628738403320312, -0.19183349609375, -0.17737960815429688, -0.16292572021484375, -0.14847183227539062, -0.1340179443359375, -0.11956405639648438, -0.10511016845703125, -0.09065628051757812, -0.076202392578125, -0.061748504638671875, -0.04729461669921875, -0.032840728759765625, -0.0183868408203125, -0.003932952880859375, 0.01052093505859375, 0.024974822998046875, 0.0394287109375, 0.053882598876953125, 0.06833648681640625, 0.08279037475585938, 0.0972442626953125, 0.11169815063476562, 0.12615203857421875, 0.14060592651367188, 0.155059814453125, 0.16951370239257812, 0.18396759033203125, 0.19842147827148438, 0.2128753662109375, 0.22732925415039062, 0.24178314208984375, 0.2562370300292969, 0.27069091796875, 0.2851448059082031, 0.29959869384765625, 0.3140525817871094, 0.3285064697265625, 0.3429603576660156, 0.35741424560546875, 0.3718681335449219, 0.386322021484375, 0.4007759094238281, 0.41522979736328125, 0.4296836853027344, 0.4441375732421875, 0.4585914611816406, 0.47304534912109375, 0.4874992370605469, 0.501953125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 10.0, 8.0, 14.0, 21.0, 35.0, 39.0, 78.0, 121.0, 188.0, 184.0, 120.0, 72.0, 39.0, 26.0, 18.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.117919921875, -0.11318397521972656, -0.10844802856445312, -0.10371208190917969, -0.09897613525390625, -0.09424018859863281, -0.08950424194335938, -0.08476829528808594, -0.0800323486328125, -0.07529640197753906, -0.07056045532226562, -0.06582450866699219, -0.06108856201171875, -0.05635261535644531, -0.051616668701171875, -0.04688072204589844, -0.042144775390625, -0.03740882873535156, -0.032672882080078125, -0.027936935424804688, -0.02320098876953125, -0.018465042114257812, -0.013729095458984375, -0.008993148803710938, -0.0042572021484375, 0.0004787445068359375, 0.005214691162109375, 0.009950637817382812, 0.01468658447265625, 0.019422531127929688, 0.024158477783203125, 0.028894424438476562, 0.03363037109375, 0.03836631774902344, 0.043102264404296875, 0.04783821105957031, 0.05257415771484375, 0.05731010437011719, 0.062046051025390625, 0.06678199768066406, 0.0715179443359375, 0.07625389099121094, 0.08098983764648438, 0.08572578430175781, 0.09046173095703125, 0.09519767761230469, 0.09993362426757812, 0.10466957092285156, 0.109405517578125, 0.11414146423339844, 0.11887741088867188, 0.12361335754394531, 0.12834930419921875, 0.1330852508544922, 0.13782119750976562, 0.14255714416503906, 0.1472930908203125, 0.15202903747558594, 0.15676498413085938, 0.1615009307861328, 0.16623687744140625, 0.1709728240966797, 0.17570877075195312, 0.18044471740722656, 0.1851806640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 7.0, 5.0, 2.0, 11.0, 11.0, 10.0, 14.0, 15.0, 21.0, 30.0, 55.0, 48.0, 64.0, 87.0, 108.0, 177.0, 267.0, 580.0, 1453.0, 4693.0, 19233.0, 130061.0, 667440.0, 189855.0, 25072.0, 5812.0, 1739.0, 614.0, 347.0, 201.0, 126.0, 91.0, 83.0, 39.0, 45.0, 35.0, 26.0, 14.0, 14.0, 18.0, 9.0, 4.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.447998046875, -0.4350433349609375, -0.422088623046875, -0.4091339111328125, -0.39617919921875, -0.3832244873046875, -0.370269775390625, -0.3573150634765625, -0.3443603515625, -0.3314056396484375, -0.318450927734375, -0.3054962158203125, -0.29254150390625, -0.2795867919921875, -0.266632080078125, -0.2536773681640625, -0.24072265625, -0.2277679443359375, -0.214813232421875, -0.2018585205078125, -0.18890380859375, -0.1759490966796875, -0.162994384765625, -0.1500396728515625, -0.1370849609375, -0.1241302490234375, -0.111175537109375, -0.0982208251953125, -0.08526611328125, -0.0723114013671875, -0.059356689453125, -0.0464019775390625, -0.033447265625, -0.0204925537109375, -0.007537841796875, 0.0054168701171875, 0.01837158203125, 0.0313262939453125, 0.044281005859375, 0.0572357177734375, 0.0701904296875, 0.0831451416015625, 0.096099853515625, 0.1090545654296875, 0.12200927734375, 0.1349639892578125, 0.147918701171875, 0.1608734130859375, 0.173828125, 0.1867828369140625, 0.199737548828125, 0.2126922607421875, 0.22564697265625, 0.2386016845703125, 0.251556396484375, 0.2645111083984375, 0.2774658203125, 0.2904205322265625, 0.303375244140625, 0.3163299560546875, 0.32928466796875, 0.3422393798828125, 0.355194091796875, 0.3681488037109375, 0.381103515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 5.0, 18.0, 17.0, 14.0, 22.0, 24.0, 29.0, 28.0, 32.0, 46.0, 52.0, 45.0, 41.0, 42.0, 55.0, 47.0, 50.0, 52.0, 44.0, 42.0, 38.0, 39.0, 36.0, 36.0, 16.0, 16.0, 16.0, 12.0, 8.0, 11.0, 5.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.14111328125, -0.13638687133789062, -0.13166046142578125, -0.12693405151367188, -0.1222076416015625, -0.11748123168945312, -0.11275482177734375, -0.10802841186523438, -0.103302001953125, -0.09857559204101562, -0.09384918212890625, -0.08912277221679688, -0.0843963623046875, -0.07966995239257812, -0.07494354248046875, -0.07021713256835938, -0.06549072265625, -0.060764312744140625, -0.05603790283203125, -0.051311492919921875, -0.0465850830078125, -0.041858673095703125, -0.03713226318359375, -0.032405853271484375, -0.027679443359375, -0.022953033447265625, -0.01822662353515625, -0.013500213623046875, -0.0087738037109375, -0.004047393798828125, 0.00067901611328125, 0.005405426025390625, 0.0101318359375, 0.014858245849609375, 0.01958465576171875, 0.024311065673828125, 0.0290374755859375, 0.033763885498046875, 0.03849029541015625, 0.043216705322265625, 0.047943115234375, 0.052669525146484375, 0.05739593505859375, 0.062122344970703125, 0.0668487548828125, 0.07157516479492188, 0.07630157470703125, 0.08102798461914062, 0.08575439453125, 0.09048080444335938, 0.09520721435546875, 0.09993362426757812, 0.1046600341796875, 0.10938644409179688, 0.11411285400390625, 0.11883926391601562, 0.123565673828125, 0.12829208374023438, 0.13301849365234375, 0.13774490356445312, 0.1424713134765625, 0.14719772338867188, 0.15192413330078125, 0.15665054321289062, 0.161376953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 9.0, 7.0, 6.0, 9.0, 15.0, 23.0, 33.0, 41.0, 63.0, 99.0, 137.0, 174.0, 301.0, 422.0, 664.0, 1098.0, 1791.0, 3217.0, 5830.0, 12057.0, 31040.0, 121802.0, 478653.0, 290933.0, 61233.0, 19482.0, 8559.0, 4406.0, 2479.0, 1490.0, 888.0, 504.0, 376.0, 244.0, 128.0, 84.0, 81.0, 41.0, 40.0, 29.0, 16.0, 10.0, 9.0, 9.0, 14.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.1444091796875, -0.1395587921142578, -0.13470840454101562, -0.12985801696777344, -0.12500762939453125, -0.12015724182128906, -0.11530685424804688, -0.11045646667480469, -0.1056060791015625, -0.10075569152832031, -0.09590530395507812, -0.09105491638183594, -0.08620452880859375, -0.08135414123535156, -0.07650375366210938, -0.07165336608886719, -0.066802978515625, -0.06195259094238281, -0.057102203369140625, -0.05225181579589844, -0.04740142822265625, -0.04255104064941406, -0.037700653076171875, -0.03285026550292969, -0.0279998779296875, -0.023149490356445312, -0.018299102783203125, -0.013448715209960938, -0.00859832763671875, -0.0037479400634765625, 0.001102447509765625, 0.0059528350830078125, 0.01080322265625, 0.015653610229492188, 0.020503997802734375, 0.025354385375976562, 0.03020477294921875, 0.03505516052246094, 0.039905548095703125, 0.04475593566894531, 0.0496063232421875, 0.05445671081542969, 0.059307098388671875, 0.06415748596191406, 0.06900787353515625, 0.07385826110839844, 0.07870864868164062, 0.08355903625488281, 0.088409423828125, 0.09325981140136719, 0.09811019897460938, 0.10296058654785156, 0.10781097412109375, 0.11266136169433594, 0.11751174926757812, 0.12236213684082031, 0.1272125244140625, 0.1320629119873047, 0.13691329956054688, 0.14176368713378906, 0.14661407470703125, 0.15146446228027344, 0.15631484985351562, 0.1611652374267578, 0.166015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 12.0, 13.0, 20.0, 40.0, 78.0, 142.0, 215.0, 219.0, 131.0, 55.0, 23.0, 15.0, 11.0, 9.0, 1.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.713369369506836e-05, -3.606826066970825e-05, -3.5002827644348145e-05, -3.393739461898804e-05, -3.287196159362793e-05, -3.180652856826782e-05, -3.0741095542907715e-05, -2.9675662517547607e-05, -2.86102294921875e-05, -2.7544796466827393e-05, -2.6479363441467285e-05, -2.5413930416107178e-05, -2.434849739074707e-05, -2.3283064365386963e-05, -2.2217631340026855e-05, -2.1152198314666748e-05, -2.008676528930664e-05, -1.9021332263946533e-05, -1.7955899238586426e-05, -1.689046621322632e-05, -1.582503318786621e-05, -1.4759600162506104e-05, -1.3694167137145996e-05, -1.2628734111785889e-05, -1.1563301086425781e-05, -1.0497868061065674e-05, -9.432435035705566e-06, -8.367002010345459e-06, -7.3015689849853516e-06, -6.236135959625244e-06, -5.170702934265137e-06, -4.105269908905029e-06, -3.039836883544922e-06, -1.9744038581848145e-06, -9.08970832824707e-07, 1.564621925354004e-07, 1.2218952178955078e-06, 2.2873282432556152e-06, 3.3527612686157227e-06, 4.41819429397583e-06, 5.4836273193359375e-06, 6.549060344696045e-06, 7.614493370056152e-06, 8.67992639541626e-06, 9.745359420776367e-06, 1.0810792446136475e-05, 1.1876225471496582e-05, 1.294165849685669e-05, 1.4007091522216797e-05, 1.5072524547576904e-05, 1.6137957572937012e-05, 1.720339059829712e-05, 1.8268823623657227e-05, 1.9334256649017334e-05, 2.039968967437744e-05, 2.146512269973755e-05, 2.2530555725097656e-05, 2.3595988750457764e-05, 2.466142177581787e-05, 2.572685480117798e-05, 2.6792287826538086e-05, 2.7857720851898193e-05, 2.89231538772583e-05, 2.9988586902618408e-05, 3.1054019927978516e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 10.0, 7.0, 14.0, 13.0, 20.0, 32.0, 39.0, 78.0, 96.0, 174.0, 306.0, 591.0, 1506.0, 4144.0, 16810.0, 118648.0, 670849.0, 201692.0, 24309.0, 5645.0, 1888.0, 749.0, 383.0, 191.0, 118.0, 66.0, 49.0, 32.0, 28.0, 16.0, 9.0, 11.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1845703125, -0.1785411834716797, -0.17251205444335938, -0.16648292541503906, -0.16045379638671875, -0.15442466735839844, -0.14839553833007812, -0.1423664093017578, -0.1363372802734375, -0.1303081512451172, -0.12427902221679688, -0.11824989318847656, -0.11222076416015625, -0.10619163513183594, -0.10016250610351562, -0.09413337707519531, -0.088104248046875, -0.08207511901855469, -0.07604598999023438, -0.07001686096191406, -0.06398773193359375, -0.05795860290527344, -0.051929473876953125, -0.04590034484863281, -0.0398712158203125, -0.03384208679199219, -0.027812957763671875, -0.021783828735351562, -0.01575469970703125, -0.009725570678710938, -0.003696441650390625, 0.0023326873779296875, 0.00836181640625, 0.014390945434570312, 0.020420074462890625, 0.026449203491210938, 0.03247833251953125, 0.03850746154785156, 0.044536590576171875, 0.05056571960449219, 0.0565948486328125, 0.06262397766113281, 0.06865310668945312, 0.07468223571777344, 0.08071136474609375, 0.08674049377441406, 0.09276962280273438, 0.09879875183105469, 0.104827880859375, 0.11085700988769531, 0.11688613891601562, 0.12291526794433594, 0.12894439697265625, 0.13497352600097656, 0.14100265502929688, 0.1470317840576172, 0.1530609130859375, 0.1590900421142578, 0.16511917114257812, 0.17114830017089844, 0.17717742919921875, 0.18320655822753906, 0.18923568725585938, 0.1952648162841797, 0.2012939453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 6.0, 7.0, 14.0, 20.0, 12.0, 21.0, 33.0, 35.0, 56.0, 42.0, 54.0, 69.0, 71.0, 76.0, 80.0, 73.0, 76.0, 40.0, 44.0, 37.0, 27.0, 18.0, 18.0, 13.0, 6.0, 7.0, 5.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06829833984375, -0.06624031066894531, -0.06418228149414062, -0.06212425231933594, -0.06006622314453125, -0.05800819396972656, -0.055950164794921875, -0.05389213562011719, -0.0518341064453125, -0.04977607727050781, -0.047718048095703125, -0.04566001892089844, -0.04360198974609375, -0.04154396057128906, -0.039485931396484375, -0.03742790222167969, -0.035369873046875, -0.03331184387207031, -0.031253814697265625, -0.029195785522460938, -0.02713775634765625, -0.025079727172851562, -0.023021697998046875, -0.020963668823242188, -0.0189056396484375, -0.016847610473632812, -0.014789581298828125, -0.012731552124023438, -0.01067352294921875, -0.008615493774414062, -0.006557464599609375, -0.0044994354248046875, -0.00244140625, -0.0003833770751953125, 0.001674652099609375, 0.0037326812744140625, 0.00579071044921875, 0.007848739624023438, 0.009906768798828125, 0.011964797973632812, 0.0140228271484375, 0.016080856323242188, 0.018138885498046875, 0.020196914672851562, 0.02225494384765625, 0.024312973022460938, 0.026371002197265625, 0.028429031372070312, 0.030487060546875, 0.03254508972167969, 0.034603118896484375, 0.03666114807128906, 0.03871917724609375, 0.04077720642089844, 0.042835235595703125, 0.04489326477050781, 0.0469512939453125, 0.04900932312011719, 0.051067352294921875, 0.05312538146972656, 0.05518341064453125, 0.05724143981933594, 0.059299468994140625, 0.06135749816894531, 0.06341552734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 30.0, 91.0, 225.0, 288.0, 203.0, 98.0, 29.0, 17.0, 7.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.949930191040039, -1.9041064977645874, -1.8582826852798462, -1.8124589920043945, -1.7666351795196533, -1.7208114862442017, -1.67498779296875, -1.6291639804840088, -1.5833401679992676, -1.537516474723816, -1.4916926622390747, -1.445868968963623, -1.4000451564788818, -1.3542214632034302, -1.3083977699279785, -1.2625739574432373, -1.2167502641677856, -1.170926570892334, -1.1251027584075928, -1.0792790651321411, -1.0334552526474, -0.9876315593719482, -0.9418078064918518, -0.8959840536117554, -0.8501603007316589, -0.8043365478515625, -0.7585127949714661, -0.7126890420913696, -0.666865348815918, -0.6210415363311768, -0.5752178430557251, -0.5293940901756287, -0.48357027769088745, -0.437746524810791, -0.3919227719306946, -0.34609904885292053, -0.3002752959728241, -0.25445154309272766, -0.2086278200149536, -0.16280406713485718, -0.11698031425476074, -0.0711565688252449, -0.025332823395729065, 0.020490914583206177, 0.06631466746330261, 0.11213842034339905, 0.1579621434211731, 0.20378589630126953, 0.24960964918136597, 0.2954334020614624, 0.34125715494155884, 0.3870808780193329, 0.4329046308994293, 0.47872838377952576, 0.5245521068572998, 0.5703758597373962, 0.6161996126174927, 0.6620233654975891, 0.7078471183776855, 0.7536708116531372, 0.7994946241378784, 0.8453183174133301, 0.8911420702934265, 0.936965823173523, 0.9827895760536194]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 12.0, 9.0, 14.0, 12.0, 16.0, 21.0, 25.0, 28.0, 41.0, 33.0, 40.0, 36.0, 53.0, 57.0, 51.0, 47.0, 60.0, 43.0, 50.0, 42.0, 51.0, 48.0, 37.0, 31.0, 29.0, 24.0, 24.0, 14.0, 16.0, 10.0, 8.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46683305501937866, -0.4494871497154236, -0.4321412742137909, -0.4147953689098358, -0.3974494934082031, -0.38010358810424805, -0.36275768280029297, -0.3454118072986603, -0.3280659317970276, -0.3107200264930725, -0.2933741509914398, -0.27602824568748474, -0.25868237018585205, -0.24133646488189697, -0.2239905744791031, -0.2066446840763092, -0.18929877877235413, -0.17195288836956024, -0.15460699796676636, -0.13726109266281128, -0.11991520971059799, -0.10256931930780411, -0.08522342145442963, -0.06787753105163574, -0.05053164064884186, -0.033185750246047974, -0.01583985611796379, 0.0015060380101203918, 0.018851928412914276, 0.03619781881570816, 0.05354371666908264, 0.07088960707187653, 0.08823549747467041, 0.1055813878774643, 0.12292727828025818, 0.14027318358421326, 0.15761905908584595, 0.17496496438980103, 0.1923108547925949, 0.2096567451953888, 0.22700263559818268, 0.24434852600097656, 0.26169443130493164, 0.27904030680656433, 0.2963862121105194, 0.3137320876121521, 0.3310779929161072, 0.34842389822006226, 0.36576977372169495, 0.38311567902565, 0.4004615545272827, 0.4178074598312378, 0.4351533353328705, 0.45249924063682556, 0.46984511613845825, 0.48719102144241333, 0.5045369267463684, 0.5218828320503235, 0.5392287373542786, 0.5565745830535889, 0.573920488357544, 0.591266393661499, 0.6086122989654541, 0.6259582042694092, 0.6433040499687195]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 7.0, 11.0, 19.0, 32.0, 48.0, 114.0, 201.0, 434.0, 1074.0, 3338.0, 8619.0, 32320.0, 686462.0, 3356012.0, 89788.0, 10549.0, 2668.0, 990.0, 542.0, 350.0, 182.0, 128.0, 96.0, 69.0, 52.0, 38.0, 34.0, 18.0, 11.0, 15.0, 13.0, 5.0, 6.0, 9.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.1614990234375, -0.1548328399658203, -0.14816665649414062, -0.14150047302246094, -0.13483428955078125, -0.12816810607910156, -0.12150192260742188, -0.11483573913574219, -0.1081695556640625, -0.10150337219238281, -0.09483718872070312, -0.08817100524902344, -0.08150482177734375, -0.07483863830566406, -0.06817245483398438, -0.06150627136230469, -0.054840087890625, -0.04817390441894531, -0.041507720947265625, -0.03484153747558594, -0.02817535400390625, -0.021509170532226562, -0.014842987060546875, -0.008176803588867188, -0.0015106201171875, 0.0051555633544921875, 0.011821746826171875, 0.018487930297851562, 0.02515411376953125, 0.03182029724121094, 0.038486480712890625, 0.04515266418457031, 0.05181884765625, 0.05848503112792969, 0.06515121459960938, 0.07181739807128906, 0.07848358154296875, 0.08514976501464844, 0.09181594848632812, 0.09848213195800781, 0.1051483154296875, 0.11181449890136719, 0.11848068237304688, 0.12514686584472656, 0.13181304931640625, 0.13847923278808594, 0.14514541625976562, 0.1518115997314453, 0.158477783203125, 0.1651439666748047, 0.17181015014648438, 0.17847633361816406, 0.18514251708984375, 0.19180870056152344, 0.19847488403320312, 0.2051410675048828, 0.2118072509765625, 0.2184734344482422, 0.22513961791992188, 0.23180580139160156, 0.23847198486328125, 0.24513816833496094, 0.2518043518066406, 0.2584705352783203, 0.26513671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 20.0, 5.0, 31.0, 33.0, 44.0, 103.0, 148.0, 164.0, 174.0, 99.0, 69.0, 39.0, 21.0, 18.0, 8.0, 7.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1083984375, -0.10380744934082031, -0.09921646118164062, -0.09462547302246094, -0.09003448486328125, -0.08544349670410156, -0.08085250854492188, -0.07626152038574219, -0.0716705322265625, -0.06707954406738281, -0.062488555908203125, -0.05789756774902344, -0.05330657958984375, -0.04871559143066406, -0.044124603271484375, -0.03953361511230469, -0.034942626953125, -0.030351638793945312, -0.025760650634765625, -0.021169662475585938, -0.01657867431640625, -0.011987686157226562, -0.007396697998046875, -0.0028057098388671875, 0.0017852783203125, 0.0063762664794921875, 0.010967254638671875, 0.015558242797851562, 0.02014923095703125, 0.024740219116210938, 0.029331207275390625, 0.03392219543457031, 0.03851318359375, 0.04310417175292969, 0.047695159912109375, 0.05228614807128906, 0.05687713623046875, 0.06146812438964844, 0.06605911254882812, 0.07065010070800781, 0.0752410888671875, 0.07983207702636719, 0.08442306518554688, 0.08901405334472656, 0.09360504150390625, 0.09819602966308594, 0.10278701782226562, 0.10737800598144531, 0.111968994140625, 0.11655998229980469, 0.12115097045898438, 0.12574195861816406, 0.13033294677734375, 0.13492393493652344, 0.13951492309570312, 0.1441059112548828, 0.1486968994140625, 0.1532878875732422, 0.15787887573242188, 0.16246986389160156, 0.16706085205078125, 0.17165184020996094, 0.17624282836914062, 0.1808338165283203, 0.1854248046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 9.0, 22.0, 15.0, 50.0, 41.0, 80.0, 127.0, 198.0, 339.0, 659.0, 1361.0, 3634.0, 12804.0, 64373.0, 485962.0, 2799461.0, 713415.0, 87696.0, 16391.0, 4299.0, 1605.0, 754.0, 358.0, 204.0, 145.0, 86.0, 50.0, 32.0, 34.0, 12.0, 12.0, 11.0, 9.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13652992248535156, -0.13158035278320312, -0.1266307830810547, -0.12168121337890625, -0.11673164367675781, -0.11178207397460938, -0.10683250427246094, -0.1018829345703125, -0.09693336486816406, -0.09198379516601562, -0.08703422546386719, -0.08208465576171875, -0.07713508605957031, -0.07218551635742188, -0.06723594665527344, -0.062286376953125, -0.05733680725097656, -0.052387237548828125, -0.04743766784667969, -0.04248809814453125, -0.03753852844238281, -0.032588958740234375, -0.027639389038085938, -0.0226898193359375, -0.017740249633789062, -0.012790679931640625, -0.007841110229492188, -0.00289154052734375, 0.0020580291748046875, 0.007007598876953125, 0.011957168579101562, 0.01690673828125, 0.021856307983398438, 0.026805877685546875, 0.03175544738769531, 0.03670501708984375, 0.04165458679199219, 0.046604156494140625, 0.05155372619628906, 0.0565032958984375, 0.06145286560058594, 0.06640243530273438, 0.07135200500488281, 0.07630157470703125, 0.08125114440917969, 0.08620071411132812, 0.09115028381347656, 0.096099853515625, 0.10104942321777344, 0.10599899291992188, 0.11094856262207031, 0.11589813232421875, 0.12084770202636719, 0.12579727172851562, 0.13074684143066406, 0.1356964111328125, 0.14064598083496094, 0.14559555053710938, 0.1505451202392578, 0.15549468994140625, 0.1604442596435547, 0.16539382934570312, 0.17034339904785156, 0.17529296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 12.0, 5.0, 14.0, 12.0, 22.0, 49.0, 43.0, 80.0, 111.0, 134.0, 161.0, 251.0, 304.0, 396.0, 424.0, 461.0, 406.0, 299.0, 215.0, 155.0, 138.0, 109.0, 56.0, 46.0, 38.0, 29.0, 21.0, 24.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.1123046875, -0.10935401916503906, -0.10640335083007812, -0.10345268249511719, -0.10050201416015625, -0.09755134582519531, -0.09460067749023438, -0.09165000915527344, -0.0886993408203125, -0.08574867248535156, -0.08279800415039062, -0.07984733581542969, -0.07689666748046875, -0.07394599914550781, -0.07099533081054688, -0.06804466247558594, -0.065093994140625, -0.06214332580566406, -0.059192657470703125, -0.05624198913574219, -0.05329132080078125, -0.05034065246582031, -0.047389984130859375, -0.04443931579589844, -0.0414886474609375, -0.03853797912597656, -0.035587310791015625, -0.03263664245605469, -0.02968597412109375, -0.026735305786132812, -0.023784637451171875, -0.020833969116210938, -0.01788330078125, -0.014932632446289062, -0.011981964111328125, -0.009031295776367188, -0.00608062744140625, -0.0031299591064453125, -0.000179290771484375, 0.0027713775634765625, 0.0057220458984375, 0.008672714233398438, 0.011623382568359375, 0.014574050903320312, 0.01752471923828125, 0.020475387573242188, 0.023426055908203125, 0.026376724243164062, 0.029327392578125, 0.03227806091308594, 0.035228729248046875, 0.03817939758300781, 0.04113006591796875, 0.04408073425292969, 0.047031402587890625, 0.04998207092285156, 0.0529327392578125, 0.05588340759277344, 0.058834075927734375, 0.06178474426269531, 0.06473541259765625, 0.06768608093261719, 0.07063674926757812, 0.07358741760253906, 0.0765380859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 23.0, 52.0, 147.0, 253.0, 249.0, 147.0, 65.0, 42.0, 13.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4258193373680115, -0.393331378698349, -0.36084339022636414, -0.32835543155670166, -0.2958674430847168, -0.2633794844150543, -0.23089152574539185, -0.19840355217456818, -0.1659155786037445, -0.13342760503292084, -0.10093963891267776, -0.06845167279243469, -0.03596369922161102, -0.0034757256507873535, 0.029012233018875122, 0.06150020658969879, 0.09398818016052246, 0.12647615373134613, 0.1589641273021698, 0.19145208597183228, 0.22394005954265594, 0.2564280331134796, 0.2889159917831421, 0.32140398025512695, 0.35389193892478943, 0.3863798975944519, 0.41886788606643677, 0.45135584473609924, 0.4838438034057617, 0.5163317918777466, 0.5488197803497314, 0.5813077092170715, 0.6137956380844116, 0.6462836265563965, 0.6787715554237366, 0.7112595438957214, 0.7437475323677063, 0.7762354612350464, 0.8087234497070312, 0.8412114381790161, 0.873699426651001, 0.9061874151229858, 0.9386753439903259, 0.9711633324623108, 1.0036512613296509, 1.0361392498016357, 1.0686272382736206, 1.1011152267456055, 1.1336030960083008, 1.1660910844802856, 1.1985790729522705, 1.2310669422149658, 1.2635549306869507, 1.2960429191589355, 1.3285309076309204, 1.3610188961029053, 1.3935068845748901, 1.425994873046875, 1.4584828615188599, 1.4909708499908447, 1.52345871925354, 1.555946707725525, 1.5884346961975098, 1.6209226846694946, 1.6534106731414795]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 11.0, 8.0, 13.0, 14.0, 14.0, 16.0, 23.0, 25.0, 26.0, 40.0, 33.0, 29.0, 41.0, 33.0, 45.0, 45.0, 60.0, 48.0, 44.0, 34.0, 43.0, 32.0, 39.0, 33.0, 31.0, 24.0, 31.0, 21.0, 18.0, 16.0, 18.0, 12.0, 16.0, 15.0, 6.0, 10.0, 7.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31851905584335327, -0.30708131194114685, -0.29564356803894043, -0.284205824136734, -0.2727680802345276, -0.26133033633232117, -0.24989260733127594, -0.23845486342906952, -0.2270171195268631, -0.21557937562465668, -0.20414163172245026, -0.19270390272140503, -0.1812661588191986, -0.1698284149169922, -0.15839067101478577, -0.14695292711257935, -0.13551518321037292, -0.1240774393081665, -0.11263969540596008, -0.10120195895433426, -0.08976421505212784, -0.07832647114992142, -0.0668887346982956, -0.05545099079608917, -0.04401324689388275, -0.03257550299167633, -0.021137762814760208, -0.009700022637844086, 0.0017377212643623352, 0.013175465166568756, 0.02461320161819458, 0.036050945520401, 0.04748868942260742, 0.05892643332481384, 0.07036417722702026, 0.08180191367864609, 0.09323965758085251, 0.10467740148305893, 0.11611513793468475, 0.12755288183689117, 0.1389906257390976, 0.15042836964130402, 0.16186611354351044, 0.17330384254455566, 0.18474158644676208, 0.1961793303489685, 0.20761707425117493, 0.21905481815338135, 0.23049256205558777, 0.2419303059577942, 0.2533680498600006, 0.26480579376220703, 0.27624353766441345, 0.2876812815666199, 0.2991189956665039, 0.3105567693710327, 0.32199448347091675, 0.33343222737312317, 0.3448699712753296, 0.356307715177536, 0.36774545907974243, 0.37918320298194885, 0.3906209468841553, 0.4020586609840393, 0.4134964346885681]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 4.0, 9.0, 10.0, 8.0, 23.0, 14.0, 26.0, 43.0, 66.0, 80.0, 125.0, 211.0, 361.0, 665.0, 1801.0, 6431.0, 42057.0, 555519.0, 401795.0, 30946.0, 5328.0, 1447.0, 589.0, 349.0, 192.0, 134.0, 92.0, 56.0, 56.0, 34.0, 19.0, 11.0, 14.0, 13.0, 7.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.49462127685546875, -0.4775238037109375, -0.46042633056640625, -0.443328857421875, -0.42623138427734375, -0.4091339111328125, -0.39203643798828125, -0.37493896484375, -0.35784149169921875, -0.3407440185546875, -0.32364654541015625, -0.306549072265625, -0.28945159912109375, -0.2723541259765625, -0.25525665283203125, -0.2381591796875, -0.22106170654296875, -0.2039642333984375, -0.18686676025390625, -0.169769287109375, -0.15267181396484375, -0.1355743408203125, -0.11847686767578125, -0.10137939453125, -0.08428192138671875, -0.0671844482421875, -0.05008697509765625, -0.032989501953125, -0.01589202880859375, 0.0012054443359375, 0.01830291748046875, 0.035400390625, 0.05249786376953125, 0.0695953369140625, 0.08669281005859375, 0.103790283203125, 0.12088775634765625, 0.1379852294921875, 0.15508270263671875, 0.17218017578125, 0.18927764892578125, 0.2063751220703125, 0.22347259521484375, 0.240570068359375, 0.25766754150390625, 0.2747650146484375, 0.29186248779296875, 0.3089599609375, 0.32605743408203125, 0.3431549072265625, 0.36025238037109375, 0.377349853515625, 0.39444732666015625, 0.4115447998046875, 0.42864227294921875, 0.44573974609375, 0.46283721923828125, 0.4799346923828125, 0.49703216552734375, 0.514129638671875, 0.5312271118164062, 0.5483245849609375, 0.5654220581054688, 0.58251953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 10.0, 12.0, 13.0, 21.0, 37.0, 55.0, 112.0, 126.0, 202.0, 155.0, 99.0, 72.0, 39.0, 20.0, 12.0, 6.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10528564453125, -0.10060787200927734, -0.09593009948730469, -0.09125232696533203, -0.08657455444335938, -0.08189678192138672, -0.07721900939941406, -0.0725412368774414, -0.06786346435546875, -0.0631856918334961, -0.05850791931152344, -0.05383014678955078, -0.049152374267578125, -0.04447460174560547, -0.03979682922363281, -0.035119056701660156, -0.0304412841796875, -0.025763511657714844, -0.021085739135742188, -0.01640796661376953, -0.011730194091796875, -0.007052421569824219, -0.0023746490478515625, 0.0023031234741210938, 0.00698089599609375, 0.011658668518066406, 0.016336441040039062, 0.02101421356201172, 0.025691986083984375, 0.03036975860595703, 0.03504753112792969, 0.039725303649902344, 0.044403076171875, 0.049080848693847656, 0.05375862121582031, 0.05843639373779297, 0.06311416625976562, 0.06779193878173828, 0.07246971130371094, 0.0771474838256836, 0.08182525634765625, 0.0865030288696289, 0.09118080139160156, 0.09585857391357422, 0.10053634643554688, 0.10521411895751953, 0.10989189147949219, 0.11456966400146484, 0.1192474365234375, 0.12392520904541016, 0.1286029815673828, 0.13328075408935547, 0.13795852661132812, 0.14263629913330078, 0.14731407165527344, 0.1519918441772461, 0.15666961669921875, 0.1613473892211914, 0.16602516174316406, 0.17070293426513672, 0.17538070678710938, 0.18005847930908203, 0.1847362518310547, 0.18941402435302734, 0.194091796875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 8.0, 5.0, 11.0, 19.0, 12.0, 21.0, 35.0, 62.0, 59.0, 163.0, 284.0, 807.0, 2726.0, 12499.0, 78452.0, 454383.0, 414094.0, 69446.0, 11419.0, 2416.0, 813.0, 365.0, 144.0, 96.0, 57.0, 50.0, 19.0, 18.0, 16.0, 9.0, 10.0, 7.0, 6.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.467041015625, -0.45195770263671875, -0.4368743896484375, -0.42179107666015625, -0.406707763671875, -0.39162445068359375, -0.3765411376953125, -0.36145782470703125, -0.34637451171875, -0.33129119873046875, -0.3162078857421875, -0.30112457275390625, -0.286041259765625, -0.27095794677734375, -0.2558746337890625, -0.24079132080078125, -0.2257080078125, -0.21062469482421875, -0.1955413818359375, -0.18045806884765625, -0.165374755859375, -0.15029144287109375, -0.1352081298828125, -0.12012481689453125, -0.10504150390625, -0.08995819091796875, -0.0748748779296875, -0.05979156494140625, -0.044708251953125, -0.02962493896484375, -0.0145416259765625, 0.00054168701171875, 0.015625, 0.03070831298828125, 0.0457916259765625, 0.06087493896484375, 0.075958251953125, 0.09104156494140625, 0.1061248779296875, 0.12120819091796875, 0.13629150390625, 0.15137481689453125, 0.1664581298828125, 0.18154144287109375, 0.196624755859375, 0.21170806884765625, 0.2267913818359375, 0.24187469482421875, 0.2569580078125, 0.27204132080078125, 0.2871246337890625, 0.30220794677734375, 0.317291259765625, 0.33237457275390625, 0.3474578857421875, 0.36254119873046875, 0.37762451171875, 0.39270782470703125, 0.4077911376953125, 0.42287445068359375, 0.437957763671875, 0.45304107666015625, 0.4681243896484375, 0.48320770263671875, 0.498291015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 6.0, 11.0, 14.0, 23.0, 21.0, 28.0, 29.0, 29.0, 30.0, 38.0, 60.0, 38.0, 56.0, 57.0, 43.0, 61.0, 42.0, 63.0, 56.0, 50.0, 43.0, 40.0, 32.0, 29.0, 17.0, 13.0, 10.0, 7.0, 5.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2274169921875, -0.2210540771484375, -0.214691162109375, -0.2083282470703125, -0.20196533203125, -0.1956024169921875, -0.189239501953125, -0.1828765869140625, -0.176513671875, -0.1701507568359375, -0.163787841796875, -0.1574249267578125, -0.15106201171875, -0.1446990966796875, -0.138336181640625, -0.1319732666015625, -0.1256103515625, -0.1192474365234375, -0.112884521484375, -0.1065216064453125, -0.10015869140625, -0.0937957763671875, -0.087432861328125, -0.0810699462890625, -0.07470703125, -0.0683441162109375, -0.061981201171875, -0.0556182861328125, -0.04925537109375, -0.0428924560546875, -0.036529541015625, -0.0301666259765625, -0.0238037109375, -0.0174407958984375, -0.011077880859375, -0.0047149658203125, 0.00164794921875, 0.0080108642578125, 0.014373779296875, 0.0207366943359375, 0.027099609375, 0.0334625244140625, 0.039825439453125, 0.0461883544921875, 0.05255126953125, 0.0589141845703125, 0.065277099609375, 0.0716400146484375, 0.0780029296875, 0.0843658447265625, 0.090728759765625, 0.0970916748046875, 0.10345458984375, 0.1098175048828125, 0.116180419921875, 0.1225433349609375, 0.12890625, 0.1352691650390625, 0.141632080078125, 0.1479949951171875, 0.15435791015625, 0.1607208251953125, 0.167083740234375, 0.1734466552734375, 0.1798095703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 6.0, 4.0, 10.0, 9.0, 11.0, 24.0, 46.0, 52.0, 77.0, 135.0, 154.0, 268.0, 432.0, 786.0, 1602.0, 3421.0, 8504.0, 25990.0, 100697.0, 374362.0, 383738.0, 105080.0, 27347.0, 8659.0, 3482.0, 1599.0, 808.0, 449.0, 292.0, 167.0, 126.0, 56.0, 52.0, 36.0, 24.0, 14.0, 11.0, 1.0, 8.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1605224609375, -0.15517425537109375, -0.1498260498046875, -0.14447784423828125, -0.139129638671875, -0.13378143310546875, -0.1284332275390625, -0.12308502197265625, -0.11773681640625, -0.11238861083984375, -0.1070404052734375, -0.10169219970703125, -0.096343994140625, -0.09099578857421875, -0.0856475830078125, -0.08029937744140625, -0.074951171875, -0.06960296630859375, -0.0642547607421875, -0.05890655517578125, -0.053558349609375, -0.04821014404296875, -0.0428619384765625, -0.03751373291015625, -0.03216552734375, -0.02681732177734375, -0.0214691162109375, -0.01612091064453125, -0.010772705078125, -0.00542449951171875, -7.62939453125e-05, 0.00527191162109375, 0.0106201171875, 0.01596832275390625, 0.0213165283203125, 0.02666473388671875, 0.032012939453125, 0.03736114501953125, 0.0427093505859375, 0.04805755615234375, 0.05340576171875, 0.05875396728515625, 0.0641021728515625, 0.06945037841796875, 0.074798583984375, 0.08014678955078125, 0.0854949951171875, 0.09084320068359375, 0.09619140625, 0.10153961181640625, 0.1068878173828125, 0.11223602294921875, 0.117584228515625, 0.12293243408203125, 0.1282806396484375, 0.13362884521484375, 0.13897705078125, 0.14432525634765625, 0.1496734619140625, 0.15502166748046875, 0.160369873046875, 0.16571807861328125, 0.1710662841796875, 0.17641448974609375, 0.1817626953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 9.0, 4.0, 11.0, 13.0, 20.0, 24.0, 29.0, 58.0, 85.0, 116.0, 166.0, 120.0, 98.0, 66.0, 54.0, 37.0, 29.0, 19.0, 13.0, 15.0, 4.0, 3.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.248453140258789e-05, -3.15522775053978e-05, -3.06200236082077e-05, -2.968776971101761e-05, -2.8755515813827515e-05, -2.782326191663742e-05, -2.6891008019447327e-05, -2.5958754122257233e-05, -2.502650022506714e-05, -2.4094246327877045e-05, -2.316199243068695e-05, -2.2229738533496857e-05, -2.1297484636306763e-05, -2.036523073911667e-05, -1.9432976841926575e-05, -1.850072294473648e-05, -1.7568469047546387e-05, -1.6636215150356293e-05, -1.57039612531662e-05, -1.4771707355976105e-05, -1.383945345878601e-05, -1.2907199561595917e-05, -1.1974945664405823e-05, -1.1042691767215729e-05, -1.0110437870025635e-05, -9.17818397283554e-06, -8.245930075645447e-06, -7.313676178455353e-06, -6.381422281265259e-06, -5.449168384075165e-06, -4.516914486885071e-06, -3.584660589694977e-06, -2.652406692504883e-06, -1.7201527953147888e-06, -7.878988981246948e-07, 1.4435499906539917e-07, 1.0766088962554932e-06, 2.008862793445587e-06, 2.941116690635681e-06, 3.873370587825775e-06, 4.805624485015869e-06, 5.737878382205963e-06, 6.670132279396057e-06, 7.602386176586151e-06, 8.534640073776245e-06, 9.466893970966339e-06, 1.0399147868156433e-05, 1.1331401765346527e-05, 1.2263655662536621e-05, 1.3195909559726715e-05, 1.4128163456916809e-05, 1.5060417354106903e-05, 1.5992671251296997e-05, 1.692492514848709e-05, 1.7857179045677185e-05, 1.878943294286728e-05, 1.9721686840057373e-05, 2.0653940737247467e-05, 2.158619463443756e-05, 2.2518448531627655e-05, 2.345070242881775e-05, 2.4382956326007843e-05, 2.5315210223197937e-05, 2.624746412038803e-05, 2.7179718017578125e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 8.0, 8.0, 14.0, 15.0, 23.0, 32.0, 51.0, 84.0, 149.0, 328.0, 1174.0, 5718.0, 60304.0, 786295.0, 179703.0, 11739.0, 1875.0, 517.0, 204.0, 107.0, 57.0, 47.0, 23.0, 10.0, 16.0, 7.0, 10.0, 7.0, 7.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.390380859375, -0.3794364929199219, -0.36849212646484375, -0.3575477600097656, -0.3466033935546875, -0.3356590270996094, -0.32471466064453125, -0.3137702941894531, -0.302825927734375, -0.2918815612792969, -0.28093719482421875, -0.2699928283691406, -0.2590484619140625, -0.24810409545898438, -0.23715972900390625, -0.22621536254882812, -0.21527099609375, -0.20432662963867188, -0.19338226318359375, -0.18243789672851562, -0.1714935302734375, -0.16054916381835938, -0.14960479736328125, -0.13866043090820312, -0.127716064453125, -0.11677169799804688, -0.10582733154296875, -0.09488296508789062, -0.0839385986328125, -0.07299423217773438, -0.06204986572265625, -0.051105499267578125, -0.0401611328125, -0.029216766357421875, -0.01827239990234375, -0.007328033447265625, 0.0036163330078125, 0.014560699462890625, 0.02550506591796875, 0.036449432373046875, 0.047393798828125, 0.058338165283203125, 0.06928253173828125, 0.08022689819335938, 0.0911712646484375, 0.10211563110351562, 0.11305999755859375, 0.12400436401367188, 0.13494873046875, 0.14589309692382812, 0.15683746337890625, 0.16778182983398438, 0.1787261962890625, 0.18967056274414062, 0.20061492919921875, 0.21155929565429688, 0.222503662109375, 0.23344802856445312, 0.24439239501953125, 0.2553367614746094, 0.2662811279296875, 0.2772254943847656, 0.28816986083984375, 0.2991142272949219, 0.31005859375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 13.0, 13.0, 25.0, 25.0, 34.0, 53.0, 74.0, 110.0, 124.0, 125.0, 102.0, 76.0, 65.0, 52.0, 29.0, 21.0, 13.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13134765625, -0.1266918182373047, -0.12203598022460938, -0.11738014221191406, -0.11272430419921875, -0.10806846618652344, -0.10341262817382812, -0.09875679016113281, -0.0941009521484375, -0.08944511413574219, -0.08478927612304688, -0.08013343811035156, -0.07547760009765625, -0.07082176208496094, -0.06616592407226562, -0.06151008605957031, -0.056854248046875, -0.05219841003417969, -0.047542572021484375, -0.04288673400878906, -0.03823089599609375, -0.03357505798339844, -0.028919219970703125, -0.024263381958007812, -0.0196075439453125, -0.014951705932617188, -0.010295867919921875, -0.0056400299072265625, -0.00098419189453125, 0.0036716461181640625, 0.008327484130859375, 0.012983322143554688, 0.01763916015625, 0.022294998168945312, 0.026950836181640625, 0.03160667419433594, 0.03626251220703125, 0.04091835021972656, 0.045574188232421875, 0.05023002624511719, 0.0548858642578125, 0.05954170227050781, 0.06419754028320312, 0.06885337829589844, 0.07350921630859375, 0.07816505432128906, 0.08282089233398438, 0.08747673034667969, 0.092132568359375, 0.09678840637207031, 0.10144424438476562, 0.10610008239746094, 0.11075592041015625, 0.11541175842285156, 0.12006759643554688, 0.12472343444824219, 0.1293792724609375, 0.1340351104736328, 0.13869094848632812, 0.14334678649902344, 0.14800262451171875, 0.15265846252441406, 0.15731430053710938, 0.1619701385498047, 0.1666259765625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 11.0, 68.0, 278.0, 428.0, 179.0, 36.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.753924369812012, -4.651325702667236, -4.548727512359619, -4.446128845214844, -4.343530178070068, -4.240931510925293, -4.138333320617676, -4.0357346534729, -3.933135986328125, -3.8305375576019287, -3.7279388904571533, -3.625340461730957, -3.5227417945861816, -3.4201433658599854, -3.317544937133789, -3.2149462699890137, -3.1123478412628174, -3.009749412536621, -2.9071507453918457, -2.8045523166656494, -2.701953649520874, -2.5993552207946777, -2.4967565536499023, -2.394158124923706, -2.2915596961975098, -2.1889612674713135, -2.086362600326538, -1.9837641716003418, -1.8811655044555664, -1.7785670757293701, -1.6759685277938843, -1.5733699798583984, -1.4707715511322021, -1.3681730031967163, -1.2655744552612305, -1.1629760265350342, -1.0603773593902588, -0.9577788710594177, -0.8551803827285767, -0.7525818347930908, -0.649983286857605, -0.5473847389221191, -0.4447862207889557, -0.34218770265579224, -0.2395891547203064, -0.13699060678482056, -0.03439211845397949, 0.06820642948150635, 0.1708049774169922, 0.273403525352478, 0.3760020434856415, 0.47860056161880493, 0.5811991095542908, 0.6837976574897766, 0.7863961458206177, 0.8889946937561035, 0.9915932416915894, 1.0941917896270752, 1.196790337562561, 1.2993888854980469, 1.4019873142242432, 1.5045859813690186, 1.6071844100952148, 1.7097829580307007, 1.8123815059661865]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 2.0, 6.0, 14.0, 22.0, 25.0, 29.0, 32.0, 45.0, 55.0, 59.0, 67.0, 84.0, 71.0, 60.0, 66.0, 59.0, 56.0, 54.0, 39.0, 33.0, 27.0, 15.0, 23.0, 13.0, 8.0, 7.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8294411301612854, -0.7996581196784973, -0.7698750495910645, -0.7400920391082764, -0.7103090286254883, -0.6805259585380554, -0.6507429480552673, -0.6209598779678345, -0.5911768674850464, -0.5613938570022583, -0.5316107869148254, -0.5018277764320374, -0.4720447361469269, -0.4422616958618164, -0.4124786853790283, -0.38269564509391785, -0.3529126048088074, -0.3231295645236969, -0.2933465242385864, -0.26356351375579834, -0.23378047347068787, -0.2039974331855774, -0.1742144078016281, -0.14443138241767883, -0.11464834213256836, -0.08486530929803848, -0.055082276463508606, -0.02529924362897873, 0.0044837892055511475, 0.03426682949066162, 0.0640498548746109, 0.09383288025856018, 0.12361598014831543, 0.1533990204334259, 0.18318204581737518, 0.21296507120132446, 0.24274811148643494, 0.2725311517715454, 0.3023141622543335, 0.33209720253944397, 0.36188024282455444, 0.3916632831096649, 0.4214463233947754, 0.4512293338775635, 0.48101237416267395, 0.5107954144477844, 0.5405784249305725, 0.5703614950180054, 0.6001445055007935, 0.6299275159835815, 0.6597105860710144, 0.6894935965538025, 0.7192766666412354, 0.7490596771240234, 0.7788426876068115, 0.8086256980895996, 0.8384087681770325, 0.8681917786598206, 0.8979748487472534, 0.9277578592300415, 0.9575408697128296, 0.9873239398002625, 1.0171070098876953, 1.0468900203704834, 1.0766730308532715]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 12.0, 26.0, 51.0, 82.0, 168.0, 527.0, 3113.0, 31601.0, 3978354.0, 174098.0, 4535.0, 1035.0, 333.0, 169.0, 64.0, 44.0, 26.0, 10.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.2981986999511719, -0.28560638427734375, -0.2730140686035156, -0.2604217529296875, -0.24782943725585938, -0.23523712158203125, -0.22264480590820312, -0.210052490234375, -0.19746017456054688, -0.18486785888671875, -0.17227554321289062, -0.1596832275390625, -0.14709091186523438, -0.13449859619140625, -0.12190628051757812, -0.10931396484375, -0.09672164916992188, -0.08412933349609375, -0.07153701782226562, -0.0589447021484375, -0.046352386474609375, -0.03376007080078125, -0.021167755126953125, -0.008575439453125, 0.004016876220703125, 0.01660919189453125, 0.029201507568359375, 0.0417938232421875, 0.054386138916015625, 0.06697845458984375, 0.07957077026367188, 0.0921630859375, 0.10475540161132812, 0.11734771728515625, 0.12994003295898438, 0.1425323486328125, 0.15512466430664062, 0.16771697998046875, 0.18030929565429688, 0.192901611328125, 0.20549392700195312, 0.21808624267578125, 0.23067855834960938, 0.2432708740234375, 0.2558631896972656, 0.26845550537109375, 0.2810478210449219, 0.29364013671875, 0.3062324523925781, 0.31882476806640625, 0.3314170837402344, 0.3440093994140625, 0.3566017150878906, 0.36919403076171875, 0.3817863464355469, 0.394378662109375, 0.4069709777832031, 0.41956329345703125, 0.4321556091308594, 0.4447479248046875, 0.4573402404785156, 0.46993255615234375, 0.4825248718261719, 0.4951171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 12.0, 10.0, 17.0, 23.0, 32.0, 62.0, 93.0, 107.0, 137.0, 144.0, 123.0, 93.0, 52.0, 40.0, 27.0, 12.0, 6.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08856201171875, -0.08414745330810547, -0.07973289489746094, -0.0753183364868164, -0.07090377807617188, -0.06648921966552734, -0.06207466125488281, -0.05766010284423828, -0.05324554443359375, -0.04883098602294922, -0.04441642761230469, -0.040001869201660156, -0.035587310791015625, -0.031172752380371094, -0.026758193969726562, -0.02234363555908203, -0.0179290771484375, -0.013514518737792969, -0.009099960327148438, -0.004685401916503906, -0.000270843505859375, 0.004143714904785156, 0.008558273315429688, 0.012972831726074219, 0.01738739013671875, 0.02180194854736328, 0.026216506958007812, 0.030631065368652344, 0.035045623779296875, 0.039460182189941406, 0.04387474060058594, 0.04828929901123047, 0.052703857421875, 0.05711841583251953, 0.06153297424316406, 0.0659475326538086, 0.07036209106445312, 0.07477664947509766, 0.07919120788574219, 0.08360576629638672, 0.08802032470703125, 0.09243488311767578, 0.09684944152832031, 0.10126399993896484, 0.10567855834960938, 0.1100931167602539, 0.11450767517089844, 0.11892223358154297, 0.1233367919921875, 0.12775135040283203, 0.13216590881347656, 0.1365804672241211, 0.14099502563476562, 0.14540958404541016, 0.1498241424560547, 0.15423870086669922, 0.15865325927734375, 0.16306781768798828, 0.1674823760986328, 0.17189693450927734, 0.17631149291992188, 0.1807260513305664, 0.18514060974121094, 0.18955516815185547, 0.1939697265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 3.0, 8.0, 9.0, 11.0, 21.0, 30.0, 44.0, 60.0, 82.0, 112.0, 206.0, 377.0, 641.0, 1441.0, 3959.0, 14831.0, 81786.0, 714980.0, 2744558.0, 546899.0, 65702.0, 12191.0, 3436.0, 1285.0, 624.0, 350.0, 216.0, 112.0, 104.0, 59.0, 37.0, 30.0, 25.0, 14.0, 11.0, 6.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1483154296875, -0.14310073852539062, -0.13788604736328125, -0.13267135620117188, -0.1274566650390625, -0.12224197387695312, -0.11702728271484375, -0.11181259155273438, -0.106597900390625, -0.10138320922851562, -0.09616851806640625, -0.09095382690429688, -0.0857391357421875, -0.08052444458007812, -0.07530975341796875, -0.07009506225585938, -0.06488037109375, -0.059665679931640625, -0.05445098876953125, -0.049236297607421875, -0.0440216064453125, -0.038806915283203125, -0.03359222412109375, -0.028377532958984375, -0.023162841796875, -0.017948150634765625, -0.01273345947265625, -0.007518768310546875, -0.0023040771484375, 0.002910614013671875, 0.00812530517578125, 0.013339996337890625, 0.0185546875, 0.023769378662109375, 0.02898406982421875, 0.034198760986328125, 0.0394134521484375, 0.044628143310546875, 0.04984283447265625, 0.055057525634765625, 0.060272216796875, 0.06548690795898438, 0.07070159912109375, 0.07591629028320312, 0.0811309814453125, 0.08634567260742188, 0.09156036376953125, 0.09677505493164062, 0.10198974609375, 0.10720443725585938, 0.11241912841796875, 0.11763381958007812, 0.1228485107421875, 0.12806320190429688, 0.13327789306640625, 0.13849258422851562, 0.143707275390625, 0.14892196655273438, 0.15413665771484375, 0.15935134887695312, 0.1645660400390625, 0.16978073120117188, 0.17499542236328125, 0.18021011352539062, 0.1854248046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 10.0, 17.0, 21.0, 22.0, 38.0, 37.0, 55.0, 71.0, 93.0, 155.0, 181.0, 246.0, 280.0, 359.0, 403.0, 406.0, 403.0, 296.0, 228.0, 213.0, 142.0, 105.0, 76.0, 62.0, 41.0, 27.0, 19.0, 25.0, 11.0, 12.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11114501953125, -0.10807609558105469, -0.10500717163085938, -0.10193824768066406, -0.09886932373046875, -0.09580039978027344, -0.09273147583007812, -0.08966255187988281, -0.0865936279296875, -0.08352470397949219, -0.08045578002929688, -0.07738685607910156, -0.07431793212890625, -0.07124900817871094, -0.06818008422851562, -0.06511116027832031, -0.062042236328125, -0.05897331237792969, -0.055904388427734375, -0.05283546447753906, -0.04976654052734375, -0.04669761657714844, -0.043628692626953125, -0.04055976867675781, -0.0374908447265625, -0.03442192077636719, -0.031352996826171875, -0.028284072875976562, -0.02521514892578125, -0.022146224975585938, -0.019077301025390625, -0.016008377075195312, -0.012939453125, -0.009870529174804688, -0.006801605224609375, -0.0037326812744140625, -0.00066375732421875, 0.0024051666259765625, 0.005474090576171875, 0.008543014526367188, 0.0116119384765625, 0.014680862426757812, 0.017749786376953125, 0.020818710327148438, 0.02388763427734375, 0.026956558227539062, 0.030025482177734375, 0.03309440612792969, 0.036163330078125, 0.03923225402832031, 0.042301177978515625, 0.04537010192871094, 0.04843902587890625, 0.05150794982910156, 0.054576873779296875, 0.05764579772949219, 0.0607147216796875, 0.06378364562988281, 0.06685256958007812, 0.06992149353027344, 0.07299041748046875, 0.07605934143066406, 0.07912826538085938, 0.08219718933105469, 0.08526611328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 33.0, 131.0, 400.0, 327.0, 100.0, 13.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4440441131591797, -1.3808889389038086, -1.3177337646484375, -1.2545785903930664, -1.1914234161376953, -1.1282682418823242, -1.0651129484176636, -1.0019577741622925, -0.9388025999069214, -0.8756474256515503, -0.8124922513961792, -0.7493370175361633, -0.6861818432807922, -0.6230266690254211, -0.5598714351654053, -0.4967162609100342, -0.4335610866546631, -0.370405912399292, -0.3072507083415985, -0.24409551918506622, -0.18094033002853394, -0.11778515577316284, -0.05462995171546936, 0.008525252342224121, 0.07168042659759521, 0.1348356157541275, 0.1979908049106598, 0.26114600896835327, 0.32430118322372437, 0.38745635747909546, 0.45061156153678894, 0.5137667655944824, 0.5769219398498535, 0.6400771141052246, 0.7032322883605957, 0.7663875222206116, 0.8295426964759827, 0.8926978707313538, 0.9558531045913696, 1.0190082788467407, 1.0821634531021118, 1.145318627357483, 1.208473801612854, 1.271628975868225, 1.3347842693328857, 1.3979394435882568, 1.461094617843628, 1.524249792098999, 1.5874049663543701, 1.6505601406097412, 1.7137153148651123, 1.7768704891204834, 1.8400256633758545, 1.9031808376312256, 1.9663361310958862, 2.029491424560547, 2.092646598815918, 2.155801773071289, 2.21895694732666, 2.2821121215820312, 2.3452672958374023, 2.4084224700927734, 2.4715776443481445, 2.5347328186035156, 2.5978879928588867]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 6.0, 8.0, 10.0, 17.0, 22.0, 24.0, 26.0, 26.0, 25.0, 31.0, 35.0, 46.0, 40.0, 38.0, 35.0, 43.0, 50.0, 42.0, 40.0, 57.0, 46.0, 39.0, 28.0, 34.0, 25.0, 27.0, 30.0, 20.0, 17.0, 18.0, 14.0, 18.0, 8.0, 13.0, 8.0, 6.0, 8.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33290839195251465, -0.32202205061912537, -0.31113573908805847, -0.3002493977546692, -0.2893630862236023, -0.278476744890213, -0.26759040355682373, -0.25670409202575684, -0.24581775069236755, -0.23493142426013947, -0.22404509782791138, -0.2131587564945221, -0.202272430062294, -0.19138610363006592, -0.18049977719783783, -0.16961345076560974, -0.15872712433338165, -0.14784079790115356, -0.13695447146892548, -0.1260681450366974, -0.1151818037033081, -0.10429547727108002, -0.09340915083885193, -0.08252281695604324, -0.07163649052381516, -0.06075016036629677, -0.04986383020877838, -0.03897750377655029, -0.028091173619031906, -0.01720484346151352, -0.006318517029285431, 0.004567816853523254, 0.015454143285751343, 0.02634047344326973, 0.037226803600788116, 0.048113130033016205, 0.05899946019053459, 0.06988579034805298, 0.08077211678028107, 0.09165845066308975, 0.10254477709531784, 0.11343110352754593, 0.12431743741035461, 0.1352037638425827, 0.1460900902748108, 0.15697643160820007, 0.16786274313926697, 0.17874908447265625, 0.18963541090488434, 0.20052173733711243, 0.21140806376934052, 0.2222943902015686, 0.23318073153495789, 0.24406705796718597, 0.25495338439941406, 0.26583972573280334, 0.27672603726387024, 0.2876123785972595, 0.2984986901283264, 0.3093850314617157, 0.3202713429927826, 0.3311576843261719, 0.34204399585723877, 0.35293033719062805, 0.36381667852401733]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 6.0, 13.0, 15.0, 23.0, 27.0, 35.0, 51.0, 70.0, 93.0, 145.0, 233.0, 375.0, 696.0, 1471.0, 3641.0, 11696.0, 55979.0, 409135.0, 476497.0, 67381.0, 13377.0, 3994.0, 1632.0, 787.0, 383.0, 255.0, 165.0, 101.0, 76.0, 56.0, 53.0, 17.0, 11.0, 16.0, 5.0, 7.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.373046875, -0.3617591857910156, -0.35047149658203125, -0.3391838073730469, -0.3278961181640625, -0.3166084289550781, -0.30532073974609375, -0.2940330505371094, -0.282745361328125, -0.2714576721191406, -0.26016998291015625, -0.24888229370117188, -0.2375946044921875, -0.22630691528320312, -0.21501922607421875, -0.20373153686523438, -0.19244384765625, -0.18115615844726562, -0.16986846923828125, -0.15858078002929688, -0.1472930908203125, -0.13600540161132812, -0.12471771240234375, -0.11343002319335938, -0.102142333984375, -0.09085464477539062, -0.07956695556640625, -0.06827926635742188, -0.0569915771484375, -0.045703887939453125, -0.03441619873046875, -0.023128509521484375, -0.0118408203125, -0.000553131103515625, 0.01073455810546875, 0.022022247314453125, 0.0333099365234375, 0.044597625732421875, 0.05588531494140625, 0.06717300415039062, 0.078460693359375, 0.08974838256835938, 0.10103607177734375, 0.11232376098632812, 0.1236114501953125, 0.13489913940429688, 0.14618682861328125, 0.15747451782226562, 0.16876220703125, 0.18004989624023438, 0.19133758544921875, 0.20262527465820312, 0.2139129638671875, 0.22520065307617188, 0.23648834228515625, 0.24777603149414062, 0.259063720703125, 0.2703514099121094, 0.28163909912109375, 0.2929267883300781, 0.3042144775390625, 0.3155021667480469, 0.32678985595703125, 0.3380775451660156, 0.349365234375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 18.0, 22.0, 22.0, 56.0, 78.0, 122.0, 121.0, 158.0, 134.0, 92.0, 71.0, 39.0, 25.0, 14.0, 5.0, 9.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09075927734375, -0.08629131317138672, -0.08182334899902344, -0.07735538482666016, -0.07288742065429688, -0.0684194564819336, -0.06395149230957031, -0.05948352813720703, -0.05501556396484375, -0.05054759979248047, -0.04607963562011719, -0.041611671447753906, -0.037143707275390625, -0.032675743103027344, -0.028207778930664062, -0.02373981475830078, -0.0192718505859375, -0.014803886413574219, -0.010335922241210938, -0.005867958068847656, -0.001399993896484375, 0.0030679702758789062, 0.0075359344482421875, 0.012003898620605469, 0.01647186279296875, 0.02093982696533203, 0.025407791137695312, 0.029875755310058594, 0.034343719482421875, 0.038811683654785156, 0.04327964782714844, 0.04774761199951172, 0.052215576171875, 0.05668354034423828, 0.06115150451660156, 0.06561946868896484, 0.07008743286132812, 0.0745553970336914, 0.07902336120605469, 0.08349132537841797, 0.08795928955078125, 0.09242725372314453, 0.09689521789550781, 0.1013631820678711, 0.10583114624023438, 0.11029911041259766, 0.11476707458496094, 0.11923503875732422, 0.1237030029296875, 0.12817096710205078, 0.13263893127441406, 0.13710689544677734, 0.14157485961914062, 0.1460428237915039, 0.1505107879638672, 0.15497875213623047, 0.15944671630859375, 0.16391468048095703, 0.1683826446533203, 0.1728506088256836, 0.17731857299804688, 0.18178653717041016, 0.18625450134277344, 0.19072246551513672, 0.1951904296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 10.0, 10.0, 21.0, 22.0, 27.0, 41.0, 52.0, 91.0, 149.0, 271.0, 472.0, 1161.0, 3772.0, 18512.0, 109749.0, 501297.0, 339513.0, 58777.0, 10344.0, 2403.0, 869.0, 381.0, 188.0, 115.0, 106.0, 59.0, 31.0, 21.0, 24.0, 16.0, 14.0, 10.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.37744140625, -0.3666038513183594, -0.35576629638671875, -0.3449287414550781, -0.3340911865234375, -0.3232536315917969, -0.31241607666015625, -0.3015785217285156, -0.290740966796875, -0.2799034118652344, -0.26906585693359375, -0.2582283020019531, -0.2473907470703125, -0.23655319213867188, -0.22571563720703125, -0.21487808227539062, -0.20404052734375, -0.19320297241210938, -0.18236541748046875, -0.17152786254882812, -0.1606903076171875, -0.14985275268554688, -0.13901519775390625, -0.12817764282226562, -0.117340087890625, -0.10650253295898438, -0.09566497802734375, -0.08482742309570312, -0.0739898681640625, -0.06315231323242188, -0.05231475830078125, -0.041477203369140625, -0.0306396484375, -0.019802093505859375, -0.00896453857421875, 0.001873016357421875, 0.0127105712890625, 0.023548126220703125, 0.03438568115234375, 0.045223236083984375, 0.056060791015625, 0.06689834594726562, 0.07773590087890625, 0.08857345581054688, 0.0994110107421875, 0.11024856567382812, 0.12108612060546875, 0.13192367553710938, 0.14276123046875, 0.15359878540039062, 0.16443634033203125, 0.17527389526367188, 0.1861114501953125, 0.19694900512695312, 0.20778656005859375, 0.21862411499023438, 0.229461669921875, 0.24029922485351562, 0.25113677978515625, 0.2619743347167969, 0.2728118896484375, 0.2836494445800781, 0.29448699951171875, 0.3053245544433594, 0.316162109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 5.0, 3.0, 7.0, 9.0, 8.0, 12.0, 23.0, 19.0, 24.0, 39.0, 22.0, 34.0, 36.0, 33.0, 40.0, 43.0, 40.0, 55.0, 47.0, 34.0, 48.0, 42.0, 44.0, 35.0, 44.0, 33.0, 26.0, 32.0, 23.0, 26.0, 20.0, 10.0, 16.0, 17.0, 15.0, 12.0, 5.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.17919921875, -0.1738739013671875, -0.168548583984375, -0.1632232666015625, -0.15789794921875, -0.1525726318359375, -0.147247314453125, -0.1419219970703125, -0.1365966796875, -0.1312713623046875, -0.125946044921875, -0.1206207275390625, -0.11529541015625, -0.1099700927734375, -0.104644775390625, -0.0993194580078125, -0.093994140625, -0.0886688232421875, -0.083343505859375, -0.0780181884765625, -0.07269287109375, -0.0673675537109375, -0.062042236328125, -0.0567169189453125, -0.0513916015625, -0.0460662841796875, -0.040740966796875, -0.0354156494140625, -0.03009033203125, -0.0247650146484375, -0.019439697265625, -0.0141143798828125, -0.0087890625, -0.0034637451171875, 0.001861572265625, 0.0071868896484375, 0.01251220703125, 0.0178375244140625, 0.023162841796875, 0.0284881591796875, 0.0338134765625, 0.0391387939453125, 0.044464111328125, 0.0497894287109375, 0.05511474609375, 0.0604400634765625, 0.065765380859375, 0.0710906982421875, 0.076416015625, 0.0817413330078125, 0.087066650390625, 0.0923919677734375, 0.09771728515625, 0.1030426025390625, 0.108367919921875, 0.1136932373046875, 0.1190185546875, 0.1243438720703125, 0.129669189453125, 0.1349945068359375, 0.14031982421875, 0.1456451416015625, 0.150970458984375, 0.1562957763671875, 0.16162109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 11.0, 5.0, 13.0, 27.0, 35.0, 46.0, 83.0, 136.0, 212.0, 453.0, 794.0, 1534.0, 3304.0, 7192.0, 16570.0, 41067.0, 106411.0, 245007.0, 318242.0, 183463.0, 73492.0, 28252.0, 11893.0, 5127.0, 2466.0, 1243.0, 591.0, 349.0, 193.0, 136.0, 69.0, 50.0, 25.0, 23.0, 15.0, 7.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07794189453125, -0.07560157775878906, -0.07326126098632812, -0.07092094421386719, -0.06858062744140625, -0.06624031066894531, -0.06389999389648438, -0.06155967712402344, -0.0592193603515625, -0.05687904357910156, -0.054538726806640625, -0.05219841003417969, -0.04985809326171875, -0.04751777648925781, -0.045177459716796875, -0.04283714294433594, -0.040496826171875, -0.03815650939941406, -0.035816192626953125, -0.03347587585449219, -0.03113555908203125, -0.028795242309570312, -0.026454925537109375, -0.024114608764648438, -0.0217742919921875, -0.019433975219726562, -0.017093658447265625, -0.014753341674804688, -0.01241302490234375, -0.010072708129882812, -0.007732391357421875, -0.0053920745849609375, -0.0030517578125, -0.0007114410400390625, 0.001628875732421875, 0.0039691925048828125, 0.00630950927734375, 0.008649826049804688, 0.010990142822265625, 0.013330459594726562, 0.0156707763671875, 0.018011093139648438, 0.020351409912109375, 0.022691726684570312, 0.02503204345703125, 0.027372360229492188, 0.029712677001953125, 0.03205299377441406, 0.034393310546875, 0.03673362731933594, 0.039073944091796875, 0.04141426086425781, 0.04375457763671875, 0.04609489440917969, 0.048435211181640625, 0.05077552795410156, 0.0531158447265625, 0.05545616149902344, 0.057796478271484375, 0.06013679504394531, 0.06247711181640625, 0.06481742858886719, 0.06715774536132812, 0.06949806213378906, 0.07183837890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 10.0, 2.0, 12.0, 8.0, 17.0, 21.0, 26.0, 25.0, 33.0, 46.0, 47.0, 72.0, 68.0, 81.0, 72.0, 81.0, 75.0, 52.0, 52.0, 31.0, 27.0, 23.0, 17.0, 17.0, 17.0, 10.0, 9.0, 7.0, 6.0, 2.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1026859283447266e-05, -1.0662712156772614e-05, -1.0298565030097961e-05, -9.93441790342331e-06, -9.570270776748657e-06, -9.206123650074005e-06, -8.841976523399353e-06, -8.477829396724701e-06, -8.113682270050049e-06, -7.749535143375397e-06, -7.385388016700745e-06, -7.0212408900260925e-06, -6.6570937633514404e-06, -6.292946636676788e-06, -5.928799510002136e-06, -5.564652383327484e-06, -5.200505256652832e-06, -4.83635812997818e-06, -4.472211003303528e-06, -4.108063876628876e-06, -3.7439167499542236e-06, -3.3797696232795715e-06, -3.0156224966049194e-06, -2.6514753699302673e-06, -2.2873282432556152e-06, -1.923181116580963e-06, -1.559033989906311e-06, -1.194886863231659e-06, -8.307397365570068e-07, -4.6659260988235474e-07, -1.0244548320770264e-07, 2.6170164346694946e-07, 6.258487701416016e-07, 9.899958968162537e-07, 1.3541430234909058e-06, 1.7182901501655579e-06, 2.08243727684021e-06, 2.446584403514862e-06, 2.810731530189514e-06, 3.1748786568641663e-06, 3.5390257835388184e-06, 3.9031729102134705e-06, 4.2673200368881226e-06, 4.631467163562775e-06, 4.995614290237427e-06, 5.359761416912079e-06, 5.723908543586731e-06, 6.088055670261383e-06, 6.452202796936035e-06, 6.816349923610687e-06, 7.180497050285339e-06, 7.5446441769599915e-06, 7.908791303634644e-06, 8.272938430309296e-06, 8.637085556983948e-06, 9.0012326836586e-06, 9.365379810333252e-06, 9.729526937007904e-06, 1.0093674063682556e-05, 1.0457821190357208e-05, 1.082196831703186e-05, 1.1186115443706512e-05, 1.1550262570381165e-05, 1.1914409697055817e-05, 1.2278556823730469e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 13.0, 9.0, 15.0, 24.0, 38.0, 62.0, 85.0, 131.0, 203.0, 361.0, 646.0, 1145.0, 2124.0, 4651.0, 10447.0, 26266.0, 69712.0, 187128.0, 340697.0, 246031.0, 96999.0, 35499.0, 14101.0, 6135.0, 2764.0, 1383.0, 754.0, 403.0, 236.0, 161.0, 97.0, 64.0, 31.0, 23.0, 27.0, 20.0, 15.0, 6.0, 9.0, 5.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0728759765625, -0.07033348083496094, -0.06779098510742188, -0.06524848937988281, -0.06270599365234375, -0.06016349792480469, -0.057621002197265625, -0.05507850646972656, -0.0525360107421875, -0.04999351501464844, -0.047451019287109375, -0.04490852355957031, -0.04236602783203125, -0.03982353210449219, -0.037281036376953125, -0.03473854064941406, -0.032196044921875, -0.029653549194335938, -0.027111053466796875, -0.024568557739257812, -0.02202606201171875, -0.019483566284179688, -0.016941070556640625, -0.014398574829101562, -0.0118560791015625, -0.009313583374023438, -0.006771087646484375, -0.0042285919189453125, -0.00168609619140625, 0.0008563995361328125, 0.003398895263671875, 0.0059413909912109375, 0.00848388671875, 0.011026382446289062, 0.013568878173828125, 0.016111373901367188, 0.01865386962890625, 0.021196365356445312, 0.023738861083984375, 0.026281356811523438, 0.0288238525390625, 0.03136634826660156, 0.033908843994140625, 0.03645133972167969, 0.03899383544921875, 0.04153633117675781, 0.044078826904296875, 0.04662132263183594, 0.049163818359375, 0.05170631408691406, 0.054248809814453125, 0.05679130554199219, 0.05933380126953125, 0.06187629699707031, 0.06441879272460938, 0.06696128845214844, 0.0695037841796875, 0.07204627990722656, 0.07458877563476562, 0.07713127136230469, 0.07967376708984375, 0.08221626281738281, 0.08475875854492188, 0.08730125427246094, 0.08984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 13.0, 8.0, 9.0, 12.0, 12.0, 14.0, 19.0, 28.0, 21.0, 31.0, 56.0, 45.0, 64.0, 62.0, 51.0, 56.0, 59.0, 62.0, 49.0, 54.0, 40.0, 40.0, 40.0, 31.0, 25.0, 15.0, 9.0, 17.0, 18.0, 7.0, 8.0, 5.0, 8.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.0625448226928711, -0.06075859069824219, -0.05897235870361328, -0.057186126708984375, -0.05539989471435547, -0.05361366271972656, -0.051827430725097656, -0.05004119873046875, -0.048254966735839844, -0.04646873474121094, -0.04468250274658203, -0.042896270751953125, -0.04111003875732422, -0.03932380676269531, -0.037537574768066406, -0.0357513427734375, -0.033965110778808594, -0.03217887878417969, -0.03039264678955078, -0.028606414794921875, -0.02682018280029297, -0.025033950805664062, -0.023247718811035156, -0.02146148681640625, -0.019675254821777344, -0.017889022827148438, -0.01610279083251953, -0.014316558837890625, -0.012530326843261719, -0.010744094848632812, -0.008957862854003906, -0.007171630859375, -0.005385398864746094, -0.0035991668701171875, -0.0018129348754882812, -2.6702880859375e-05, 0.0017595291137695312, 0.0035457611083984375, 0.005331993103027344, 0.00711822509765625, 0.008904457092285156, 0.010690689086914062, 0.012476921081542969, 0.014263153076171875, 0.01604938507080078, 0.017835617065429688, 0.019621849060058594, 0.0214080810546875, 0.023194313049316406, 0.024980545043945312, 0.02676677703857422, 0.028553009033203125, 0.03033924102783203, 0.03212547302246094, 0.033911705017089844, 0.03569793701171875, 0.037484169006347656, 0.03927040100097656, 0.04105663299560547, 0.042842864990234375, 0.04462909698486328, 0.04641532897949219, 0.048201560974121094, 0.04998779296875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 43.0, 357.0, 504.0, 93.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.004016399383545, -3.883042097091675, -3.762068033218384, -3.6410937309265137, -3.5201194286346436, -3.3991451263427734, -3.2781710624694824, -3.1571967601776123, -3.036222457885742, -2.915248155593872, -2.794274091720581, -2.673299789428711, -2.552325487136841, -2.4313511848449707, -2.3103771209716797, -2.1894028186798096, -2.0684285163879395, -1.9474543333053589, -1.8264800310134888, -1.7055058479309082, -1.584531545639038, -1.4635573625564575, -1.342583179473877, -1.2216088771820068, -1.1006348133087158, -0.9796605706214905, -0.8586863279342651, -0.7377121448516846, -0.6167378425598145, -0.4957636594772339, -0.37478941679000854, -0.2538151741027832, -0.13284087181091309, -0.011866636574268341, 0.1091075986623764, 0.23008182644844055, 0.3510560691356659, 0.47203028202056885, 0.5930045247077942, 0.7139787673950195, 0.8349530100822449, 0.9559272527694702, 1.0769014358520508, 1.197875738143921, 1.3188499212265015, 1.439824104309082, 1.5607984066009521, 1.6817727088928223, 1.8027468919754028, 1.9237210750579834, 2.0446953773498535, 2.1656696796417236, 2.2866437435150146, 2.4076180458068848, 2.528592348098755, 2.649566650390625, 2.770540714263916, 2.891515016555786, 3.012489080429077, 3.1334633827209473, 3.2544376850128174, 3.3754119873046875, 3.4963860511779785, 3.6173603534698486, 3.7383346557617188]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 13.0, 12.0, 16.0, 15.0, 30.0, 18.0, 35.0, 39.0, 41.0, 44.0, 45.0, 55.0, 56.0, 52.0, 64.0, 51.0, 51.0, 53.0, 56.0, 41.0, 36.0, 38.0, 27.0, 23.0, 15.0, 16.0, 11.0, 9.0, 8.0, 2.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.7837508320808411, -0.7629237771034241, -0.7420967221260071, -0.7212697267532349, -0.7004426717758179, -0.6796156167984009, -0.6587885618209839, -0.6379615068435669, -0.6171344518661499, -0.5963073968887329, -0.5754803419113159, -0.5546533465385437, -0.5338262915611267, -0.5129992365837097, -0.4921721816062927, -0.47134512662887573, -0.4505181312561035, -0.4296910762786865, -0.4088640511035919, -0.3880369961261749, -0.3672099709510803, -0.34638291597366333, -0.32555586099624634, -0.30472880601882935, -0.28390178084373474, -0.26307472586631775, -0.24224770069122314, -0.22142064571380615, -0.20059360563755035, -0.17976656556129456, -0.15893951058387756, -0.13811247050762177, -0.11728537082672119, -0.0964583307504654, -0.075631283223629, -0.0548042394220829, -0.033977195620536804, -0.013150155544281006, 0.007676891982555389, 0.028503939509391785, 0.04933097958564758, 0.07015801966190338, 0.09098506718873978, 0.11181211471557617, 0.13263915479183197, 0.15346619486808777, 0.17429324984550476, 0.19512028992176056, 0.21594732999801636, 0.23677437007427216, 0.25760141015052795, 0.27842846512794495, 0.29925549030303955, 0.32008254528045654, 0.34090960025787354, 0.3617366552352905, 0.38256368041038513, 0.4033907353878021, 0.42421776056289673, 0.4450448155403137, 0.4658718705177307, 0.4866988956928253, 0.5075259208679199, 0.5283529758453369, 0.5491800308227539]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 14.0, 33.0, 54.0, 99.0, 192.0, 416.0, 1143.0, 3229.0, 9828.0, 46373.0, 1173593.0, 2859380.0, 83436.0, 10671.0, 3096.0, 1195.0, 578.0, 305.0, 179.0, 144.0, 90.0, 74.0, 48.0, 25.0, 17.0, 18.0, 12.0, 5.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15703201293945312, -0.15024566650390625, -0.14345932006835938, -0.1366729736328125, -0.12988662719726562, -0.12310028076171875, -0.11631393432617188, -0.109527587890625, -0.10274124145507812, -0.09595489501953125, -0.08916854858398438, -0.0823822021484375, -0.07559585571289062, -0.06880950927734375, -0.062023162841796875, -0.05523681640625, -0.048450469970703125, -0.04166412353515625, -0.034877777099609375, -0.0280914306640625, -0.021305084228515625, -0.01451873779296875, -0.007732391357421875, -0.000946044921875, 0.005840301513671875, 0.01262664794921875, 0.019412994384765625, 0.0261993408203125, 0.032985687255859375, 0.03977203369140625, 0.046558380126953125, 0.0533447265625, 0.060131072998046875, 0.06691741943359375, 0.07370376586914062, 0.0804901123046875, 0.08727645874023438, 0.09406280517578125, 0.10084915161132812, 0.107635498046875, 0.11442184448242188, 0.12120819091796875, 0.12799453735351562, 0.1347808837890625, 0.14156723022460938, 0.14835357666015625, 0.15513992309570312, 0.16192626953125, 0.16871261596679688, 0.17549896240234375, 0.18228530883789062, 0.1890716552734375, 0.19585800170898438, 0.20264434814453125, 0.20943069458007812, 0.216217041015625, 0.22300338745117188, 0.22978973388671875, 0.23657608032226562, 0.2433624267578125, 0.2501487731933594, 0.25693511962890625, 0.2637214660644531, 0.2705078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 6.0, 9.0, 28.0, 26.0, 42.0, 80.0, 113.0, 109.0, 130.0, 134.0, 112.0, 84.0, 52.0, 31.0, 20.0, 12.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0772705078125, -0.07289886474609375, -0.0685272216796875, -0.06415557861328125, -0.059783935546875, -0.05541229248046875, -0.0510406494140625, -0.04666900634765625, -0.04229736328125, -0.03792572021484375, -0.0335540771484375, -0.02918243408203125, -0.024810791015625, -0.02043914794921875, -0.0160675048828125, -0.01169586181640625, -0.00732421875, -0.00295257568359375, 0.0014190673828125, 0.00579071044921875, 0.010162353515625, 0.01453399658203125, 0.0189056396484375, 0.02327728271484375, 0.02764892578125, 0.03202056884765625, 0.0363922119140625, 0.04076385498046875, 0.045135498046875, 0.04950714111328125, 0.0538787841796875, 0.05825042724609375, 0.0626220703125, 0.06699371337890625, 0.0713653564453125, 0.07573699951171875, 0.080108642578125, 0.08448028564453125, 0.0888519287109375, 0.09322357177734375, 0.09759521484375, 0.10196685791015625, 0.1063385009765625, 0.11071014404296875, 0.115081787109375, 0.11945343017578125, 0.1238250732421875, 0.12819671630859375, 0.132568359375, 0.13694000244140625, 0.1413116455078125, 0.14568328857421875, 0.150054931640625, 0.15442657470703125, 0.1587982177734375, 0.16316986083984375, 0.16754150390625, 0.17191314697265625, 0.1762847900390625, 0.18065643310546875, 0.185028076171875, 0.18939971923828125, 0.1937713623046875, 0.19814300537109375, 0.2025146484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 12.0, 10.0, 11.0, 28.0, 21.0, 29.0, 52.0, 73.0, 102.0, 241.0, 472.0, 1287.0, 5757.0, 41387.0, 566595.0, 3230046.0, 314735.0, 27281.0, 4104.0, 1038.0, 388.0, 223.0, 121.0, 81.0, 50.0, 42.0, 29.0, 14.0, 11.0, 11.0, 5.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.22705078125, -0.22004318237304688, -0.21303558349609375, -0.20602798461914062, -0.1990203857421875, -0.19201278686523438, -0.18500518798828125, -0.17799758911132812, -0.170989990234375, -0.16398239135742188, -0.15697479248046875, -0.14996719360351562, -0.1429595947265625, -0.13595199584960938, -0.12894439697265625, -0.12193679809570312, -0.11492919921875, -0.10792160034179688, -0.10091400146484375, -0.09390640258789062, -0.0868988037109375, -0.07989120483398438, -0.07288360595703125, -0.06587600708007812, -0.058868408203125, -0.051860809326171875, -0.04485321044921875, -0.037845611572265625, -0.0308380126953125, -0.023830413818359375, -0.01682281494140625, -0.009815216064453125, -0.0028076171875, 0.004199981689453125, 0.01120758056640625, 0.018215179443359375, 0.0252227783203125, 0.032230377197265625, 0.03923797607421875, 0.046245574951171875, 0.053253173828125, 0.060260772705078125, 0.06726837158203125, 0.07427597045898438, 0.0812835693359375, 0.08829116821289062, 0.09529876708984375, 0.10230636596679688, 0.10931396484375, 0.11632156372070312, 0.12332916259765625, 0.13033676147460938, 0.1373443603515625, 0.14435195922851562, 0.15135955810546875, 0.15836715698242188, 0.165374755859375, 0.17238235473632812, 0.17938995361328125, 0.18639755249023438, 0.1934051513671875, 0.20041275024414062, 0.20742034912109375, 0.21442794799804688, 0.221435546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 14.0, 10.0, 22.0, 17.0, 32.0, 46.0, 55.0, 76.0, 115.0, 167.0, 205.0, 280.0, 389.0, 540.0, 496.0, 449.0, 340.0, 244.0, 172.0, 117.0, 88.0, 58.0, 43.0, 30.0, 22.0, 11.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11712646484375, -0.11379051208496094, -0.11045455932617188, -0.10711860656738281, -0.10378265380859375, -0.10044670104980469, -0.09711074829101562, -0.09377479553222656, -0.0904388427734375, -0.08710289001464844, -0.08376693725585938, -0.08043098449707031, -0.07709503173828125, -0.07375907897949219, -0.07042312622070312, -0.06708717346191406, -0.063751220703125, -0.06041526794433594, -0.057079315185546875, -0.05374336242675781, -0.05040740966796875, -0.04707145690917969, -0.043735504150390625, -0.04039955139160156, -0.0370635986328125, -0.03372764587402344, -0.030391693115234375, -0.027055740356445312, -0.02371978759765625, -0.020383834838867188, -0.017047882080078125, -0.013711929321289062, -0.0103759765625, -0.0070400238037109375, -0.003704071044921875, -0.0003681182861328125, 0.00296783447265625, 0.0063037872314453125, 0.009639739990234375, 0.012975692749023438, 0.0163116455078125, 0.019647598266601562, 0.022983551025390625, 0.026319503784179688, 0.02965545654296875, 0.03299140930175781, 0.036327362060546875, 0.03966331481933594, 0.042999267578125, 0.04633522033691406, 0.049671173095703125, 0.05300712585449219, 0.05634307861328125, 0.05967903137207031, 0.06301498413085938, 0.06635093688964844, 0.0696868896484375, 0.07302284240722656, 0.07635879516601562, 0.07969474792480469, 0.08303070068359375, 0.08636665344238281, 0.08970260620117188, 0.09303855895996094, 0.09637451171875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 9.0, 33.0, 93.0, 195.0, 256.0, 219.0, 122.0, 57.0, 16.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2261666059494019, -1.187685251235962, -1.1492037773132324, -1.1107224225997925, -1.0722410678863525, -1.033759593963623, -0.9952782392501831, -0.9567968249320984, -0.9183154106140137, -0.879833996295929, -0.8413525819778442, -0.8028712272644043, -0.7643898129463196, -0.7259083986282349, -0.6874270439147949, -0.6489456295967102, -0.6104642152786255, -0.5719828009605408, -0.533501386642456, -0.4950200319290161, -0.4565386176109314, -0.4180572032928467, -0.37957581877708435, -0.341094434261322, -0.3026130199432373, -0.2641316056251526, -0.22565022110939026, -0.18716882169246674, -0.1486874222755432, -0.11020602285861969, -0.07172462344169617, -0.03324323892593384, 0.00523829460144043, 0.04371969401836395, 0.08220109343528748, 0.120682492852211, 0.15916389226913452, 0.19764529168605804, 0.23612669110298157, 0.2746080756187439, 0.3130894899368286, 0.35157090425491333, 0.39005228877067566, 0.428533673286438, 0.4670150876045227, 0.5054965019226074, 0.5439778566360474, 0.5824592709541321, 0.6209406852722168, 0.6594220995903015, 0.6979035139083862, 0.7363848686218262, 0.7748662829399109, 0.8133476972579956, 0.8518290519714355, 0.8903104662895203, 0.928791880607605, 0.9672732949256897, 1.0057547092437744, 1.0442360639572144, 1.0827174186706543, 1.1211988925933838, 1.1596802473068237, 1.1981616020202637, 1.2366430759429932]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 9.0, 15.0, 8.0, 16.0, 20.0, 18.0, 32.0, 29.0, 30.0, 42.0, 42.0, 35.0, 52.0, 49.0, 42.0, 41.0, 48.0, 44.0, 40.0, 42.0, 37.0, 47.0, 35.0, 30.0, 19.0, 19.0, 19.0, 18.0, 15.0, 14.0, 12.0, 12.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3093070983886719, -0.2985919117927551, -0.287876695394516, -0.27716150879859924, -0.2664463222026825, -0.25573110580444336, -0.2450159192085266, -0.23430071771144867, -0.22358551621437073, -0.21287031471729279, -0.20215512812137604, -0.1914399266242981, -0.18072472512722015, -0.1700095236301422, -0.15929433703422546, -0.14857913553714752, -0.13786394894123077, -0.12714874744415283, -0.11643355339765549, -0.10571835935115814, -0.0950031578540802, -0.08428796380758286, -0.07357276976108551, -0.06285756826400757, -0.05214237421751022, -0.04142717644572258, -0.030711980536580086, -0.01999678462743759, -0.009281586855649948, 0.0014336109161376953, 0.01214880496263504, 0.022864006459712982, 0.03357920050621033, 0.04429439827799797, 0.055009596049785614, 0.06572479009628296, 0.0764399915933609, 0.08715518563985825, 0.09787037968635559, 0.10858558118343353, 0.11930077522993088, 0.13001596927642822, 0.14073117077350616, 0.1514463722705841, 0.16216155886650085, 0.1728767603635788, 0.18359196186065674, 0.1943071484565735, 0.20502234995365143, 0.21573755145072937, 0.22645273804664612, 0.23716793954372406, 0.247883141040802, 0.25859832763671875, 0.2693135142326355, 0.28002873063087463, 0.2907439172267914, 0.30145910382270813, 0.31217432022094727, 0.322889506816864, 0.33360469341278076, 0.3443199098110199, 0.35503509640693665, 0.3657503128051758, 0.37646549940109253]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 11.0, 9.0, 17.0, 13.0, 25.0, 22.0, 37.0, 36.0, 66.0, 69.0, 120.0, 169.0, 238.0, 301.0, 555.0, 1005.0, 2229.0, 6175.0, 21780.0, 99264.0, 474266.0, 350124.0, 67401.0, 15609.0, 4646.0, 1879.0, 893.0, 491.0, 288.0, 218.0, 154.0, 94.0, 91.0, 61.0, 41.0, 42.0, 25.0, 19.0, 14.0, 14.0, 11.0, 8.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28271484375, -0.2735595703125, -0.264404296875, -0.2552490234375, -0.24609375, -0.2369384765625, -0.227783203125, -0.2186279296875, -0.20947265625, -0.2003173828125, -0.191162109375, -0.1820068359375, -0.1728515625, -0.1636962890625, -0.154541015625, -0.1453857421875, -0.13623046875, -0.1270751953125, -0.117919921875, -0.1087646484375, -0.099609375, -0.0904541015625, -0.081298828125, -0.0721435546875, -0.06298828125, -0.0538330078125, -0.044677734375, -0.0355224609375, -0.0263671875, -0.0172119140625, -0.008056640625, 0.0010986328125, 0.01025390625, 0.0194091796875, 0.028564453125, 0.0377197265625, 0.046875, 0.0560302734375, 0.065185546875, 0.0743408203125, 0.08349609375, 0.0926513671875, 0.101806640625, 0.1109619140625, 0.1201171875, 0.1292724609375, 0.138427734375, 0.1475830078125, 0.15673828125, 0.1658935546875, 0.175048828125, 0.1842041015625, 0.193359375, 0.2025146484375, 0.211669921875, 0.2208251953125, 0.22998046875, 0.2391357421875, 0.248291015625, 0.2574462890625, 0.2666015625, 0.2757568359375, 0.284912109375, 0.2940673828125, 0.30322265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 8.0, 16.0, 19.0, 39.0, 58.0, 92.0, 104.0, 124.0, 115.0, 134.0, 100.0, 80.0, 38.0, 32.0, 20.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06597900390625, -0.06169414520263672, -0.05740928649902344, -0.053124427795410156, -0.048839569091796875, -0.044554710388183594, -0.04026985168457031, -0.03598499298095703, -0.03170013427734375, -0.02741527557373047, -0.023130416870117188, -0.018845558166503906, -0.014560699462890625, -0.010275840759277344, -0.0059909820556640625, -0.0017061233520507812, 0.0025787353515625, 0.006863594055175781, 0.011148452758789062, 0.015433311462402344, 0.019718170166015625, 0.024003028869628906, 0.028287887573242188, 0.03257274627685547, 0.03685760498046875, 0.04114246368408203, 0.04542732238769531, 0.049712181091308594, 0.053997039794921875, 0.058281898498535156, 0.06256675720214844, 0.06685161590576172, 0.071136474609375, 0.07542133331298828, 0.07970619201660156, 0.08399105072021484, 0.08827590942382812, 0.0925607681274414, 0.09684562683105469, 0.10113048553466797, 0.10541534423828125, 0.10970020294189453, 0.11398506164550781, 0.1182699203491211, 0.12255477905273438, 0.12683963775634766, 0.13112449645996094, 0.13540935516357422, 0.1396942138671875, 0.14397907257080078, 0.14826393127441406, 0.15254878997802734, 0.15683364868164062, 0.1611185073852539, 0.1654033660888672, 0.16968822479248047, 0.17397308349609375, 0.17825794219970703, 0.1825428009033203, 0.1868276596069336, 0.19111251831054688, 0.19539737701416016, 0.19968223571777344, 0.20396709442138672, 0.208251953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 14.0, 13.0, 10.0, 20.0, 28.0, 45.0, 54.0, 85.0, 163.0, 318.0, 614.0, 1283.0, 2821.0, 6644.0, 14733.0, 33626.0, 77522.0, 175133.0, 301757.0, 236427.0, 110328.0, 48714.0, 21112.0, 9239.0, 4200.0, 1867.0, 827.0, 394.0, 204.0, 110.0, 73.0, 50.0, 29.0, 21.0, 18.0, 12.0, 13.0, 11.0, 5.0, 9.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.156005859375, -0.15108680725097656, -0.14616775512695312, -0.1412487030029297, -0.13632965087890625, -0.1314105987548828, -0.12649154663085938, -0.12157249450683594, -0.1166534423828125, -0.11173439025878906, -0.10681533813476562, -0.10189628601074219, -0.09697723388671875, -0.09205818176269531, -0.08713912963867188, -0.08222007751464844, -0.077301025390625, -0.07238197326660156, -0.06746292114257812, -0.06254386901855469, -0.05762481689453125, -0.05270576477050781, -0.047786712646484375, -0.04286766052246094, -0.0379486083984375, -0.03302955627441406, -0.028110504150390625, -0.023191452026367188, -0.01827239990234375, -0.013353347778320312, -0.008434295654296875, -0.0035152435302734375, 0.00140380859375, 0.0063228607177734375, 0.011241912841796875, 0.016160964965820312, 0.02108001708984375, 0.025999069213867188, 0.030918121337890625, 0.03583717346191406, 0.0407562255859375, 0.04567527770996094, 0.050594329833984375, 0.05551338195800781, 0.06043243408203125, 0.06535148620605469, 0.07027053833007812, 0.07518959045410156, 0.080108642578125, 0.08502769470214844, 0.08994674682617188, 0.09486579895019531, 0.09978485107421875, 0.10470390319824219, 0.10962295532226562, 0.11454200744628906, 0.1194610595703125, 0.12438011169433594, 0.12929916381835938, 0.1342182159423828, 0.13913726806640625, 0.1440563201904297, 0.14897537231445312, 0.15389442443847656, 0.1588134765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 7.0, 8.0, 14.0, 8.0, 10.0, 15.0, 17.0, 21.0, 18.0, 22.0, 20.0, 28.0, 30.0, 30.0, 31.0, 36.0, 35.0, 35.0, 34.0, 37.0, 53.0, 52.0, 38.0, 46.0, 35.0, 27.0, 36.0, 27.0, 30.0, 28.0, 24.0, 18.0, 24.0, 25.0, 14.0, 14.0, 11.0, 10.0, 8.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1485595703125, -0.14398574829101562, -0.13941192626953125, -0.13483810424804688, -0.1302642822265625, -0.12569046020507812, -0.12111663818359375, -0.11654281616210938, -0.111968994140625, -0.10739517211914062, -0.10282135009765625, -0.09824752807617188, -0.0936737060546875, -0.08909988403320312, -0.08452606201171875, -0.07995223999023438, -0.07537841796875, -0.07080459594726562, -0.06623077392578125, -0.061656951904296875, -0.0570831298828125, -0.052509307861328125, -0.04793548583984375, -0.043361663818359375, -0.038787841796875, -0.034214019775390625, -0.02964019775390625, -0.025066375732421875, -0.0204925537109375, -0.015918731689453125, -0.01134490966796875, -0.006771087646484375, -0.002197265625, 0.002376556396484375, 0.00695037841796875, 0.011524200439453125, 0.0160980224609375, 0.020671844482421875, 0.02524566650390625, 0.029819488525390625, 0.034393310546875, 0.038967132568359375, 0.04354095458984375, 0.048114776611328125, 0.0526885986328125, 0.057262420654296875, 0.06183624267578125, 0.06641006469726562, 0.07098388671875, 0.07555770874023438, 0.08013153076171875, 0.08470535278320312, 0.0892791748046875, 0.09385299682617188, 0.09842681884765625, 0.10300064086914062, 0.107574462890625, 0.11214828491210938, 0.11672210693359375, 0.12129592895507812, 0.1258697509765625, 0.13044357299804688, 0.13501739501953125, 0.13959121704101562, 0.1441650390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 9.0, 5.0, 14.0, 15.0, 26.0, 45.0, 52.0, 90.0, 124.0, 193.0, 298.0, 477.0, 797.0, 1338.0, 2209.0, 3813.0, 6872.0, 12364.0, 22535.0, 42138.0, 75914.0, 130672.0, 189900.0, 202611.0, 151155.0, 91252.0, 50881.0, 27751.0, 15182.0, 8377.0, 4614.0, 2644.0, 1586.0, 1010.0, 609.0, 380.0, 197.0, 145.0, 83.0, 59.0, 41.0, 27.0, 18.0, 13.0, 14.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.03803300857543945, -0.036728858947753906, -0.03542470932006836, -0.03412055969238281, -0.032816410064697266, -0.03151226043701172, -0.030208110809326172, -0.028903961181640625, -0.027599811553955078, -0.02629566192626953, -0.024991512298583984, -0.023687362670898438, -0.02238321304321289, -0.021079063415527344, -0.019774913787841797, -0.01847076416015625, -0.017166614532470703, -0.015862464904785156, -0.01455831527709961, -0.013254165649414062, -0.011950016021728516, -0.010645866394042969, -0.009341716766357422, -0.008037567138671875, -0.006733417510986328, -0.005429267883300781, -0.004125118255615234, -0.0028209686279296875, -0.0015168190002441406, -0.00021266937255859375, 0.0010914802551269531, 0.0023956298828125, 0.003699779510498047, 0.005003929138183594, 0.006308078765869141, 0.0076122283935546875, 0.008916378021240234, 0.010220527648925781, 0.011524677276611328, 0.012828826904296875, 0.014132976531982422, 0.015437126159667969, 0.016741275787353516, 0.018045425415039062, 0.01934957504272461, 0.020653724670410156, 0.021957874298095703, 0.02326202392578125, 0.024566173553466797, 0.025870323181152344, 0.02717447280883789, 0.028478622436523438, 0.029782772064208984, 0.03108692169189453, 0.03239107131958008, 0.033695220947265625, 0.03499937057495117, 0.03630352020263672, 0.037607669830322266, 0.03891181945800781, 0.04021596908569336, 0.041520118713378906, 0.04282426834106445, 0.04412841796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 4.0, 2.0, 7.0, 11.0, 13.0, 13.0, 14.0, 16.0, 30.0, 42.0, 30.0, 37.0, 48.0, 71.0, 94.0, 106.0, 88.0, 82.0, 55.0, 51.0, 32.0, 34.0, 21.0, 12.0, 20.0, 12.0, 17.0, 5.0, 6.0, 6.0, 4.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0311603546142578e-05, -9.922310709953308e-06, -9.533017873764038e-06, -9.143725037574768e-06, -8.754432201385498e-06, -8.365139365196228e-06, -7.975846529006958e-06, -7.586553692817688e-06, -7.197260856628418e-06, -6.807968020439148e-06, -6.418675184249878e-06, -6.029382348060608e-06, -5.640089511871338e-06, -5.250796675682068e-06, -4.861503839492798e-06, -4.472211003303528e-06, -4.082918167114258e-06, -3.693625330924988e-06, -3.3043324947357178e-06, -2.9150396585464478e-06, -2.5257468223571777e-06, -2.1364539861679077e-06, -1.7471611499786377e-06, -1.3578683137893677e-06, -9.685754776000977e-07, -5.792826414108276e-07, -1.8998980522155762e-07, 1.993030309677124e-07, 5.885958671569824e-07, 9.778887033462524e-07, 1.3671815395355225e-06, 1.7564743757247925e-06, 2.1457672119140625e-06, 2.5350600481033325e-06, 2.9243528842926025e-06, 3.3136457204818726e-06, 3.7029385566711426e-06, 4.092231392860413e-06, 4.481524229049683e-06, 4.870817065238953e-06, 5.260109901428223e-06, 5.649402737617493e-06, 6.038695573806763e-06, 6.427988409996033e-06, 6.817281246185303e-06, 7.206574082374573e-06, 7.595866918563843e-06, 7.985159754753113e-06, 8.374452590942383e-06, 8.763745427131653e-06, 9.153038263320923e-06, 9.542331099510193e-06, 9.931623935699463e-06, 1.0320916771888733e-05, 1.0710209608078003e-05, 1.1099502444267273e-05, 1.1488795280456543e-05, 1.1878088116645813e-05, 1.2267380952835083e-05, 1.2656673789024353e-05, 1.3045966625213623e-05, 1.3435259461402893e-05, 1.3824552297592163e-05, 1.4213845133781433e-05, 1.4603137969970703e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 6.0, 10.0, 8.0, 11.0, 22.0, 40.0, 57.0, 93.0, 164.0, 275.0, 458.0, 737.0, 1391.0, 2565.0, 4519.0, 8424.0, 16059.0, 29954.0, 56291.0, 101819.0, 168137.0, 215763.0, 184466.0, 116313.0, 65387.0, 35174.0, 18725.0, 9743.0, 5262.0, 2886.0, 1667.0, 945.0, 445.0, 294.0, 186.0, 100.0, 59.0, 29.0, 25.0, 10.0, 8.0, 10.0, 7.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03961181640625, -0.03835916519165039, -0.03710651397705078, -0.03585386276245117, -0.03460121154785156, -0.03334856033325195, -0.032095909118652344, -0.030843257904052734, -0.029590606689453125, -0.028337955474853516, -0.027085304260253906, -0.025832653045654297, -0.024580001831054688, -0.023327350616455078, -0.02207469940185547, -0.02082204818725586, -0.01956939697265625, -0.01831674575805664, -0.01706409454345703, -0.015811443328857422, -0.014558792114257812, -0.013306140899658203, -0.012053489685058594, -0.010800838470458984, -0.009548187255859375, -0.008295536041259766, -0.007042884826660156, -0.005790233612060547, -0.0045375823974609375, -0.003284931182861328, -0.0020322799682617188, -0.0007796287536621094, 0.0004730224609375, 0.0017256736755371094, 0.0029783248901367188, 0.004230976104736328, 0.0054836273193359375, 0.006736278533935547, 0.007988929748535156, 0.009241580963134766, 0.010494232177734375, 0.011746883392333984, 0.012999534606933594, 0.014252185821533203, 0.015504837036132812, 0.016757488250732422, 0.01801013946533203, 0.01926279067993164, 0.02051544189453125, 0.02176809310913086, 0.02302074432373047, 0.024273395538330078, 0.025526046752929688, 0.026778697967529297, 0.028031349182128906, 0.029284000396728516, 0.030536651611328125, 0.031789302825927734, 0.033041954040527344, 0.03429460525512695, 0.03554725646972656, 0.03679990768432617, 0.03805255889892578, 0.03930521011352539, 0.040557861328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 13.0, 16.0, 18.0, 18.0, 23.0, 20.0, 35.0, 35.0, 49.0, 36.0, 48.0, 44.0, 70.0, 64.0, 61.0, 56.0, 49.0, 39.0, 44.0, 42.0, 38.0, 18.0, 20.0, 27.0, 17.0, 16.0, 11.0, 13.0, 10.0, 3.0, 3.0, 2.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.040924072265625, -0.03970623016357422, -0.03848838806152344, -0.037270545959472656, -0.036052703857421875, -0.034834861755371094, -0.03361701965332031, -0.03239917755126953, -0.03118133544921875, -0.02996349334716797, -0.028745651245117188, -0.027527809143066406, -0.026309967041015625, -0.025092124938964844, -0.023874282836914062, -0.02265644073486328, -0.0214385986328125, -0.02022075653076172, -0.019002914428710938, -0.017785072326660156, -0.016567230224609375, -0.015349388122558594, -0.014131546020507812, -0.012913703918457031, -0.01169586181640625, -0.010478019714355469, -0.009260177612304688, -0.008042335510253906, -0.006824493408203125, -0.005606651306152344, -0.0043888092041015625, -0.0031709671020507812, -0.001953125, -0.0007352828979492188, 0.0004825592041015625, 0.0017004013061523438, 0.002918243408203125, 0.004136085510253906, 0.0053539276123046875, 0.006571769714355469, 0.00778961181640625, 0.009007453918457031, 0.010225296020507812, 0.011443138122558594, 0.012660980224609375, 0.013878822326660156, 0.015096664428710938, 0.01631450653076172, 0.0175323486328125, 0.01875019073486328, 0.019968032836914062, 0.021185874938964844, 0.022403717041015625, 0.023621559143066406, 0.024839401245117188, 0.02605724334716797, 0.02727508544921875, 0.02849292755126953, 0.029710769653320312, 0.030928611755371094, 0.032146453857421875, 0.033364295959472656, 0.03458213806152344, 0.03579998016357422, 0.037017822265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 53.0, 159.0, 280.0, 319.0, 130.0, 43.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.192502021789551, -2.1280267238616943, -2.063551187515259, -1.9990758895874023, -1.934600591659546, -1.8701251745224, -1.805649757385254, -1.7411744594573975, -1.6766990423202515, -1.6122236251831055, -1.547748327255249, -1.483272910118103, -1.418797492980957, -1.3543221950531006, -1.2898467779159546, -1.2253713607788086, -1.1608960628509521, -1.0964206457138062, -1.0319453477859497, -0.9674699306488037, -0.9029945731163025, -0.8385192155838013, -0.7740437984466553, -0.709568440914154, -0.6450930833816528, -0.5806177258491516, -0.5161423683166504, -0.4516669511795044, -0.3871915936470032, -0.32271623611450195, -0.25824084877967834, -0.19376546144485474, -0.12928986549377441, -0.064814493060112, -0.00033912062644958496, 0.06413625180721283, 0.12861162424087524, 0.19308698177337646, 0.2575623691082001, 0.3220377564430237, 0.3865131139755249, 0.4509884715080261, 0.5154638290405273, 0.5799392461776733, 0.6444146037101746, 0.7088899612426758, 0.7733653783798218, 0.837840735912323, 0.9023160934448242, 0.9667914509773254, 1.0312668085098267, 1.0957422256469727, 1.160217523574829, 1.224692940711975, 1.289168357849121, 1.3536436557769775, 1.4181190729141235, 1.4825944900512695, 1.547069787979126, 1.611545205116272, 1.676020622253418, 1.7404959201812744, 1.8049713373184204, 1.8694467544555664, 1.9339220523834229]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 3.0, 10.0, 10.0, 7.0, 11.0, 12.0, 18.0, 20.0, 28.0, 29.0, 26.0, 35.0, 44.0, 36.0, 30.0, 49.0, 51.0, 54.0, 43.0, 46.0, 39.0, 65.0, 43.0, 35.0, 35.0, 44.0, 18.0, 28.0, 24.0, 24.0, 24.0, 14.0, 13.0, 6.0, 9.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6124780774116516, -0.5935313701629639, -0.5745847225189209, -0.5556380152702332, -0.5366913080215454, -0.5177446007728577, -0.4987979233264923, -0.47985124588012695, -0.4609045386314392, -0.44195783138275146, -0.4230111539363861, -0.40406447649002075, -0.385117769241333, -0.36617106199264526, -0.3472243845462799, -0.32827770709991455, -0.3093309998512268, -0.29038429260253906, -0.2714376151561737, -0.25249093770980835, -0.2335442304611206, -0.21459753811359406, -0.1956508457660675, -0.17670415341854095, -0.1577574610710144, -0.13881076872348785, -0.1198640763759613, -0.10091738402843475, -0.0819706916809082, -0.06302399933338165, -0.0440773069858551, -0.025130614638328552, -0.006183981895446777, 0.012762710452079773, 0.03170940279960632, 0.050656095147132874, 0.06960278749465942, 0.08854947984218597, 0.10749617218971252, 0.12644286453723907, 0.14538955688476562, 0.16433624923229218, 0.18328294157981873, 0.20222963392734528, 0.22117632627487183, 0.24012301862239838, 0.2590697109699249, 0.2780163884162903, 0.296963095664978, 0.31590980291366577, 0.33485648036003113, 0.3538031578063965, 0.37274986505508423, 0.391696572303772, 0.41064324975013733, 0.4295899271965027, 0.44853663444519043, 0.4674833416938782, 0.48643001914024353, 0.5053766965866089, 0.5243234038352966, 0.5432701110839844, 0.5622167587280273, 0.5811634659767151, 0.6001101732254028]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 14.0, 10.0, 24.0, 35.0, 53.0, 111.0, 183.0, 428.0, 1108.0, 3002.0, 10149.0, 47117.0, 785882.0, 3193055.0, 128576.0, 16213.0, 4401.0, 1731.0, 836.0, 482.0, 299.0, 171.0, 125.0, 88.0, 51.0, 30.0, 29.0, 21.0, 21.0, 14.0, 8.0, 7.0, 0.0, 1.0, 4.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166015625, -0.15855026245117188, -0.15108489990234375, -0.14361953735351562, -0.1361541748046875, -0.12868881225585938, -0.12122344970703125, -0.11375808715820312, -0.106292724609375, -0.09882736206054688, -0.09136199951171875, -0.08389663696289062, -0.0764312744140625, -0.06896591186523438, -0.06150054931640625, -0.054035186767578125, -0.04656982421875, -0.039104461669921875, -0.03163909912109375, -0.024173736572265625, -0.0167083740234375, -0.009243011474609375, -0.00177764892578125, 0.005687713623046875, 0.013153076171875, 0.020618438720703125, 0.02808380126953125, 0.035549163818359375, 0.0430145263671875, 0.050479888916015625, 0.05794525146484375, 0.06541061401367188, 0.0728759765625, 0.08034133911132812, 0.08780670166015625, 0.09527206420898438, 0.1027374267578125, 0.11020278930664062, 0.11766815185546875, 0.12513351440429688, 0.132598876953125, 0.14006423950195312, 0.14752960205078125, 0.15499496459960938, 0.1624603271484375, 0.16992568969726562, 0.17739105224609375, 0.18485641479492188, 0.19232177734375, 0.19978713989257812, 0.20725250244140625, 0.21471786499023438, 0.2221832275390625, 0.22964859008789062, 0.23711395263671875, 0.24457931518554688, 0.252044677734375, 0.2595100402832031, 0.26697540283203125, 0.2744407653808594, 0.2819061279296875, 0.2893714904785156, 0.29683685302734375, 0.3043022155761719, 0.311767578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 10.0, 5.0, 22.0, 36.0, 46.0, 66.0, 95.0, 90.0, 111.0, 125.0, 105.0, 106.0, 61.0, 45.0, 32.0, 16.0, 16.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06329345703125, -0.05913066864013672, -0.05496788024902344, -0.050805091857910156, -0.046642303466796875, -0.042479515075683594, -0.03831672668457031, -0.03415393829345703, -0.02999114990234375, -0.02582836151123047, -0.021665573120117188, -0.017502784729003906, -0.013339996337890625, -0.009177207946777344, -0.0050144195556640625, -0.0008516311645507812, 0.0033111572265625, 0.007473945617675781, 0.011636734008789062, 0.015799522399902344, 0.019962310791015625, 0.024125099182128906, 0.028287887573242188, 0.03245067596435547, 0.03661346435546875, 0.04077625274658203, 0.04493904113769531, 0.049101829528808594, 0.053264617919921875, 0.057427406311035156, 0.06159019470214844, 0.06575298309326172, 0.069915771484375, 0.07407855987548828, 0.07824134826660156, 0.08240413665771484, 0.08656692504882812, 0.0907297134399414, 0.09489250183105469, 0.09905529022216797, 0.10321807861328125, 0.10738086700439453, 0.11154365539550781, 0.1157064437866211, 0.11986923217773438, 0.12403202056884766, 0.12819480895996094, 0.13235759735107422, 0.1365203857421875, 0.14068317413330078, 0.14484596252441406, 0.14900875091552734, 0.15317153930664062, 0.1573343276977539, 0.1614971160888672, 0.16565990447998047, 0.16982269287109375, 0.17398548126220703, 0.1781482696533203, 0.1823110580444336, 0.18647384643554688, 0.19063663482666016, 0.19479942321777344, 0.19896221160888672, 0.203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 8.0, 17.0, 13.0, 21.0, 28.0, 43.0, 57.0, 123.0, 179.0, 367.0, 991.0, 3211.0, 15148.0, 125987.0, 1916748.0, 1980006.0, 130343.0, 15855.0, 3220.0, 957.0, 400.0, 172.0, 113.0, 78.0, 62.0, 38.0, 23.0, 15.0, 19.0, 5.0, 8.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2003173828125, -0.19364166259765625, -0.1869659423828125, -0.18029022216796875, -0.173614501953125, -0.16693878173828125, -0.1602630615234375, -0.15358734130859375, -0.14691162109375, -0.14023590087890625, -0.1335601806640625, -0.12688446044921875, -0.120208740234375, -0.11353302001953125, -0.1068572998046875, -0.10018157958984375, -0.093505859375, -0.08683013916015625, -0.0801544189453125, -0.07347869873046875, -0.066802978515625, -0.06012725830078125, -0.0534515380859375, -0.04677581787109375, -0.04010009765625, -0.03342437744140625, -0.0267486572265625, -0.02007293701171875, -0.013397216796875, -0.00672149658203125, -4.57763671875e-05, 0.00662994384765625, 0.0133056640625, 0.01998138427734375, 0.0266571044921875, 0.03333282470703125, 0.040008544921875, 0.04668426513671875, 0.0533599853515625, 0.06003570556640625, 0.06671142578125, 0.07338714599609375, 0.0800628662109375, 0.08673858642578125, 0.093414306640625, 0.10009002685546875, 0.1067657470703125, 0.11344146728515625, 0.1201171875, 0.12679290771484375, 0.1334686279296875, 0.14014434814453125, 0.146820068359375, 0.15349578857421875, 0.1601715087890625, 0.16684722900390625, 0.17352294921875, 0.18019866943359375, 0.1868743896484375, 0.19355010986328125, 0.200225830078125, 0.20690155029296875, 0.2135772705078125, 0.22025299072265625, 0.2269287109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 9.0, 11.0, 13.0, 18.0, 27.0, 38.0, 46.0, 76.0, 88.0, 145.0, 222.0, 282.0, 401.0, 494.0, 564.0, 484.0, 365.0, 248.0, 170.0, 113.0, 93.0, 56.0, 30.0, 20.0, 18.0, 14.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129638671875, -0.12615394592285156, -0.12266921997070312, -0.11918449401855469, -0.11569976806640625, -0.11221504211425781, -0.10873031616210938, -0.10524559020996094, -0.1017608642578125, -0.09827613830566406, -0.09479141235351562, -0.09130668640136719, -0.08782196044921875, -0.08433723449707031, -0.08085250854492188, -0.07736778259277344, -0.073883056640625, -0.07039833068847656, -0.06691360473632812, -0.06342887878417969, -0.05994415283203125, -0.05645942687988281, -0.052974700927734375, -0.04948997497558594, -0.0460052490234375, -0.04252052307128906, -0.039035797119140625, -0.03555107116699219, -0.03206634521484375, -0.028581619262695312, -0.025096893310546875, -0.021612167358398438, -0.01812744140625, -0.014642715454101562, -0.011157989501953125, -0.0076732635498046875, -0.00418853759765625, -0.0007038116455078125, 0.002780914306640625, 0.0062656402587890625, 0.0097503662109375, 0.013235092163085938, 0.016719818115234375, 0.020204544067382812, 0.02368927001953125, 0.027173995971679688, 0.030658721923828125, 0.03414344787597656, 0.037628173828125, 0.04111289978027344, 0.044597625732421875, 0.04808235168457031, 0.05156707763671875, 0.05505180358886719, 0.058536529541015625, 0.06202125549316406, 0.0655059814453125, 0.06899070739746094, 0.07247543334960938, 0.07596015930175781, 0.07944488525390625, 0.08292961120605469, 0.08641433715820312, 0.08989906311035156, 0.0933837890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 20.0, 38.0, 95.0, 168.0, 215.0, 212.0, 127.0, 80.0, 24.0, 13.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359740138053894, -1.3247348070144653, -1.2897295951843262, -1.2547242641448975, -1.2197190523147583, -1.1847137212753296, -1.1497085094451904, -1.1147031784057617, -1.079697847366333, -1.0446925163269043, -1.0096873044967651, -0.9746820330619812, -0.9396767616271973, -0.9046714305877686, -0.8696661591529846, -0.8346608877182007, -0.7996556758880615, -0.7646504044532776, -0.7296451330184937, -0.6946398615837097, -0.6596345901489258, -0.6246292591094971, -0.5896239876747131, -0.5546187162399292, -0.5196134448051453, -0.48460817337036133, -0.4496029019355774, -0.41459760069847107, -0.37959232926368713, -0.3445870578289032, -0.3095817565917969, -0.27457648515701294, -0.23957133293151855, -0.20456606149673462, -0.1695607751607895, -0.13455548882484436, -0.09955021739006042, -0.06454494595527649, -0.02953965961933136, 0.0054656267166137695, 0.040470898151397705, 0.07547617703676224, 0.11048145592212677, 0.1454867422580719, 0.18049201369285583, 0.21549728512763977, 0.2505025863647461, 0.28550785779953003, 0.32051312923431396, 0.3555184006690979, 0.39052367210388184, 0.42552897334098816, 0.4605342447757721, 0.49553951621055603, 0.5305448174476624, 0.5655500888824463, 0.6005553603172302, 0.6355606317520142, 0.6705659031867981, 0.705571174621582, 0.7405765056610107, 0.7755817174911499, 0.8105870485305786, 0.8455923199653625, 0.8805975914001465]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 11.0, 8.0, 11.0, 18.0, 15.0, 20.0, 23.0, 28.0, 22.0, 25.0, 38.0, 40.0, 60.0, 53.0, 52.0, 48.0, 50.0, 49.0, 40.0, 49.0, 40.0, 40.0, 30.0, 32.0, 41.0, 24.0, 28.0, 17.0, 22.0, 13.0, 11.0, 15.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3257802128791809, -0.31436967849731445, -0.3029591143131256, -0.29154857993125916, -0.2801380157470703, -0.26872748136520386, -0.2573169469833374, -0.24590638279914856, -0.2344958335161209, -0.22308528423309326, -0.2116747349500656, -0.20026418566703796, -0.1888536512851715, -0.17744308710098267, -0.1660325527191162, -0.15462200343608856, -0.1432114541530609, -0.13180090487003326, -0.12039035558700562, -0.10897981375455856, -0.09756926447153091, -0.08615871518850327, -0.07474817335605621, -0.06333762407302856, -0.051927074790000916, -0.04051652550697327, -0.029105979949235916, -0.017695434391498566, -0.006284885108470917, 0.005125664174556732, 0.016536206007003784, 0.027946755290031433, 0.03935730457305908, 0.05076785385608673, 0.06217839941382408, 0.07358894497156143, 0.08499949425458908, 0.09641004353761673, 0.10782058537006378, 0.11923113465309143, 0.13064168393611908, 0.14205223321914673, 0.15346278250217438, 0.16487333178520203, 0.17628386616706848, 0.18769443035125732, 0.19910496473312378, 0.21051551401615143, 0.22192606329917908, 0.23333661258220673, 0.24474716186523438, 0.25615769624710083, 0.2675682604312897, 0.27897879481315613, 0.29038935899734497, 0.3017998933792114, 0.3132104277610779, 0.32462096214294434, 0.3360315263271332, 0.34744206070899963, 0.3588526248931885, 0.37026315927505493, 0.3816736936569214, 0.39308425784111023, 0.4044948220252991]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 17.0, 15.0, 21.0, 32.0, 41.0, 66.0, 95.0, 128.0, 170.0, 258.0, 408.0, 709.0, 1400.0, 3532.0, 10784.0, 45827.0, 246227.0, 546444.0, 150271.0, 29143.0, 7573.0, 2608.0, 1108.0, 602.0, 356.0, 212.0, 138.0, 100.0, 77.0, 48.0, 39.0, 21.0, 21.0, 18.0, 9.0, 8.0, 10.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.470458984375, -0.45676422119140625, -0.4430694580078125, -0.42937469482421875, -0.415679931640625, -0.40198516845703125, -0.3882904052734375, -0.37459564208984375, -0.36090087890625, -0.34720611572265625, -0.3335113525390625, -0.31981658935546875, -0.306121826171875, -0.29242706298828125, -0.2787322998046875, -0.26503753662109375, -0.2513427734375, -0.23764801025390625, -0.2239532470703125, -0.21025848388671875, -0.196563720703125, -0.18286895751953125, -0.1691741943359375, -0.15547943115234375, -0.14178466796875, -0.12808990478515625, -0.1143951416015625, -0.10070037841796875, -0.087005615234375, -0.07331085205078125, -0.0596160888671875, -0.04592132568359375, -0.0322265625, -0.01853179931640625, -0.0048370361328125, 0.00885772705078125, 0.022552490234375, 0.03624725341796875, 0.0499420166015625, 0.06363677978515625, 0.07733154296875, 0.09102630615234375, 0.1047210693359375, 0.11841583251953125, 0.132110595703125, 0.14580535888671875, 0.1595001220703125, 0.17319488525390625, 0.1868896484375, 0.20058441162109375, 0.2142791748046875, 0.22797393798828125, 0.241668701171875, 0.25536346435546875, 0.2690582275390625, 0.28275299072265625, 0.29644775390625, 0.31014251708984375, 0.3238372802734375, 0.33753204345703125, 0.351226806640625, 0.36492156982421875, 0.3786163330078125, 0.39231109619140625, 0.406005859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 7.0, 10.0, 22.0, 30.0, 59.0, 77.0, 105.0, 87.0, 127.0, 129.0, 121.0, 80.0, 56.0, 31.0, 31.0, 7.0, 11.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0634765625, -0.059200286865234375, -0.05492401123046875, -0.050647735595703125, -0.0463714599609375, -0.042095184326171875, -0.03781890869140625, -0.033542633056640625, -0.029266357421875, -0.024990081787109375, -0.02071380615234375, -0.016437530517578125, -0.0121612548828125, -0.007884979248046875, -0.00360870361328125, 0.000667572021484375, 0.00494384765625, 0.009220123291015625, 0.01349639892578125, 0.017772674560546875, 0.0220489501953125, 0.026325225830078125, 0.03060150146484375, 0.034877777099609375, 0.039154052734375, 0.043430328369140625, 0.04770660400390625, 0.051982879638671875, 0.0562591552734375, 0.060535430908203125, 0.06481170654296875, 0.06908798217773438, 0.0733642578125, 0.07764053344726562, 0.08191680908203125, 0.08619308471679688, 0.0904693603515625, 0.09474563598632812, 0.09902191162109375, 0.10329818725585938, 0.107574462890625, 0.11185073852539062, 0.11612701416015625, 0.12040328979492188, 0.1246795654296875, 0.12895584106445312, 0.13323211669921875, 0.13750839233398438, 0.14178466796875, 0.14606094360351562, 0.15033721923828125, 0.15461349487304688, 0.1588897705078125, 0.16316604614257812, 0.16744232177734375, 0.17171859741210938, 0.175994873046875, 0.18027114868164062, 0.18454742431640625, 0.18882369995117188, 0.1930999755859375, 0.19737625122070312, 0.20165252685546875, 0.20592880249023438, 0.210205078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 13.0, 9.0, 10.0, 23.0, 21.0, 27.0, 40.0, 53.0, 103.0, 136.0, 250.0, 408.0, 695.0, 1255.0, 2365.0, 4827.0, 9957.0, 21860.0, 48510.0, 105215.0, 199007.0, 262620.0, 197652.0, 103702.0, 47756.0, 21872.0, 9970.0, 4841.0, 2402.0, 1170.0, 675.0, 408.0, 265.0, 131.0, 91.0, 72.0, 51.0, 20.0, 19.0, 21.0, 15.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.1976318359375, -0.19190216064453125, -0.1861724853515625, -0.18044281005859375, -0.174713134765625, -0.16898345947265625, -0.1632537841796875, -0.15752410888671875, -0.15179443359375, -0.14606475830078125, -0.1403350830078125, -0.13460540771484375, -0.128875732421875, -0.12314605712890625, -0.1174163818359375, -0.11168670654296875, -0.10595703125, -0.10022735595703125, -0.0944976806640625, -0.08876800537109375, -0.083038330078125, -0.07730865478515625, -0.0715789794921875, -0.06584930419921875, -0.06011962890625, -0.05438995361328125, -0.0486602783203125, -0.04293060302734375, -0.037200927734375, -0.03147125244140625, -0.0257415771484375, -0.02001190185546875, -0.0142822265625, -0.00855255126953125, -0.0028228759765625, 0.00290679931640625, 0.008636474609375, 0.01436614990234375, 0.0200958251953125, 0.02582550048828125, 0.03155517578125, 0.03728485107421875, 0.0430145263671875, 0.04874420166015625, 0.054473876953125, 0.06020355224609375, 0.0659332275390625, 0.07166290283203125, 0.077392578125, 0.08312225341796875, 0.0888519287109375, 0.09458160400390625, 0.100311279296875, 0.10604095458984375, 0.1117706298828125, 0.11750030517578125, 0.12322998046875, 0.12895965576171875, 0.1346893310546875, 0.14041900634765625, 0.146148681640625, 0.15187835693359375, 0.1576080322265625, 0.16333770751953125, 0.1690673828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 9.0, 10.0, 10.0, 17.0, 15.0, 22.0, 31.0, 22.0, 32.0, 42.0, 27.0, 39.0, 52.0, 45.0, 67.0, 49.0, 50.0, 52.0, 38.0, 53.0, 37.0, 47.0, 29.0, 30.0, 30.0, 26.0, 23.0, 18.0, 16.0, 18.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1910400390625, -0.1848888397216797, -0.17873764038085938, -0.17258644104003906, -0.16643524169921875, -0.16028404235839844, -0.15413284301757812, -0.1479816436767578, -0.1418304443359375, -0.1356792449951172, -0.12952804565429688, -0.12337684631347656, -0.11722564697265625, -0.11107444763183594, -0.10492324829101562, -0.09877204895019531, -0.092620849609375, -0.08646965026855469, -0.08031845092773438, -0.07416725158691406, -0.06801605224609375, -0.06186485290527344, -0.055713653564453125, -0.04956245422363281, -0.0434112548828125, -0.03726005554199219, -0.031108856201171875, -0.024957656860351562, -0.01880645751953125, -0.012655258178710938, -0.006504058837890625, -0.0003528594970703125, 0.00579833984375, 0.011949539184570312, 0.018100738525390625, 0.024251937866210938, 0.03040313720703125, 0.03655433654785156, 0.042705535888671875, 0.04885673522949219, 0.0550079345703125, 0.06115913391113281, 0.06731033325195312, 0.07346153259277344, 0.07961273193359375, 0.08576393127441406, 0.09191513061523438, 0.09806632995605469, 0.104217529296875, 0.11036872863769531, 0.11651992797851562, 0.12267112731933594, 0.12882232666015625, 0.13497352600097656, 0.14112472534179688, 0.1472759246826172, 0.1534271240234375, 0.1595783233642578, 0.16572952270507812, 0.17188072204589844, 0.17803192138671875, 0.18418312072753906, 0.19033432006835938, 0.1964855194091797, 0.20263671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 6.0, 7.0, 17.0, 22.0, 21.0, 45.0, 54.0, 89.0, 98.0, 147.0, 236.0, 323.0, 435.0, 605.0, 894.0, 1389.0, 2141.0, 3483.0, 5842.0, 10647.0, 22104.0, 48792.0, 113417.0, 231069.0, 282487.0, 175111.0, 78045.0, 34140.0, 15938.0, 8212.0, 4519.0, 2777.0, 1702.0, 1162.0, 805.0, 502.0, 362.0, 278.0, 162.0, 138.0, 91.0, 60.0, 66.0, 37.0, 19.0, 19.0, 14.0, 9.0, 6.0, 4.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.07822704315185547, -0.07564353942871094, -0.0730600357055664, -0.07047653198242188, -0.06789302825927734, -0.06530952453613281, -0.06272602081298828, -0.06014251708984375, -0.05755901336669922, -0.05497550964355469, -0.052392005920410156, -0.049808502197265625, -0.047224998474121094, -0.04464149475097656, -0.04205799102783203, -0.0394744873046875, -0.03689098358154297, -0.03430747985839844, -0.031723976135253906, -0.029140472412109375, -0.026556968688964844, -0.023973464965820312, -0.02138996124267578, -0.01880645751953125, -0.01622295379638672, -0.013639450073242188, -0.011055946350097656, -0.008472442626953125, -0.005888938903808594, -0.0033054351806640625, -0.0007219314575195312, 0.001861572265625, 0.004445075988769531, 0.0070285797119140625, 0.009612083435058594, 0.012195587158203125, 0.014779090881347656, 0.017362594604492188, 0.01994609832763672, 0.02252960205078125, 0.02511310577392578, 0.027696609497070312, 0.030280113220214844, 0.032863616943359375, 0.035447120666503906, 0.03803062438964844, 0.04061412811279297, 0.0431976318359375, 0.04578113555908203, 0.04836463928222656, 0.050948143005371094, 0.053531646728515625, 0.056115150451660156, 0.05869865417480469, 0.06128215789794922, 0.06386566162109375, 0.06644916534423828, 0.06903266906738281, 0.07161617279052734, 0.07419967651367188, 0.0767831802368164, 0.07936668395996094, 0.08195018768310547, 0.08453369140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 5.0, 8.0, 9.0, 12.0, 14.0, 17.0, 23.0, 59.0, 67.0, 87.0, 110.0, 129.0, 130.0, 88.0, 79.0, 44.0, 38.0, 20.0, 14.0, 10.0, 9.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.378225326538086e-05, -2.2814609110355377e-05, -2.1846964955329895e-05, -2.0879320800304413e-05, -1.991167664527893e-05, -1.894403249025345e-05, -1.7976388335227966e-05, -1.7008744180202484e-05, -1.6041100025177002e-05, -1.507345587015152e-05, -1.4105811715126038e-05, -1.3138167560100555e-05, -1.2170523405075073e-05, -1.1202879250049591e-05, -1.0235235095024109e-05, -9.267590939998627e-06, -8.299946784973145e-06, -7.332302629947662e-06, -6.36465847492218e-06, -5.397014319896698e-06, -4.429370164871216e-06, -3.4617260098457336e-06, -2.4940818548202515e-06, -1.5264376997947693e-06, -5.587935447692871e-07, 4.0885061025619507e-07, 1.3764947652816772e-06, 2.3441389203071594e-06, 3.3117830753326416e-06, 4.279427230358124e-06, 5.247071385383606e-06, 6.214715540409088e-06, 7.18235969543457e-06, 8.150003850460052e-06, 9.117648005485535e-06, 1.0085292160511017e-05, 1.1052936315536499e-05, 1.2020580470561981e-05, 1.2988224625587463e-05, 1.3955868780612946e-05, 1.4923512935638428e-05, 1.589115709066391e-05, 1.6858801245689392e-05, 1.7826445400714874e-05, 1.8794089555740356e-05, 1.976173371076584e-05, 2.072937786579132e-05, 2.1697022020816803e-05, 2.2664666175842285e-05, 2.3632310330867767e-05, 2.459995448589325e-05, 2.556759864091873e-05, 2.6535242795944214e-05, 2.7502886950969696e-05, 2.8470531105995178e-05, 2.943817526102066e-05, 3.0405819416046143e-05, 3.1373463571071625e-05, 3.234110772609711e-05, 3.330875188112259e-05, 3.427639603614807e-05, 3.5244040191173553e-05, 3.6211684346199036e-05, 3.717932850122452e-05, 3.814697265625e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 11.0, 12.0, 24.0, 48.0, 95.0, 124.0, 209.0, 320.0, 581.0, 955.0, 1605.0, 2834.0, 5888.0, 12766.0, 34427.0, 118932.0, 365098.0, 341716.0, 107196.0, 31662.0, 11933.0, 5464.0, 2831.0, 1551.0, 935.0, 486.0, 314.0, 194.0, 116.0, 65.0, 55.0, 36.0, 26.0, 11.0, 6.0, 10.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.1267690658569336, -0.12292289733886719, -0.11907672882080078, -0.11523056030273438, -0.11138439178466797, -0.10753822326660156, -0.10369205474853516, -0.09984588623046875, -0.09599971771240234, -0.09215354919433594, -0.08830738067626953, -0.08446121215820312, -0.08061504364013672, -0.07676887512207031, -0.0729227066040039, -0.0690765380859375, -0.0652303695678711, -0.06138420104980469, -0.05753803253173828, -0.053691864013671875, -0.04984569549560547, -0.04599952697753906, -0.042153358459472656, -0.03830718994140625, -0.034461021423339844, -0.030614852905273438, -0.02676868438720703, -0.022922515869140625, -0.01907634735107422, -0.015230178833007812, -0.011384010314941406, -0.007537841796875, -0.0036916732788085938, 0.0001544952392578125, 0.004000663757324219, 0.007846832275390625, 0.011693000793457031, 0.015539169311523438, 0.019385337829589844, 0.02323150634765625, 0.027077674865722656, 0.030923843383789062, 0.03477001190185547, 0.038616180419921875, 0.04246234893798828, 0.04630851745605469, 0.050154685974121094, 0.0540008544921875, 0.057847023010253906, 0.06169319152832031, 0.06553936004638672, 0.06938552856445312, 0.07323169708251953, 0.07707786560058594, 0.08092403411865234, 0.08477020263671875, 0.08861637115478516, 0.09246253967285156, 0.09630870819091797, 0.10015487670898438, 0.10400104522705078, 0.10784721374511719, 0.1116933822631836, 0.11553955078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 7.0, 5.0, 15.0, 21.0, 30.0, 43.0, 49.0, 51.0, 65.0, 83.0, 93.0, 99.0, 105.0, 72.0, 58.0, 48.0, 33.0, 28.0, 12.0, 22.0, 19.0, 6.0, 10.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0870361328125, -0.08404731750488281, -0.08105850219726562, -0.07806968688964844, -0.07508087158203125, -0.07209205627441406, -0.06910324096679688, -0.06611442565917969, -0.0631256103515625, -0.06013679504394531, -0.057147979736328125, -0.05415916442871094, -0.05117034912109375, -0.04818153381347656, -0.045192718505859375, -0.04220390319824219, -0.039215087890625, -0.03622627258300781, -0.033237457275390625, -0.030248641967773438, -0.02725982666015625, -0.024271011352539062, -0.021282196044921875, -0.018293380737304688, -0.0153045654296875, -0.012315750122070312, -0.009326934814453125, -0.0063381195068359375, -0.00334930419921875, -0.0003604888916015625, 0.002628326416015625, 0.0056171417236328125, 0.00860595703125, 0.011594772338867188, 0.014583587646484375, 0.017572402954101562, 0.02056121826171875, 0.023550033569335938, 0.026538848876953125, 0.029527664184570312, 0.0325164794921875, 0.03550529479980469, 0.038494110107421875, 0.04148292541503906, 0.04447174072265625, 0.04746055603027344, 0.050449371337890625, 0.05343818664550781, 0.056427001953125, 0.05941581726074219, 0.062404632568359375, 0.06539344787597656, 0.06838226318359375, 0.07137107849121094, 0.07435989379882812, 0.07734870910644531, 0.0803375244140625, 0.08332633972167969, 0.08631515502929688, 0.08930397033691406, 0.09229278564453125, 0.09528160095214844, 0.09827041625976562, 0.10125923156738281, 0.104248046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 47.0, 176.0, 383.0, 281.0, 101.0, 19.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.578874111175537, -2.454348087310791, -2.329821825027466, -2.2052958011627197, -2.0807695388793945, -1.9562435150146484, -1.8317172527313232, -1.7071912288665771, -1.582664966583252, -1.4581388235092163, -1.3336126804351807, -1.209086537361145, -1.0845603942871094, -0.9600343108177185, -0.8355081677436829, -0.7109820246696472, -0.5864559412002563, -0.4619297981262207, -0.33740365505218506, -0.2128775417804718, -0.08835139870643616, 0.0361747145652771, 0.16070085763931274, 0.2852270007133484, 0.40975314378738403, 0.5342792868614197, 0.6588054299354553, 0.7833315134048462, 0.9078576564788818, 1.0323837995529175, 1.1569099426269531, 1.2814360857009888, 1.4059622287750244, 1.53048837184906, 1.6550145149230957, 1.7795406579971313, 1.904066801071167, 2.028592824935913, 2.1531190872192383, 2.2776451110839844, 2.4021713733673096, 2.5266973972320557, 2.651223659515381, 2.775749683380127, 2.900275945663452, 3.0248019695281982, 3.1493282318115234, 3.2738542556762695, 3.3983802795410156, 3.5229063034057617, 3.647432565689087, 3.771958589553833, 3.896484851837158, 4.021010875701904, 4.14553689956665, 4.270063400268555, 4.394589424133301, 4.519115447998047, 4.643641471862793, 4.768167972564697, 4.892693996429443, 5.0172200202941895, 5.1417460441589355, 5.26627254486084, 5.390798568725586]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 4.0, 5.0, 11.0, 3.0, 7.0, 13.0, 10.0, 19.0, 15.0, 16.0, 22.0, 24.0, 35.0, 36.0, 26.0, 33.0, 37.0, 49.0, 35.0, 40.0, 42.0, 35.0, 33.0, 33.0, 43.0, 40.0, 38.0, 35.0, 40.0, 19.0, 33.0, 16.0, 26.0, 12.0, 21.0, 17.0, 11.0, 19.0, 10.0, 4.0, 9.0, 8.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6638127565383911, -0.6432740688323975, -0.6227354407310486, -0.6021967530250549, -0.5816580653190613, -0.5611194372177124, -0.5405807495117188, -0.5200420618057251, -0.4995034337043762, -0.47896477580070496, -0.4584260880947113, -0.43788743019104004, -0.4173487722873688, -0.3968101143836975, -0.37627142667770386, -0.3557327687740326, -0.33519408106803894, -0.3146554231643677, -0.294116735458374, -0.27357807755470276, -0.2530394196510315, -0.23250074684619904, -0.21196207404136658, -0.1914234161376953, -0.17088474333286285, -0.1503460705280304, -0.12980741262435913, -0.10926873981952667, -0.08873007446527481, -0.06819140911102295, -0.04765273630619049, -0.027114078402519226, -0.006575405597686768, 0.013963261619210243, 0.034501928836107254, 0.055040597915649414, 0.07557926326990128, 0.09611792862415314, 0.1166566014289856, 0.13719525933265686, 0.15773393213748932, 0.17827260494232178, 0.19881126284599304, 0.2193499356508255, 0.23988860845565796, 0.2604272663593292, 0.2809659242630005, 0.30150461196899414, 0.3220432698726654, 0.34258192777633667, 0.3631206154823303, 0.3836592733860016, 0.40419793128967285, 0.4247366189956665, 0.44527527689933777, 0.46581393480300903, 0.4863526225090027, 0.5068913102149963, 0.5274299383163452, 0.5479686260223389, 0.5685073137283325, 0.5890459418296814, 0.609584629535675, 0.6301232576370239, 0.6506619453430176]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 28.0, 53.0, 132.0, 342.0, 1169.0, 5426.0, 37566.0, 1196452.0, 2884109.0, 59241.0, 6830.0, 1591.0, 626.0, 309.0, 174.0, 89.0, 52.0, 29.0, 19.0, 16.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25732421875, -0.24665069580078125, -0.2359771728515625, -0.22530364990234375, -0.214630126953125, -0.20395660400390625, -0.1932830810546875, -0.18260955810546875, -0.17193603515625, -0.16126251220703125, -0.1505889892578125, -0.13991546630859375, -0.129241943359375, -0.11856842041015625, -0.1078948974609375, -0.09722137451171875, -0.0865478515625, -0.07587432861328125, -0.0652008056640625, -0.05452728271484375, -0.043853759765625, -0.03318023681640625, -0.0225067138671875, -0.01183319091796875, -0.00115966796875, 0.00951385498046875, 0.0201873779296875, 0.03086090087890625, 0.041534423828125, 0.05220794677734375, 0.0628814697265625, 0.07355499267578125, 0.084228515625, 0.09490203857421875, 0.1055755615234375, 0.11624908447265625, 0.126922607421875, 0.13759613037109375, 0.1482696533203125, 0.15894317626953125, 0.16961669921875, 0.18029022216796875, 0.1909637451171875, 0.20163726806640625, 0.212310791015625, 0.22298431396484375, 0.2336578369140625, 0.24433135986328125, 0.2550048828125, 0.26567840576171875, 0.2763519287109375, 0.28702545166015625, 0.297698974609375, 0.30837249755859375, 0.3190460205078125, 0.32971954345703125, 0.34039306640625, 0.35106658935546875, 0.3617401123046875, 0.37241363525390625, 0.383087158203125, 0.39376068115234375, 0.4044342041015625, 0.41510772705078125, 0.42578125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 8.0, 22.0, 32.0, 37.0, 49.0, 75.0, 90.0, 117.0, 101.0, 115.0, 96.0, 71.0, 70.0, 38.0, 24.0, 19.0, 19.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.078125, -0.07344627380371094, -0.06876754760742188, -0.06408882141113281, -0.05941009521484375, -0.05473136901855469, -0.050052642822265625, -0.04537391662597656, -0.0406951904296875, -0.03601646423339844, -0.031337738037109375, -0.026659011840820312, -0.02198028564453125, -0.017301559448242188, -0.012622833251953125, -0.007944107055664062, -0.003265380859375, 0.0014133453369140625, 0.006092071533203125, 0.010770797729492188, 0.01544952392578125, 0.020128250122070312, 0.024806976318359375, 0.029485702514648438, 0.0341644287109375, 0.03884315490722656, 0.043521881103515625, 0.04820060729980469, 0.05287933349609375, 0.05755805969238281, 0.062236785888671875, 0.06691551208496094, 0.07159423828125, 0.07627296447753906, 0.08095169067382812, 0.08563041687011719, 0.09030914306640625, 0.09498786926269531, 0.09966659545898438, 0.10434532165527344, 0.1090240478515625, 0.11370277404785156, 0.11838150024414062, 0.12306022644042969, 0.12773895263671875, 0.1324176788330078, 0.13709640502929688, 0.14177513122558594, 0.146453857421875, 0.15113258361816406, 0.15581130981445312, 0.1604900360107422, 0.16516876220703125, 0.1698474884033203, 0.17452621459960938, 0.17920494079589844, 0.1838836669921875, 0.18856239318847656, 0.19324111938476562, 0.1979198455810547, 0.20259857177734375, 0.2072772979736328, 0.21195602416992188, 0.21663475036621094, 0.2213134765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 15.0, 35.0, 45.0, 64.0, 167.0, 283.0, 560.0, 1231.0, 3868.0, 15229.0, 92389.0, 1102564.0, 2728909.0, 211440.0, 27939.0, 6139.0, 1912.0, 752.0, 324.0, 157.0, 91.0, 63.0, 29.0, 21.0, 16.0, 13.0, 5.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.323974609375, -0.31647300720214844, -0.3089714050292969, -0.3014698028564453, -0.29396820068359375, -0.2864665985107422, -0.2789649963378906, -0.27146339416503906, -0.2639617919921875, -0.25646018981933594, -0.24895858764648438, -0.2414569854736328, -0.23395538330078125, -0.2264537811279297, -0.21895217895507812, -0.21145057678222656, -0.203948974609375, -0.19644737243652344, -0.18894577026367188, -0.1814441680908203, -0.17394256591796875, -0.1664409637451172, -0.15893936157226562, -0.15143775939941406, -0.1439361572265625, -0.13643455505371094, -0.12893295288085938, -0.12143135070800781, -0.11392974853515625, -0.10642814636230469, -0.09892654418945312, -0.09142494201660156, -0.08392333984375, -0.07642173767089844, -0.06892013549804688, -0.06141853332519531, -0.05391693115234375, -0.04641532897949219, -0.038913726806640625, -0.03141212463378906, -0.0239105224609375, -0.016408920288085938, -0.008907318115234375, -0.0014057159423828125, 0.00609588623046875, 0.013597488403320312, 0.021099090576171875, 0.028600692749023438, 0.036102294921875, 0.04360389709472656, 0.051105499267578125, 0.05860710144042969, 0.06610870361328125, 0.07361030578613281, 0.08111190795898438, 0.08861351013183594, 0.0961151123046875, 0.10361671447753906, 0.11111831665039062, 0.11861991882324219, 0.12612152099609375, 0.1336231231689453, 0.14112472534179688, 0.14862632751464844, 0.1561279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 15.0, 29.0, 42.0, 60.0, 110.0, 175.0, 221.0, 356.0, 566.0, 753.0, 623.0, 409.0, 233.0, 194.0, 101.0, 42.0, 45.0, 33.0, 9.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12398910522460938, -0.11894989013671875, -0.11391067504882812, -0.1088714599609375, -0.10383224487304688, -0.09879302978515625, -0.09375381469726562, -0.088714599609375, -0.08367538452148438, -0.07863616943359375, -0.07359695434570312, -0.0685577392578125, -0.06351852416992188, -0.05847930908203125, -0.053440093994140625, -0.04840087890625, -0.043361663818359375, -0.03832244873046875, -0.033283233642578125, -0.0282440185546875, -0.023204803466796875, -0.01816558837890625, -0.013126373291015625, -0.008087158203125, -0.003047943115234375, 0.00199127197265625, 0.007030487060546875, 0.0120697021484375, 0.017108917236328125, 0.02214813232421875, 0.027187347412109375, 0.0322265625, 0.037265777587890625, 0.04230499267578125, 0.047344207763671875, 0.0523834228515625, 0.057422637939453125, 0.06246185302734375, 0.06750106811523438, 0.072540283203125, 0.07757949829101562, 0.08261871337890625, 0.08765792846679688, 0.0926971435546875, 0.09773635864257812, 0.10277557373046875, 0.10781478881835938, 0.11285400390625, 0.11789321899414062, 0.12293243408203125, 0.12797164916992188, 0.1330108642578125, 0.13805007934570312, 0.14308929443359375, 0.14812850952148438, 0.153167724609375, 0.15820693969726562, 0.16324615478515625, 0.16828536987304688, 0.1733245849609375, 0.17836380004882812, 0.18340301513671875, 0.18844223022460938, 0.1934814453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 11.0, 12.0, 36.0, 95.0, 147.0, 159.0, 178.0, 165.0, 92.0, 54.0, 32.0, 14.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3531036376953125, -1.314698338508606, -1.2762930393218994, -1.2378876209259033, -1.1994823217391968, -1.1610770225524902, -1.1226716041564941, -1.0842663049697876, -1.045861005783081, -1.0074557065963745, -0.9690503478050232, -0.9306449890136719, -0.8922396898269653, -0.8538343906402588, -0.8154290318489075, -0.7770236730575562, -0.7386183738708496, -0.7002130746841431, -0.6618077158927917, -0.6234023571014404, -0.5849970579147339, -0.5465917587280273, -0.508186399936676, -0.4697810709476471, -0.43137574195861816, -0.39297041296958923, -0.3545650839805603, -0.31615975499153137, -0.27775442600250244, -0.2393490970134735, -0.20094376802444458, -0.16253843903541565, -0.12413322925567627, -0.08572790026664734, -0.04732257127761841, -0.008917242288589478, 0.029488086700439453, 0.06789341568946838, 0.10629874467849731, 0.14470407366752625, 0.18310940265655518, 0.2215147316455841, 0.25992006063461304, 0.29832538962364197, 0.3367307186126709, 0.37513604760169983, 0.41354137659072876, 0.4519467055797577, 0.4903520345687866, 0.5287573337554932, 0.5671626925468445, 0.6055680513381958, 0.6439733505249023, 0.6823786497116089, 0.7207840085029602, 0.7591893672943115, 0.7975946664810181, 0.8359999656677246, 0.8744053244590759, 0.9128106832504272, 0.9512159824371338, 0.9896212816238403, 1.0280265808105469, 1.066431999206543, 1.1048372983932495]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 4.0, 13.0, 13.0, 22.0, 19.0, 16.0, 26.0, 27.0, 23.0, 34.0, 36.0, 38.0, 41.0, 43.0, 36.0, 43.0, 51.0, 54.0, 36.0, 31.0, 39.0, 38.0, 42.0, 33.0, 37.0, 35.0, 24.0, 36.0, 18.0, 16.0, 7.0, 12.0, 10.0, 7.0, 7.0, 2.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3875146508216858, -0.3749905526638031, -0.362466424703598, -0.34994232654571533, -0.33741819858551025, -0.32489410042762756, -0.3123699724674225, -0.2998458743095398, -0.2873217463493347, -0.274797648191452, -0.26227352023124695, -0.24974940717220306, -0.23722529411315918, -0.2247011959552765, -0.2121770679950714, -0.19965296983718872, -0.18712885677814484, -0.17460474371910095, -0.16208063066005707, -0.14955651760101318, -0.1370324045419693, -0.12450829893350601, -0.11198418587446213, -0.09946007281541824, -0.08693595975637436, -0.07441184669733047, -0.06188773363828659, -0.049363624304533005, -0.03683951124548912, -0.024315401911735535, -0.01179128885269165, 0.0007328242063522339, 0.013256937265396118, 0.025781050324440002, 0.03830516338348389, 0.05082927271723747, 0.06335338950157166, 0.07587749511003494, 0.08840160816907883, 0.10092572122812271, 0.1134498342871666, 0.12597393989562988, 0.13849805295467377, 0.15102216601371765, 0.16354627907276154, 0.17607039213180542, 0.1885945051908493, 0.2011186182498932, 0.21364273130893707, 0.22616684436798096, 0.23869095742702484, 0.2512150704860687, 0.2637391686439514, 0.2762632966041565, 0.2887873947620392, 0.30131152272224426, 0.31383562088012695, 0.32635971903800964, 0.3388838469982147, 0.3514079451560974, 0.3639320731163025, 0.3764561712741852, 0.38898029923439026, 0.40150439739227295, 0.414028525352478]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 18.0, 17.0, 31.0, 47.0, 64.0, 81.0, 121.0, 175.0, 302.0, 532.0, 1100.0, 2935.0, 9496.0, 37285.0, 187766.0, 584412.0, 174376.0, 35357.0, 9104.0, 2810.0, 1088.0, 524.0, 306.0, 193.0, 125.0, 81.0, 65.0, 39.0, 23.0, 16.0, 12.0, 11.0, 9.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.323486328125, -0.310791015625, -0.298095703125, -0.285400390625, -0.272705078125, -0.260009765625, -0.247314453125, -0.234619140625, -0.221923828125, -0.209228515625, -0.196533203125, -0.183837890625, -0.171142578125, -0.158447265625, -0.145751953125, -0.133056640625, -0.120361328125, -0.107666015625, -0.094970703125, -0.082275390625, -0.069580078125, -0.056884765625, -0.044189453125, -0.031494140625, -0.018798828125, -0.006103515625, 0.006591796875, 0.019287109375, 0.031982421875, 0.044677734375, 0.057373046875, 0.070068359375, 0.082763671875, 0.095458984375, 0.108154296875, 0.120849609375, 0.133544921875, 0.146240234375, 0.158935546875, 0.171630859375, 0.184326171875, 0.197021484375, 0.209716796875, 0.222412109375, 0.235107421875, 0.247802734375, 0.260498046875, 0.273193359375, 0.285888671875, 0.298583984375, 0.311279296875, 0.323974609375, 0.336669921875, 0.349365234375, 0.362060546875, 0.374755859375, 0.387451171875, 0.400146484375, 0.412841796875, 0.425537109375, 0.438232421875, 0.450927734375, 0.463623046875, 0.476318359375, 0.489013671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 16.0, 21.0, 26.0, 35.0, 54.0, 92.0, 80.0, 124.0, 109.0, 123.0, 77.0, 78.0, 62.0, 39.0, 23.0, 12.0, 14.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07806396484375, -0.07333660125732422, -0.06860923767089844, -0.06388187408447266, -0.059154510498046875, -0.054427146911621094, -0.04969978332519531, -0.04497241973876953, -0.04024505615234375, -0.03551769256591797, -0.030790328979492188, -0.026062965393066406, -0.021335601806640625, -0.016608238220214844, -0.011880874633789062, -0.007153511047363281, -0.0024261474609375, 0.0023012161254882812, 0.0070285797119140625, 0.011755943298339844, 0.016483306884765625, 0.021210670471191406, 0.025938034057617188, 0.03066539764404297, 0.03539276123046875, 0.04012012481689453, 0.04484748840332031, 0.049574851989746094, 0.054302215576171875, 0.059029579162597656, 0.06375694274902344, 0.06848430633544922, 0.073211669921875, 0.07793903350830078, 0.08266639709472656, 0.08739376068115234, 0.09212112426757812, 0.0968484878540039, 0.10157585144042969, 0.10630321502685547, 0.11103057861328125, 0.11575794219970703, 0.12048530578613281, 0.1252126693725586, 0.12994003295898438, 0.13466739654541016, 0.13939476013183594, 0.14412212371826172, 0.1488494873046875, 0.15357685089111328, 0.15830421447753906, 0.16303157806396484, 0.16775894165039062, 0.1724863052368164, 0.1772136688232422, 0.18194103240966797, 0.18666839599609375, 0.19139575958251953, 0.1961231231689453, 0.2008504867553711, 0.20557785034179688, 0.21030521392822266, 0.21503257751464844, 0.21975994110107422, 0.2244873046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 18.0, 16.0, 19.0, 35.0, 49.0, 80.0, 162.0, 352.0, 1064.0, 3572.0, 14514.0, 67109.0, 354508.0, 479122.0, 99847.0, 20849.0, 5011.0, 1317.0, 412.0, 189.0, 113.0, 66.0, 37.0, 20.0, 13.0, 12.0, 7.0, 8.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353515625, -0.3425102233886719, -0.33150482177734375, -0.3204994201660156, -0.3094940185546875, -0.2984886169433594, -0.28748321533203125, -0.2764778137207031, -0.265472412109375, -0.2544670104980469, -0.24346160888671875, -0.23245620727539062, -0.2214508056640625, -0.21044540405273438, -0.19944000244140625, -0.18843460083007812, -0.17742919921875, -0.16642379760742188, -0.15541839599609375, -0.14441299438476562, -0.1334075927734375, -0.12240219116210938, -0.11139678955078125, -0.10039138793945312, -0.089385986328125, -0.07838058471679688, -0.06737518310546875, -0.056369781494140625, -0.0453643798828125, -0.034358978271484375, -0.02335357666015625, -0.012348175048828125, -0.0013427734375, 0.009662628173828125, 0.02066802978515625, 0.031673431396484375, 0.0426788330078125, 0.053684234619140625, 0.06468963623046875, 0.07569503784179688, 0.086700439453125, 0.09770584106445312, 0.10871124267578125, 0.11971664428710938, 0.1307220458984375, 0.14172744750976562, 0.15273284912109375, 0.16373825073242188, 0.17474365234375, 0.18574905395507812, 0.19675445556640625, 0.20775985717773438, 0.2187652587890625, 0.22977066040039062, 0.24077606201171875, 0.2517814636230469, 0.262786865234375, 0.2737922668457031, 0.28479766845703125, 0.2958030700683594, 0.3068084716796875, 0.3178138732910156, 0.32881927490234375, 0.3398246765136719, 0.350830078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 5.0, 14.0, 10.0, 16.0, 16.0, 21.0, 24.0, 28.0, 33.0, 32.0, 42.0, 66.0, 56.0, 59.0, 57.0, 55.0, 66.0, 46.0, 58.0, 47.0, 40.0, 40.0, 29.0, 32.0, 17.0, 15.0, 12.0, 18.0, 8.0, 9.0, 4.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2120361328125, -0.2046642303466797, -0.19729232788085938, -0.18992042541503906, -0.18254852294921875, -0.17517662048339844, -0.16780471801757812, -0.1604328155517578, -0.1530609130859375, -0.1456890106201172, -0.13831710815429688, -0.13094520568847656, -0.12357330322265625, -0.11620140075683594, -0.10882949829101562, -0.10145759582519531, -0.094085693359375, -0.08671379089355469, -0.07934188842773438, -0.07196998596191406, -0.06459808349609375, -0.05722618103027344, -0.049854278564453125, -0.04248237609863281, -0.0351104736328125, -0.027738571166992188, -0.020366668701171875, -0.012994766235351562, -0.00562286376953125, 0.0017490386962890625, 0.009120941162109375, 0.016492843627929688, 0.02386474609375, 0.031236648559570312, 0.038608551025390625, 0.04598045349121094, 0.05335235595703125, 0.06072425842285156, 0.06809616088867188, 0.07546806335449219, 0.0828399658203125, 0.09021186828613281, 0.09758377075195312, 0.10495567321777344, 0.11232757568359375, 0.11969947814941406, 0.12707138061523438, 0.1344432830810547, 0.141815185546875, 0.1491870880126953, 0.15655899047851562, 0.16393089294433594, 0.17130279541015625, 0.17867469787597656, 0.18604660034179688, 0.1934185028076172, 0.2007904052734375, 0.2081623077392578, 0.21553421020507812, 0.22290611267089844, 0.23027801513671875, 0.23764991760253906, 0.24502182006835938, 0.2523937225341797, 0.259765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 11.0, 16.0, 18.0, 18.0, 30.0, 37.0, 67.0, 96.0, 137.0, 195.0, 373.0, 592.0, 1213.0, 2586.0, 6427.0, 16877.0, 47749.0, 161311.0, 447135.0, 253063.0, 71113.0, 23775.0, 8733.0, 3472.0, 1547.0, 786.0, 423.0, 237.0, 125.0, 111.0, 71.0, 55.0, 43.0, 28.0, 22.0, 9.0, 14.0, 9.0, 4.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.120758056640625, -0.11639404296875, -0.112030029296875, -0.107666015625, -0.103302001953125, -0.09893798828125, -0.094573974609375, -0.0902099609375, -0.085845947265625, -0.08148193359375, -0.077117919921875, -0.07275390625, -0.068389892578125, -0.06402587890625, -0.059661865234375, -0.0552978515625, -0.050933837890625, -0.04656982421875, -0.042205810546875, -0.037841796875, -0.033477783203125, -0.02911376953125, -0.024749755859375, -0.0203857421875, -0.016021728515625, -0.01165771484375, -0.007293701171875, -0.0029296875, 0.001434326171875, 0.00579833984375, 0.010162353515625, 0.0145263671875, 0.018890380859375, 0.02325439453125, 0.027618408203125, 0.031982421875, 0.036346435546875, 0.04071044921875, 0.045074462890625, 0.0494384765625, 0.053802490234375, 0.05816650390625, 0.062530517578125, 0.06689453125, 0.071258544921875, 0.07562255859375, 0.079986572265625, 0.0843505859375, 0.088714599609375, 0.09307861328125, 0.097442626953125, 0.101806640625, 0.106170654296875, 0.11053466796875, 0.114898681640625, 0.1192626953125, 0.123626708984375, 0.12799072265625, 0.132354736328125, 0.13671875, 0.141082763671875, 0.14544677734375, 0.149810791015625, 0.1541748046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 3.0, 5.0, 7.0, 13.0, 9.0, 10.0, 11.0, 12.0, 27.0, 21.0, 42.0, 38.0, 70.0, 89.0, 93.0, 86.0, 72.0, 81.0, 68.0, 34.0, 46.0, 22.0, 21.0, 17.0, 10.0, 15.0, 10.0, 6.0, 11.0, 5.0, 6.0, 5.0, 4.0, 0.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.9729137420654297e-05, -1.9156374037265778e-05, -1.8583610653877258e-05, -1.801084727048874e-05, -1.743808388710022e-05, -1.68653205037117e-05, -1.629255712032318e-05, -1.5719793736934662e-05, -1.5147030353546143e-05, -1.4574266970157623e-05, -1.4001503586769104e-05, -1.3428740203380585e-05, -1.2855976819992065e-05, -1.2283213436603546e-05, -1.1710450053215027e-05, -1.1137686669826508e-05, -1.0564923286437988e-05, -9.992159903049469e-06, -9.41939651966095e-06, -8.84663313627243e-06, -8.273869752883911e-06, -7.701106369495392e-06, -7.1283429861068726e-06, -6.555579602718353e-06, -5.982816219329834e-06, -5.410052835941315e-06, -4.837289452552795e-06, -4.264526069164276e-06, -3.691762685775757e-06, -3.1189993023872375e-06, -2.5462359189987183e-06, -1.973472535610199e-06, -1.4007091522216797e-06, -8.279457688331604e-07, -2.551823854446411e-07, 3.175809979438782e-07, 8.903443813323975e-07, 1.4631077647209167e-06, 2.035871148109436e-06, 2.6086345314979553e-06, 3.1813979148864746e-06, 3.754161298274994e-06, 4.326924681663513e-06, 4.8996880650520325e-06, 5.472451448440552e-06, 6.045214831829071e-06, 6.61797821521759e-06, 7.19074159860611e-06, 7.763504981994629e-06, 8.336268365383148e-06, 8.909031748771667e-06, 9.481795132160187e-06, 1.0054558515548706e-05, 1.0627321898937225e-05, 1.1200085282325745e-05, 1.1772848665714264e-05, 1.2345612049102783e-05, 1.2918375432491302e-05, 1.3491138815879822e-05, 1.4063902199268341e-05, 1.463666558265686e-05, 1.520942896604538e-05, 1.57821923494339e-05, 1.6354955732822418e-05, 1.6927719116210938e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 7.0, 9.0, 20.0, 31.0, 38.0, 61.0, 99.0, 118.0, 187.0, 260.0, 380.0, 624.0, 972.0, 1681.0, 3217.0, 7231.0, 19961.0, 65391.0, 281705.0, 486937.0, 123669.0, 34034.0, 11458.0, 4634.0, 2278.0, 1223.0, 767.0, 522.0, 320.0, 227.0, 131.0, 103.0, 74.0, 54.0, 29.0, 28.0, 22.0, 15.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14013671875, -0.13550186157226562, -0.13086700439453125, -0.12623214721679688, -0.1215972900390625, -0.11696243286132812, -0.11232757568359375, -0.10769271850585938, -0.103057861328125, -0.09842300415039062, -0.09378814697265625, -0.08915328979492188, -0.0845184326171875, -0.07988357543945312, -0.07524871826171875, -0.07061386108398438, -0.06597900390625, -0.061344146728515625, -0.05670928955078125, -0.052074432373046875, -0.0474395751953125, -0.042804718017578125, -0.03816986083984375, -0.033535003662109375, -0.028900146484375, -0.024265289306640625, -0.01963043212890625, -0.014995574951171875, -0.0103607177734375, -0.005725860595703125, -0.00109100341796875, 0.003543853759765625, 0.0081787109375, 0.012813568115234375, 0.01744842529296875, 0.022083282470703125, 0.0267181396484375, 0.031352996826171875, 0.03598785400390625, 0.040622711181640625, 0.045257568359375, 0.049892425537109375, 0.05452728271484375, 0.059162139892578125, 0.0637969970703125, 0.06843185424804688, 0.07306671142578125, 0.07770156860351562, 0.08233642578125, 0.08697128295898438, 0.09160614013671875, 0.09624099731445312, 0.1008758544921875, 0.10551071166992188, 0.11014556884765625, 0.11478042602539062, 0.119415283203125, 0.12405014038085938, 0.12868499755859375, 0.13331985473632812, 0.1379547119140625, 0.14258956909179688, 0.14722442626953125, 0.15185928344726562, 0.156494140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 10.0, 12.0, 18.0, 17.0, 21.0, 36.0, 68.0, 113.0, 137.0, 148.0, 131.0, 83.0, 57.0, 38.0, 27.0, 16.0, 13.0, 6.0, 10.0, 6.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.16699790954589844, -0.16212081909179688, -0.1572437286376953, -0.15236663818359375, -0.1474895477294922, -0.14261245727539062, -0.13773536682128906, -0.1328582763671875, -0.12798118591308594, -0.12310409545898438, -0.11822700500488281, -0.11334991455078125, -0.10847282409667969, -0.10359573364257812, -0.09871864318847656, -0.093841552734375, -0.08896446228027344, -0.08408737182617188, -0.07921028137207031, -0.07433319091796875, -0.06945610046386719, -0.06457901000976562, -0.05970191955566406, -0.0548248291015625, -0.04994773864746094, -0.045070648193359375, -0.04019355773925781, -0.03531646728515625, -0.030439376831054688, -0.025562286376953125, -0.020685195922851562, -0.01580810546875, -0.010931015014648438, -0.006053924560546875, -0.0011768341064453125, 0.00370025634765625, 0.008577346801757812, 0.013454437255859375, 0.018331527709960938, 0.0232086181640625, 0.028085708618164062, 0.032962799072265625, 0.03783988952636719, 0.04271697998046875, 0.04759407043457031, 0.052471160888671875, 0.05734825134277344, 0.062225341796875, 0.06710243225097656, 0.07197952270507812, 0.07685661315917969, 0.08173370361328125, 0.08661079406738281, 0.09148788452148438, 0.09636497497558594, 0.1012420654296875, 0.10611915588378906, 0.11099624633789062, 0.11587333679199219, 0.12075042724609375, 0.1256275177001953, 0.13050460815429688, 0.13538169860839844, 0.1402587890625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 10.0, 16.0, 35.0, 115.0, 228.0, 266.0, 201.0, 91.0, 36.0, 11.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0012428760528564, -0.9278908371925354, -0.8545387983322144, -0.7811867594718933, -0.7078347206115723, -0.6344826817512512, -0.5611306428909302, -0.48777860403060913, -0.4144265651702881, -0.34107452630996704, -0.267722487449646, -0.19437044858932495, -0.1210184097290039, -0.04766637086868286, 0.025685667991638184, 0.09903770685195923, 0.17238974571228027, 0.24574178457260132, 0.31909382343292236, 0.3924458622932434, 0.46579790115356445, 0.5391499400138855, 0.6125019788742065, 0.6858540177345276, 0.7592060565948486, 0.8325580954551697, 0.9059101343154907, 0.9792621731758118, 1.0526142120361328, 1.1259663105010986, 1.199318289756775, 1.2726702690124512, 1.346022367477417, 1.4193744659423828, 1.492726445198059, 1.5660784244537354, 1.6394305229187012, 1.712782621383667, 1.7861346006393433, 1.8594865798950195, 1.9328386783599854, 2.006190776824951, 2.079542636871338, 2.1528947353363037, 2.2262468338012695, 2.2995989322662354, 2.372951030731201, 2.446302890777588, 2.5196549892425537, 2.5930070877075195, 2.6663589477539062, 2.739711046218872, 2.813063144683838, 2.8864152431488037, 2.9597673416137695, 3.0331192016601562, 3.106471300125122, 3.179823398590088, 3.2531752586364746, 3.3265273571014404, 3.3998794555664062, 3.473231554031372, 3.546583652496338, 3.6199355125427246, 3.6932876110076904]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 12.0, 12.0, 11.0, 20.0, 15.0, 24.0, 34.0, 31.0, 30.0, 27.0, 31.0, 45.0, 44.0, 54.0, 55.0, 52.0, 48.0, 60.0, 40.0, 37.0, 43.0, 33.0, 44.0, 31.0, 25.0, 22.0, 17.0, 19.0, 18.0, 15.0, 7.0, 9.0, 6.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.7667695879936218, -0.7454947829246521, -0.7242200374603271, -0.7029452323913574, -0.6816704869270325, -0.6603956818580627, -0.6391209363937378, -0.6178461313247681, -0.5965713262557983, -0.5752965211868286, -0.5540217757225037, -0.5327469706535339, -0.511472225189209, -0.49019742012023926, -0.4689226448535919, -0.4476478695869446, -0.42637309432029724, -0.4050983190536499, -0.38382354378700256, -0.3625487685203552, -0.3412739634513855, -0.31999918818473816, -0.2987244129180908, -0.2774496078491211, -0.25617486238479614, -0.2349000871181488, -0.21362529695034027, -0.19235052168369293, -0.1710757315158844, -0.14980095624923706, -0.12852618098258972, -0.10725139081478119, -0.08597660064697266, -0.06470181792974472, -0.04342703893780708, -0.022152259945869446, -0.00087747722864151, 0.020397305488586426, 0.041672080755233765, 0.0629468709230423, 0.08422164618968964, 0.10549642890691757, 0.1267712116241455, 0.14804598689079285, 0.16932076215744019, 0.19059555232524872, 0.21187032759189606, 0.2331451177597046, 0.25441989302635193, 0.27569466829299927, 0.2969694435596466, 0.31824421882629395, 0.33951902389526367, 0.360793799161911, 0.38206857442855835, 0.4033433794975281, 0.424618124961853, 0.44589290022850037, 0.4671676754951477, 0.48844248056411743, 0.5097172260284424, 0.5309920310974121, 0.5522668361663818, 0.5735415816307068, 0.5948163866996765]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 1.0, 12.0, 24.0, 45.0, 51.0, 127.0, 208.0, 376.0, 729.0, 1641.0, 3868.0, 10735.0, 39055.0, 222414.0, 2646245.0, 1133116.0, 101522.0, 21450.0, 6666.0, 2760.0, 1281.0, 686.0, 427.0, 268.0, 185.0, 97.0, 97.0, 39.0, 40.0, 24.0, 22.0, 20.0, 11.0, 6.0, 7.0, 5.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.14850997924804688, -0.14101409912109375, -0.13351821899414062, -0.1260223388671875, -0.11852645874023438, -0.11103057861328125, -0.10353469848632812, -0.096038818359375, -0.08854293823242188, -0.08104705810546875, -0.07355117797851562, -0.0660552978515625, -0.058559417724609375, -0.05106353759765625, -0.043567657470703125, -0.03607177734375, -0.028575897216796875, -0.02108001708984375, -0.013584136962890625, -0.0060882568359375, 0.001407623291015625, 0.00890350341796875, 0.016399383544921875, 0.023895263671875, 0.031391143798828125, 0.03888702392578125, 0.046382904052734375, 0.0538787841796875, 0.061374664306640625, 0.06887054443359375, 0.07636642456054688, 0.0838623046875, 0.09135818481445312, 0.09885406494140625, 0.10634994506835938, 0.1138458251953125, 0.12134170532226562, 0.12883758544921875, 0.13633346557617188, 0.143829345703125, 0.15132522583007812, 0.15882110595703125, 0.16631698608398438, 0.1738128662109375, 0.18130874633789062, 0.18880462646484375, 0.19630050659179688, 0.20379638671875, 0.21129226684570312, 0.21878814697265625, 0.22628402709960938, 0.2337799072265625, 0.24127578735351562, 0.24877166748046875, 0.2562675476074219, 0.263763427734375, 0.2712593078613281, 0.27875518798828125, 0.2862510681152344, 0.2937469482421875, 0.3012428283691406, 0.30873870849609375, 0.3162345886230469, 0.32373046875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 13.0, 14.0, 21.0, 32.0, 48.0, 67.0, 84.0, 96.0, 117.0, 113.0, 105.0, 83.0, 58.0, 61.0, 36.0, 20.0, 15.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0888671875, -0.0839691162109375, -0.079071044921875, -0.0741729736328125, -0.06927490234375, -0.0643768310546875, -0.059478759765625, -0.0545806884765625, -0.0496826171875, -0.0447845458984375, -0.039886474609375, -0.0349884033203125, -0.03009033203125, -0.0251922607421875, -0.020294189453125, -0.0153961181640625, -0.010498046875, -0.0055999755859375, -0.000701904296875, 0.0041961669921875, 0.00909423828125, 0.0139923095703125, 0.018890380859375, 0.0237884521484375, 0.0286865234375, 0.0335845947265625, 0.038482666015625, 0.0433807373046875, 0.04827880859375, 0.0531768798828125, 0.058074951171875, 0.0629730224609375, 0.06787109375, 0.0727691650390625, 0.077667236328125, 0.0825653076171875, 0.08746337890625, 0.0923614501953125, 0.097259521484375, 0.1021575927734375, 0.1070556640625, 0.1119537353515625, 0.116851806640625, 0.1217498779296875, 0.12664794921875, 0.1315460205078125, 0.136444091796875, 0.1413421630859375, 0.146240234375, 0.1511383056640625, 0.156036376953125, 0.1609344482421875, 0.16583251953125, 0.1707305908203125, 0.175628662109375, 0.1805267333984375, 0.1854248046875, 0.1903228759765625, 0.195220947265625, 0.2001190185546875, 0.20501708984375, 0.2099151611328125, 0.214813232421875, 0.2197113037109375, 0.224609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 1.0, 7.0, 1.0, 3.0, 5.0, 8.0, 6.0, 5.0, 22.0, 15.0, 27.0, 39.0, 63.0, 77.0, 118.0, 158.0, 234.0, 407.0, 645.0, 1318.0, 2704.0, 6310.0, 17226.0, 59667.0, 284307.0, 1894939.0, 1605942.0, 240574.0, 52920.0, 15308.0, 5845.0, 2434.0, 1181.0, 655.0, 349.0, 235.0, 166.0, 95.0, 66.0, 48.0, 47.0, 29.0, 13.0, 17.0, 8.0, 7.0, 13.0, 10.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19504547119140625, -0.1883087158203125, -0.18157196044921875, -0.174835205078125, -0.16809844970703125, -0.1613616943359375, -0.15462493896484375, -0.14788818359375, -0.14115142822265625, -0.1344146728515625, -0.12767791748046875, -0.120941162109375, -0.11420440673828125, -0.1074676513671875, -0.10073089599609375, -0.093994140625, -0.08725738525390625, -0.0805206298828125, -0.07378387451171875, -0.067047119140625, -0.06031036376953125, -0.0535736083984375, -0.04683685302734375, -0.04010009765625, -0.03336334228515625, -0.0266265869140625, -0.01988983154296875, -0.013153076171875, -0.00641632080078125, 0.0003204345703125, 0.00705718994140625, 0.0137939453125, 0.02053070068359375, 0.0272674560546875, 0.03400421142578125, 0.040740966796875, 0.04747772216796875, 0.0542144775390625, 0.06095123291015625, 0.06768798828125, 0.07442474365234375, 0.0811614990234375, 0.08789825439453125, 0.094635009765625, 0.10137176513671875, 0.1081085205078125, 0.11484527587890625, 0.12158203125, 0.12831878662109375, 0.1350555419921875, 0.14179229736328125, 0.148529052734375, 0.15526580810546875, 0.1620025634765625, 0.16873931884765625, 0.17547607421875, 0.18221282958984375, 0.1889495849609375, 0.19568634033203125, 0.202423095703125, 0.20915985107421875, 0.2158966064453125, 0.22263336181640625, 0.2293701171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 5.0, 6.0, 23.0, 11.0, 22.0, 17.0, 42.0, 39.0, 62.0, 84.0, 126.0, 188.0, 277.0, 380.0, 522.0, 622.0, 473.0, 344.0, 253.0, 157.0, 126.0, 84.0, 57.0, 39.0, 24.0, 21.0, 20.0, 19.0, 6.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.170166015625, -0.165069580078125, -0.15997314453125, -0.154876708984375, -0.1497802734375, -0.144683837890625, -0.13958740234375, -0.134490966796875, -0.12939453125, -0.124298095703125, -0.11920166015625, -0.114105224609375, -0.1090087890625, -0.103912353515625, -0.09881591796875, -0.093719482421875, -0.088623046875, -0.083526611328125, -0.07843017578125, -0.073333740234375, -0.0682373046875, -0.063140869140625, -0.05804443359375, -0.052947998046875, -0.0478515625, -0.042755126953125, -0.03765869140625, -0.032562255859375, -0.0274658203125, -0.022369384765625, -0.01727294921875, -0.012176513671875, -0.007080078125, -0.001983642578125, 0.00311279296875, 0.008209228515625, 0.0133056640625, 0.018402099609375, 0.02349853515625, 0.028594970703125, 0.03369140625, 0.038787841796875, 0.04388427734375, 0.048980712890625, 0.0540771484375, 0.059173583984375, 0.06427001953125, 0.069366455078125, 0.074462890625, 0.079559326171875, 0.08465576171875, 0.089752197265625, 0.0948486328125, 0.099945068359375, 0.10504150390625, 0.110137939453125, 0.115234375, 0.120330810546875, 0.12542724609375, 0.130523681640625, 0.1356201171875, 0.140716552734375, 0.14581298828125, 0.150909423828125, 0.156005859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 8.0, 10.0, 12.0, 25.0, 31.0, 59.0, 85.0, 89.0, 92.0, 127.0, 99.0, 95.0, 83.0, 60.0, 38.0, 32.0, 17.0, 12.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.477787733078003, -1.4458448886871338, -1.413901925086975, -1.3819589614868164, -1.3500161170959473, -1.3180732727050781, -1.2861303091049194, -1.2541873455047607, -1.2222445011138916, -1.1903016567230225, -1.1583586931228638, -1.126415729522705, -1.094472885131836, -1.0625300407409668, -1.030587077140808, -0.9986441731452942, -0.9667012691497803, -0.9347583651542664, -0.9028154611587524, -0.8708725571632385, -0.8389296531677246, -0.8069867491722107, -0.7750438451766968, -0.7431009411811829, -0.711158037185669, -0.679215133190155, -0.6472722291946411, -0.6153293251991272, -0.5833864212036133, -0.5514435172080994, -0.5195006132125854, -0.48755770921707153, -0.4556148052215576, -0.4236719012260437, -0.3917289972305298, -0.35978609323501587, -0.32784318923950195, -0.29590028524398804, -0.2639573812484741, -0.2320144772529602, -0.2000715732574463, -0.16812866926193237, -0.13618576526641846, -0.10424286127090454, -0.07229995727539062, -0.04035705327987671, -0.008414149284362793, 0.023528754711151123, 0.05547165870666504, 0.08741456270217896, 0.11935746669769287, 0.1513003706932068, 0.1832432746887207, 0.21518617868423462, 0.24712908267974854, 0.27907198667526245, 0.31101489067077637, 0.3429577946662903, 0.3749006986618042, 0.4068436026573181, 0.43878650665283203, 0.47072941064834595, 0.5026723146438599, 0.5346152186393738, 0.5665581226348877]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 7.0, 13.0, 19.0, 12.0, 18.0, 26.0, 30.0, 22.0, 34.0, 36.0, 33.0, 47.0, 40.0, 40.0, 53.0, 49.0, 63.0, 47.0, 47.0, 39.0, 36.0, 39.0, 35.0, 26.0, 36.0, 23.0, 34.0, 17.0, 8.0, 14.0, 15.0, 5.0, 3.0, 5.0, 5.0, 2.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6266806721687317, -0.6093015074729919, -0.5919223427772522, -0.5745431780815125, -0.5571639537811279, -0.5397847890853882, -0.5224056243896484, -0.5050264596939087, -0.48764729499816895, -0.4702681303024292, -0.45288896560668945, -0.4355097711086273, -0.4181306064128876, -0.4007514417171478, -0.3833722472190857, -0.36599308252334595, -0.3486139178276062, -0.33123475313186646, -0.3138555884361267, -0.2964763939380646, -0.27909722924232483, -0.2617180645465851, -0.24433888494968414, -0.2269597053527832, -0.20958054065704346, -0.1922013759613037, -0.17482219636440277, -0.15744301676750183, -0.14006385207176208, -0.12268467992544174, -0.1053055077791214, -0.08792633563280106, -0.07054710388183594, -0.053167931735515594, -0.03578875958919525, -0.01840958744287491, -0.0010304152965545654, 0.016348756849765778, 0.03372792899608612, 0.051107101142406464, 0.0684862732887268, 0.08586544543504715, 0.10324461758136749, 0.12062378972768784, 0.13800296187400818, 0.15538212656974792, 0.17276130616664886, 0.1901404857635498, 0.20751965045928955, 0.2248988151550293, 0.24227799475193024, 0.2596571743488312, 0.2770363390445709, 0.29441550374031067, 0.3117946982383728, 0.32917386293411255, 0.3465530276298523, 0.36393219232559204, 0.3813113570213318, 0.3986905515193939, 0.41606971621513367, 0.4334488809108734, 0.45082807540893555, 0.4682072401046753, 0.48558640480041504]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 6.0, 15.0, 16.0, 20.0, 36.0, 46.0, 67.0, 93.0, 151.0, 194.0, 317.0, 535.0, 1015.0, 2273.0, 5937.0, 16227.0, 48374.0, 152245.0, 395893.0, 286074.0, 91508.0, 29600.0, 10419.0, 3914.0, 1627.0, 728.0, 420.0, 253.0, 173.0, 95.0, 91.0, 57.0, 37.0, 26.0, 25.0, 13.0, 8.0, 3.0, 4.0, 5.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.39990234375, -0.38840484619140625, -0.3769073486328125, -0.36540985107421875, -0.353912353515625, -0.34241485595703125, -0.3309173583984375, -0.31941986083984375, -0.30792236328125, -0.29642486572265625, -0.2849273681640625, -0.27342987060546875, -0.261932373046875, -0.25043487548828125, -0.2389373779296875, -0.22743988037109375, -0.2159423828125, -0.20444488525390625, -0.1929473876953125, -0.18144989013671875, -0.169952392578125, -0.15845489501953125, -0.1469573974609375, -0.13545989990234375, -0.12396240234375, -0.11246490478515625, -0.1009674072265625, -0.08946990966796875, -0.077972412109375, -0.06647491455078125, -0.0549774169921875, -0.04347991943359375, -0.031982421875, -0.02048492431640625, -0.0089874267578125, 0.00251007080078125, 0.014007568359375, 0.02550506591796875, 0.0370025634765625, 0.04850006103515625, 0.05999755859375, 0.07149505615234375, 0.0829925537109375, 0.09449005126953125, 0.105987548828125, 0.11748504638671875, 0.1289825439453125, 0.14048004150390625, 0.1519775390625, 0.16347503662109375, 0.1749725341796875, 0.18647003173828125, 0.197967529296875, 0.20946502685546875, 0.2209625244140625, 0.23246002197265625, 0.24395751953125, 0.25545501708984375, 0.2669525146484375, 0.27845001220703125, 0.289947509765625, 0.30144500732421875, 0.3129425048828125, 0.32444000244140625, 0.3359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 17.0, 10.0, 20.0, 26.0, 39.0, 62.0, 77.0, 99.0, 98.0, 116.0, 93.0, 97.0, 68.0, 59.0, 47.0, 23.0, 25.0, 12.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07525634765625, -0.07040882110595703, -0.06556129455566406, -0.060713768005371094, -0.055866241455078125, -0.051018714904785156, -0.04617118835449219, -0.04132366180419922, -0.03647613525390625, -0.03162860870361328, -0.026781082153320312, -0.021933555603027344, -0.017086029052734375, -0.012238502502441406, -0.0073909759521484375, -0.0025434494018554688, 0.0023040771484375, 0.007151603698730469, 0.011999130249023438, 0.016846656799316406, 0.021694183349609375, 0.026541709899902344, 0.03138923645019531, 0.03623676300048828, 0.04108428955078125, 0.04593181610107422, 0.05077934265136719, 0.055626869201660156, 0.060474395751953125, 0.0653219223022461, 0.07016944885253906, 0.07501697540283203, 0.079864501953125, 0.08471202850341797, 0.08955955505371094, 0.0944070816040039, 0.09925460815429688, 0.10410213470458984, 0.10894966125488281, 0.11379718780517578, 0.11864471435546875, 0.12349224090576172, 0.1283397674560547, 0.13318729400634766, 0.13803482055664062, 0.1428823471069336, 0.14772987365722656, 0.15257740020751953, 0.1574249267578125, 0.16227245330810547, 0.16711997985839844, 0.1719675064086914, 0.17681503295898438, 0.18166255950927734, 0.1865100860595703, 0.19135761260986328, 0.19620513916015625, 0.20105266571044922, 0.2059001922607422, 0.21074771881103516, 0.21559524536132812, 0.2204427719116211, 0.22529029846191406, 0.23013782501220703, 0.2349853515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 8.0, 12.0, 32.0, 24.0, 64.0, 90.0, 144.0, 248.0, 417.0, 717.0, 1389.0, 2618.0, 4926.0, 10170.0, 20516.0, 44229.0, 102651.0, 230448.0, 306853.0, 179604.0, 76974.0, 33758.0, 15916.0, 7995.0, 4059.0, 2088.0, 1101.0, 611.0, 350.0, 200.0, 112.0, 75.0, 53.0, 43.0, 29.0, 6.0, 7.0, 9.0, 1.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1766357421875, -0.16872596740722656, -0.16081619262695312, -0.1529064178466797, -0.14499664306640625, -0.1370868682861328, -0.12917709350585938, -0.12126731872558594, -0.1133575439453125, -0.10544776916503906, -0.09753799438476562, -0.08962821960449219, -0.08171844482421875, -0.07380867004394531, -0.06589889526367188, -0.05798912048339844, -0.050079345703125, -0.04216957092285156, -0.034259796142578125, -0.026350021362304688, -0.01844024658203125, -0.010530471801757812, -0.002620697021484375, 0.0052890777587890625, 0.0131988525390625, 0.021108627319335938, 0.029018402099609375, 0.03692817687988281, 0.04483795166015625, 0.05274772644042969, 0.060657501220703125, 0.06856727600097656, 0.07647705078125, 0.08438682556152344, 0.09229660034179688, 0.10020637512207031, 0.10811614990234375, 0.11602592468261719, 0.12393569946289062, 0.13184547424316406, 0.1397552490234375, 0.14766502380371094, 0.15557479858398438, 0.1634845733642578, 0.17139434814453125, 0.1793041229248047, 0.18721389770507812, 0.19512367248535156, 0.203033447265625, 0.21094322204589844, 0.21885299682617188, 0.2267627716064453, 0.23467254638671875, 0.2425823211669922, 0.2504920959472656, 0.25840187072753906, 0.2663116455078125, 0.27422142028808594, 0.2821311950683594, 0.2900409698486328, 0.29795074462890625, 0.3058605194091797, 0.3137702941894531, 0.32168006896972656, 0.32958984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 7.0, 6.0, 5.0, 11.0, 16.0, 14.0, 14.0, 21.0, 18.0, 22.0, 21.0, 31.0, 39.0, 33.0, 45.0, 58.0, 52.0, 34.0, 44.0, 36.0, 56.0, 49.0, 47.0, 44.0, 37.0, 31.0, 34.0, 30.0, 19.0, 27.0, 25.0, 19.0, 13.0, 5.0, 7.0, 5.0, 3.0, 10.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.272705078125, -0.2643585205078125, -0.256011962890625, -0.2476654052734375, -0.23931884765625, -0.2309722900390625, -0.222625732421875, -0.2142791748046875, -0.2059326171875, -0.1975860595703125, -0.189239501953125, -0.1808929443359375, -0.17254638671875, -0.1641998291015625, -0.155853271484375, -0.1475067138671875, -0.13916015625, -0.1308135986328125, -0.122467041015625, -0.1141204833984375, -0.10577392578125, -0.0974273681640625, -0.089080810546875, -0.0807342529296875, -0.0723876953125, -0.0640411376953125, -0.055694580078125, -0.0473480224609375, -0.03900146484375, -0.0306549072265625, -0.022308349609375, -0.0139617919921875, -0.005615234375, 0.0027313232421875, 0.011077880859375, 0.0194244384765625, 0.02777099609375, 0.0361175537109375, 0.044464111328125, 0.0528106689453125, 0.0611572265625, 0.0695037841796875, 0.077850341796875, 0.0861968994140625, 0.09454345703125, 0.1028900146484375, 0.111236572265625, 0.1195831298828125, 0.1279296875, 0.1362762451171875, 0.144622802734375, 0.1529693603515625, 0.16131591796875, 0.1696624755859375, 0.178009033203125, 0.1863555908203125, 0.1947021484375, 0.2030487060546875, 0.211395263671875, 0.2197418212890625, 0.22808837890625, 0.2364349365234375, 0.244781494140625, 0.2531280517578125, 0.261474609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 18.0, 27.0, 33.0, 52.0, 76.0, 125.0, 186.0, 281.0, 427.0, 714.0, 1205.0, 2161.0, 3797.0, 7985.0, 16835.0, 37662.0, 92408.0, 235600.0, 346722.0, 176920.0, 69284.0, 28971.0, 12998.0, 6289.0, 3279.0, 1731.0, 1065.0, 594.0, 390.0, 249.0, 165.0, 96.0, 65.0, 40.0, 25.0, 28.0, 9.0, 5.0, 12.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.1491374969482422, -0.14422225952148438, -0.13930702209472656, -0.13439178466796875, -0.12947654724121094, -0.12456130981445312, -0.11964607238769531, -0.1147308349609375, -0.10981559753417969, -0.10490036010742188, -0.09998512268066406, -0.09506988525390625, -0.09015464782714844, -0.08523941040039062, -0.08032417297363281, -0.075408935546875, -0.07049369812011719, -0.06557846069335938, -0.06066322326660156, -0.05574798583984375, -0.05083274841308594, -0.045917510986328125, -0.04100227355957031, -0.0360870361328125, -0.031171798706054688, -0.026256561279296875, -0.021341323852539062, -0.01642608642578125, -0.011510848999023438, -0.006595611572265625, -0.0016803741455078125, 0.00323486328125, 0.008150100708007812, 0.013065338134765625, 0.017980575561523438, 0.02289581298828125, 0.027811050415039062, 0.032726287841796875, 0.03764152526855469, 0.0425567626953125, 0.04747200012207031, 0.052387237548828125, 0.05730247497558594, 0.06221771240234375, 0.06713294982910156, 0.07204818725585938, 0.07696342468261719, 0.081878662109375, 0.08679389953613281, 0.09170913696289062, 0.09662437438964844, 0.10153961181640625, 0.10645484924316406, 0.11137008666992188, 0.11628532409667969, 0.1212005615234375, 0.1261157989501953, 0.13103103637695312, 0.13594627380371094, 0.14086151123046875, 0.14577674865722656, 0.15069198608398438, 0.1556072235107422, 0.1605224609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 5.0, 8.0, 6.0, 16.0, 16.0, 28.0, 33.0, 33.0, 51.0, 66.0, 121.0, 120.0, 113.0, 84.0, 80.0, 48.0, 39.0, 26.0, 25.0, 17.0, 15.0, 12.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1113624572753906e-05, -2.995505928993225e-05, -2.8796494007110596e-05, -2.763792872428894e-05, -2.6479363441467285e-05, -2.532079815864563e-05, -2.4162232875823975e-05, -2.300366759300232e-05, -2.1845102310180664e-05, -2.068653702735901e-05, -1.9527971744537354e-05, -1.8369406461715698e-05, -1.7210841178894043e-05, -1.6052275896072388e-05, -1.4893710613250732e-05, -1.3735145330429077e-05, -1.2576580047607422e-05, -1.1418014764785767e-05, -1.0259449481964111e-05, -9.100884199142456e-06, -7.9423189163208e-06, -6.7837536334991455e-06, -5.62518835067749e-06, -4.466623067855835e-06, -3.3080577850341797e-06, -2.1494925022125244e-06, -9.909272193908691e-07, 1.6763806343078613e-07, 1.3262033462524414e-06, 2.4847686290740967e-06, 3.643333911895752e-06, 4.801899194717407e-06, 5.9604644775390625e-06, 7.119029760360718e-06, 8.277595043182373e-06, 9.436160326004028e-06, 1.0594725608825684e-05, 1.1753290891647339e-05, 1.2911856174468994e-05, 1.407042145729065e-05, 1.5228986740112305e-05, 1.638755202293396e-05, 1.7546117305755615e-05, 1.870468258857727e-05, 1.9863247871398926e-05, 2.102181315422058e-05, 2.2180378437042236e-05, 2.333894371986389e-05, 2.4497509002685547e-05, 2.5656074285507202e-05, 2.6814639568328857e-05, 2.7973204851150513e-05, 2.9131770133972168e-05, 3.0290335416793823e-05, 3.144890069961548e-05, 3.2607465982437134e-05, 3.376603126525879e-05, 3.4924596548080444e-05, 3.60831618309021e-05, 3.7241727113723755e-05, 3.840029239654541e-05, 3.9558857679367065e-05, 4.071742296218872e-05, 4.1875988245010376e-05, 4.303455352783203e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 20.0, 18.0, 33.0, 36.0, 31.0, 89.0, 132.0, 207.0, 326.0, 552.0, 858.0, 1526.0, 2687.0, 4900.0, 9296.0, 18876.0, 41554.0, 99459.0, 246506.0, 335824.0, 162573.0, 65379.0, 28522.0, 13536.0, 6911.0, 3579.0, 2033.0, 1116.0, 775.0, 412.0, 272.0, 167.0, 113.0, 85.0, 45.0, 25.0, 20.0, 18.0, 13.0, 4.0, 5.0, 6.0, 1.0, 4.0], "bins": [-0.1884765625, -0.18367671966552734, -0.1788768768310547, -0.17407703399658203, -0.16927719116210938, -0.16447734832763672, -0.15967750549316406, -0.1548776626586914, -0.15007781982421875, -0.1452779769897461, -0.14047813415527344, -0.13567829132080078, -0.13087844848632812, -0.12607860565185547, -0.12127876281738281, -0.11647891998291016, -0.1116790771484375, -0.10687923431396484, -0.10207939147949219, -0.09727954864501953, -0.09247970581054688, -0.08767986297607422, -0.08288002014160156, -0.0780801773071289, -0.07328033447265625, -0.0684804916381836, -0.06368064880371094, -0.05888080596923828, -0.054080963134765625, -0.04928112030029297, -0.04448127746582031, -0.039681434631347656, -0.034881591796875, -0.030081748962402344, -0.025281906127929688, -0.02048206329345703, -0.015682220458984375, -0.010882377624511719, -0.0060825347900390625, -0.0012826919555664062, 0.00351715087890625, 0.008316993713378906, 0.013116836547851562, 0.01791667938232422, 0.022716522216796875, 0.02751636505126953, 0.03231620788574219, 0.037116050720214844, 0.0419158935546875, 0.046715736389160156, 0.05151557922363281, 0.05631542205810547, 0.061115264892578125, 0.06591510772705078, 0.07071495056152344, 0.0755147933959961, 0.08031463623046875, 0.0851144790649414, 0.08991432189941406, 0.09471416473388672, 0.09951400756835938, 0.10431385040283203, 0.10911369323730469, 0.11391353607177734, 0.11871337890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 3.0, 3.0, 5.0, 7.0, 14.0, 15.0, 18.0, 22.0, 23.0, 32.0, 29.0, 32.0, 61.0, 55.0, 60.0, 59.0, 81.0, 79.0, 60.0, 63.0, 43.0, 44.0, 35.0, 38.0, 17.0, 14.0, 21.0, 17.0, 8.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.1434326171875, -0.13944625854492188, -0.13545989990234375, -0.13147354125976562, -0.1274871826171875, -0.12350082397460938, -0.11951446533203125, -0.11552810668945312, -0.111541748046875, -0.10755538940429688, -0.10356903076171875, -0.09958267211914062, -0.0955963134765625, -0.09160995483398438, -0.08762359619140625, -0.08363723754882812, -0.07965087890625, -0.07566452026367188, -0.07167816162109375, -0.06769180297851562, -0.0637054443359375, -0.059719085693359375, -0.05573272705078125, -0.051746368408203125, -0.047760009765625, -0.043773651123046875, -0.03978729248046875, -0.035800933837890625, -0.0318145751953125, -0.027828216552734375, -0.02384185791015625, -0.019855499267578125, -0.015869140625, -0.011882781982421875, -0.00789642333984375, -0.003910064697265625, 7.62939453125e-05, 0.004062652587890625, 0.00804901123046875, 0.012035369873046875, 0.016021728515625, 0.020008087158203125, 0.02399444580078125, 0.027980804443359375, 0.0319671630859375, 0.035953521728515625, 0.03993988037109375, 0.043926239013671875, 0.04791259765625, 0.051898956298828125, 0.05588531494140625, 0.059871673583984375, 0.0638580322265625, 0.06784439086914062, 0.07183074951171875, 0.07581710815429688, 0.079803466796875, 0.08378982543945312, 0.08777618408203125, 0.09176254272460938, 0.0957489013671875, 0.09973526000976562, 0.10372161865234375, 0.10770797729492188, 0.1116943359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 13.0, 23.0, 40.0, 61.0, 95.0, 109.0, 140.0, 127.0, 114.0, 95.0, 76.0, 57.0, 21.0, 18.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.9995193481445312, -2.9411139488220215, -2.8827085494995117, -2.824303150177002, -2.765897750854492, -2.7074923515319824, -2.6490869522094727, -2.590681552886963, -2.532276153564453, -2.4738707542419434, -2.4154653549194336, -2.357059955596924, -2.298654556274414, -2.2402491569519043, -2.1818437576293945, -2.1234383583068848, -2.065032958984375, -2.0066275596618652, -1.9482221603393555, -1.8898167610168457, -1.831411361694336, -1.7730059623718262, -1.7146005630493164, -1.6561951637268066, -1.597790002822876, -1.5393846035003662, -1.4809792041778564, -1.4225738048553467, -1.364168405532837, -1.3057630062103271, -1.2473576068878174, -1.1889522075653076, -1.1305468082427979, -1.072141408920288, -1.0137360095977783, -0.9553306102752686, -0.8969252109527588, -0.838519811630249, -0.780114471912384, -0.7217090725898743, -0.6633037328720093, -0.6048983335494995, -0.5464929342269897, -0.48808756470680237, -0.4296821653842926, -0.37127676606178284, -0.31287139654159546, -0.2544659972190857, -0.19606059789657593, -0.13765519857406616, -0.07924981415271759, -0.02084442973136902, 0.03756096959114075, 0.09596636891365051, 0.1543717384338379, 0.21277713775634766, 0.2711825370788574, 0.3295879364013672, 0.38799333572387695, 0.44639870524406433, 0.5048041343688965, 0.5632095336914062, 0.6216148734092712, 0.680020272731781, 0.7384256720542908]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 11.0, 7.0, 10.0, 19.0, 11.0, 15.0, 30.0, 24.0, 34.0, 36.0, 34.0, 36.0, 34.0, 37.0, 37.0, 41.0, 41.0, 49.0, 46.0, 50.0, 44.0, 27.0, 36.0, 31.0, 31.0, 26.0, 25.0, 24.0, 19.0, 25.0, 13.0, 9.0, 12.0, 14.0, 9.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.6818969249725342, -0.6597164869308472, -0.6375360488891602, -0.6153556108474731, -0.5931751728057861, -0.5709947943687439, -0.5488143563270569, -0.5266339182853699, -0.5044534802436829, -0.48227304220199585, -0.46009260416030884, -0.4379121959209442, -0.4157317578792572, -0.3935513198375702, -0.37137091159820557, -0.34919047355651855, -0.32701003551483154, -0.30482959747314453, -0.2826491594314575, -0.2604687511920929, -0.23828831315040588, -0.21610787510871887, -0.19392745196819305, -0.17174702882766724, -0.14956659078598022, -0.1273861527442932, -0.1052057296037674, -0.08302529901266098, -0.060844868421554565, -0.03866443783044815, -0.016484007239341736, 0.005696415901184082, 0.02787691354751587, 0.050057344138622284, 0.0722377747297287, 0.09441820532083511, 0.11659863591194153, 0.13877907395362854, 0.16095949709415436, 0.18313992023468018, 0.2053203582763672, 0.2275007963180542, 0.24968121945858002, 0.27186164259910583, 0.29404208064079285, 0.31622251868247986, 0.3384029269218445, 0.3605833649635315, 0.3827638030052185, 0.4049442410469055, 0.42712467908859253, 0.44930508732795715, 0.47148552536964417, 0.4936659634113312, 0.5158463716506958, 0.5380268096923828, 0.5602072477340698, 0.5823876857757568, 0.6045681238174438, 0.6267485618591309, 0.6489289999008179, 0.6711093783378601, 0.6932898163795471, 0.7154702544212341, 0.7376506924629211]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 12.0, 16.0, 26.0, 40.0, 60.0, 87.0, 194.0, 350.0, 719.0, 1594.0, 4627.0, 16409.0, 78429.0, 670018.0, 3036253.0, 322869.0, 45578.0, 10587.0, 3465.0, 1366.0, 627.0, 367.0, 217.0, 132.0, 94.0, 44.0, 30.0, 31.0, 14.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.257568359375, -0.24779510498046875, -0.2380218505859375, -0.22824859619140625, -0.218475341796875, -0.20870208740234375, -0.1989288330078125, -0.18915557861328125, -0.17938232421875, -0.16960906982421875, -0.1598358154296875, -0.15006256103515625, -0.140289306640625, -0.13051605224609375, -0.1207427978515625, -0.11096954345703125, -0.1011962890625, -0.09142303466796875, -0.0816497802734375, -0.07187652587890625, -0.062103271484375, -0.05233001708984375, -0.0425567626953125, -0.03278350830078125, -0.02301025390625, -0.01323699951171875, -0.0034637451171875, 0.00630950927734375, 0.016082763671875, 0.02585601806640625, 0.0356292724609375, 0.04540252685546875, 0.05517578125, 0.06494903564453125, 0.0747222900390625, 0.08449554443359375, 0.094268798828125, 0.10404205322265625, 0.1138153076171875, 0.12358856201171875, 0.13336181640625, 0.14313507080078125, 0.1529083251953125, 0.16268157958984375, 0.172454833984375, 0.18222808837890625, 0.1920013427734375, 0.20177459716796875, 0.2115478515625, 0.22132110595703125, 0.2310943603515625, 0.24086761474609375, 0.250640869140625, 0.26041412353515625, 0.2701873779296875, 0.27996063232421875, 0.28973388671875, 0.29950714111328125, 0.3092803955078125, 0.31905364990234375, 0.328826904296875, 0.33860015869140625, 0.3483734130859375, 0.35814666748046875, 0.367919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 18.0, 15.0, 22.0, 35.0, 43.0, 47.0, 70.0, 65.0, 84.0, 98.0, 95.0, 84.0, 78.0, 57.0, 50.0, 48.0, 34.0, 20.0, 17.0, 12.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08575439453125, -0.08075237274169922, -0.07575035095214844, -0.07074832916259766, -0.06574630737304688, -0.060744285583496094, -0.05574226379394531, -0.05074024200439453, -0.04573822021484375, -0.04073619842529297, -0.03573417663574219, -0.030732154846191406, -0.025730133056640625, -0.020728111267089844, -0.015726089477539062, -0.010724067687988281, -0.0057220458984375, -0.0007200241088867188, 0.0042819976806640625, 0.009284019470214844, 0.014286041259765625, 0.019288063049316406, 0.024290084838867188, 0.02929210662841797, 0.03429412841796875, 0.03929615020751953, 0.04429817199707031, 0.049300193786621094, 0.054302215576171875, 0.059304237365722656, 0.06430625915527344, 0.06930828094482422, 0.074310302734375, 0.07931232452392578, 0.08431434631347656, 0.08931636810302734, 0.09431838989257812, 0.0993204116821289, 0.10432243347167969, 0.10932445526123047, 0.11432647705078125, 0.11932849884033203, 0.12433052062988281, 0.1293325424194336, 0.13433456420898438, 0.13933658599853516, 0.14433860778808594, 0.14934062957763672, 0.1543426513671875, 0.15934467315673828, 0.16434669494628906, 0.16934871673583984, 0.17435073852539062, 0.1793527603149414, 0.1843547821044922, 0.18935680389404297, 0.19435882568359375, 0.19936084747314453, 0.2043628692626953, 0.2093648910522461, 0.21436691284179688, 0.21936893463134766, 0.22437095642089844, 0.22937297821044922, 0.234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 3.0, 9.0, 7.0, 19.0, 17.0, 23.0, 37.0, 48.0, 60.0, 110.0, 174.0, 336.0, 630.0, 1177.0, 2613.0, 6325.0, 18032.0, 63710.0, 323711.0, 2196821.0, 1320594.0, 194261.0, 43315.0, 13095.0, 4892.0, 2039.0, 994.0, 484.0, 279.0, 143.0, 111.0, 68.0, 39.0, 27.0, 26.0, 9.0, 6.0, 13.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33740234375, -0.3271331787109375, -0.316864013671875, -0.3065948486328125, -0.29632568359375, -0.2860565185546875, -0.275787353515625, -0.2655181884765625, -0.2552490234375, -0.2449798583984375, -0.234710693359375, -0.2244415283203125, -0.21417236328125, -0.2039031982421875, -0.193634033203125, -0.1833648681640625, -0.173095703125, -0.1628265380859375, -0.152557373046875, -0.1422882080078125, -0.13201904296875, -0.1217498779296875, -0.111480712890625, -0.1012115478515625, -0.0909423828125, -0.0806732177734375, -0.070404052734375, -0.0601348876953125, -0.04986572265625, -0.0395965576171875, -0.029327392578125, -0.0190582275390625, -0.0087890625, 0.0014801025390625, 0.011749267578125, 0.0220184326171875, 0.03228759765625, 0.0425567626953125, 0.052825927734375, 0.0630950927734375, 0.0733642578125, 0.0836334228515625, 0.093902587890625, 0.1041717529296875, 0.11444091796875, 0.1247100830078125, 0.134979248046875, 0.1452484130859375, 0.155517578125, 0.1657867431640625, 0.176055908203125, 0.1863250732421875, 0.19659423828125, 0.2068634033203125, 0.217132568359375, 0.2274017333984375, 0.2376708984375, 0.2479400634765625, 0.258209228515625, 0.2684783935546875, 0.27874755859375, 0.2890167236328125, 0.299285888671875, 0.3095550537109375, 0.31982421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 13.0, 17.0, 18.0, 30.0, 50.0, 83.0, 109.0, 178.0, 276.0, 484.0, 682.0, 745.0, 482.0, 341.0, 186.0, 120.0, 83.0, 49.0, 30.0, 27.0, 20.0, 9.0, 9.0, 10.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.2869911193847656, -0.27857208251953125, -0.2701530456542969, -0.2617340087890625, -0.2533149719238281, -0.24489593505859375, -0.23647689819335938, -0.228057861328125, -0.21963882446289062, -0.21121978759765625, -0.20280075073242188, -0.1943817138671875, -0.18596267700195312, -0.17754364013671875, -0.16912460327148438, -0.16070556640625, -0.15228652954101562, -0.14386749267578125, -0.13544845581054688, -0.1270294189453125, -0.11861038208007812, -0.11019134521484375, -0.10177230834960938, -0.093353271484375, -0.08493423461914062, -0.07651519775390625, -0.06809616088867188, -0.0596771240234375, -0.051258087158203125, -0.04283905029296875, -0.034420013427734375, -0.0260009765625, -0.017581939697265625, -0.00916290283203125, -0.000743865966796875, 0.0076751708984375, 0.016094207763671875, 0.02451324462890625, 0.032932281494140625, 0.041351318359375, 0.049770355224609375, 0.05818939208984375, 0.06660842895507812, 0.0750274658203125, 0.08344650268554688, 0.09186553955078125, 0.10028457641601562, 0.10870361328125, 0.11712265014648438, 0.12554168701171875, 0.13396072387695312, 0.1423797607421875, 0.15079879760742188, 0.15921783447265625, 0.16763687133789062, 0.176055908203125, 0.18447494506835938, 0.19289398193359375, 0.20131301879882812, 0.2097320556640625, 0.21815109252929688, 0.22657012939453125, 0.23498916625976562, 0.243408203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 11.0, 3.0, 6.0, 6.0, 12.0, 25.0, 31.0, 30.0, 58.0, 57.0, 76.0, 77.0, 81.0, 73.0, 84.0, 85.0, 73.0, 51.0, 35.0, 41.0, 23.0, 17.0, 12.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0217467546463013, -0.9913377165794373, -0.9609286785125732, -0.9305196404457092, -0.9001106023788452, -0.8697015643119812, -0.8392925262451172, -0.808883547782898, -0.7784744501113892, -0.7480654120445251, -0.7176563739776611, -0.6872473359107971, -0.6568382978439331, -0.6264292597770691, -0.5960202217102051, -0.5656112432479858, -0.5352022051811218, -0.5047931671142578, -0.4743841290473938, -0.4439750909805298, -0.41356605291366577, -0.38315701484680176, -0.35274800658226013, -0.3223389685153961, -0.2919299304485321, -0.2615208923816681, -0.23111185431480408, -0.20070283114910126, -0.17029379308223724, -0.13988475501537323, -0.10947573184967041, -0.0790666937828064, -0.04865765571594238, -0.018248621374368668, 0.012160412967205048, 0.042569443583488464, 0.07297848165035248, 0.10338751971721649, 0.1337965428829193, 0.16420558094978333, 0.19461461901664734, 0.22502365708351135, 0.25543269515037537, 0.285841703414917, 0.316250741481781, 0.346659779548645, 0.37706881761550903, 0.40747785568237305, 0.43788689374923706, 0.4682959318161011, 0.4987049698829651, 0.5291140079498291, 0.5595230460166931, 0.5899320840835571, 0.6203410625457764, 0.6507501602172852, 0.6811591386795044, 0.7115681767463684, 0.7419772148132324, 0.7723862528800964, 0.8027952909469604, 0.8332043290138245, 0.8636133670806885, 0.8940223455429077, 0.9244314432144165]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 6.0, 5.0, 11.0, 15.0, 14.0, 10.0, 15.0, 20.0, 19.0, 25.0, 26.0, 41.0, 40.0, 33.0, 32.0, 50.0, 53.0, 45.0, 42.0, 37.0, 58.0, 46.0, 46.0, 27.0, 30.0, 38.0, 35.0, 32.0, 27.0, 19.0, 19.0, 11.0, 14.0, 18.0, 9.0, 5.0, 8.0, 2.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7819831371307373, -0.7594842314720154, -0.7369852662086487, -0.7144863605499268, -0.6919873952865601, -0.6694884896278381, -0.6469895839691162, -0.6244906187057495, -0.6019916534423828, -0.5794927477836609, -0.5569937825202942, -0.5344948768615723, -0.5119959115982056, -0.48949700593948364, -0.46699807047843933, -0.444499135017395, -0.4220002293586731, -0.3995012938976288, -0.3770023584365845, -0.35450345277786255, -0.33200448751449585, -0.3095055818557739, -0.2870066463947296, -0.2645077109336853, -0.242008775472641, -0.21950984001159668, -0.19701090455055237, -0.17451198399066925, -0.15201304852962494, -0.12951411306858063, -0.10701519250869751, -0.0845162570476532, -0.06201726198196411, -0.0395183302462101, -0.017019398510456085, 0.005479529500007629, 0.02797846496105194, 0.05047740042209625, 0.07297632098197937, 0.09547525644302368, 0.117974191904068, 0.1404731273651123, 0.16297206282615662, 0.18547098338603973, 0.20796991884708405, 0.23046885430812836, 0.2529677748680115, 0.2754667103290558, 0.2979656457901001, 0.3204645812511444, 0.3429635167121887, 0.36546242237091064, 0.38796138763427734, 0.41046029329299927, 0.4329592287540436, 0.4554581642150879, 0.4779570996761322, 0.5004560351371765, 0.5229549407958984, 0.5454539060592651, 0.5679528117179871, 0.5904517769813538, 0.6129506826400757, 0.6354496479034424, 0.6579485535621643]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 12.0, 5.0, 7.0, 12.0, 27.0, 37.0, 36.0, 69.0, 97.0, 184.0, 294.0, 501.0, 966.0, 2063.0, 4029.0, 8473.0, 18203.0, 43395.0, 119322.0, 313414.0, 326314.0, 127936.0, 46155.0, 19345.0, 8971.0, 4201.0, 2090.0, 1050.0, 533.0, 316.0, 189.0, 91.0, 74.0, 49.0, 23.0, 20.0, 19.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.28045654296875, -0.2711181640625, -0.26177978515625, -0.25244140625, -0.24310302734375, -0.2337646484375, -0.22442626953125, -0.215087890625, -0.20574951171875, -0.1964111328125, -0.18707275390625, -0.177734375, -0.16839599609375, -0.1590576171875, -0.14971923828125, -0.140380859375, -0.13104248046875, -0.1217041015625, -0.11236572265625, -0.10302734375, -0.09368896484375, -0.0843505859375, -0.07501220703125, -0.065673828125, -0.05633544921875, -0.0469970703125, -0.03765869140625, -0.0283203125, -0.01898193359375, -0.0096435546875, -0.00030517578125, 0.009033203125, 0.01837158203125, 0.0277099609375, 0.03704833984375, 0.04638671875, 0.05572509765625, 0.0650634765625, 0.07440185546875, 0.083740234375, 0.09307861328125, 0.1024169921875, 0.11175537109375, 0.12109375, 0.13043212890625, 0.1397705078125, 0.14910888671875, 0.158447265625, 0.16778564453125, 0.1771240234375, 0.18646240234375, 0.19580078125, 0.20513916015625, 0.2144775390625, 0.22381591796875, 0.233154296875, 0.24249267578125, 0.2518310546875, 0.26116943359375, 0.2705078125, 0.27984619140625, 0.2891845703125, 0.29852294921875, 0.307861328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 11.0, 8.0, 11.0, 27.0, 24.0, 34.0, 46.0, 47.0, 68.0, 56.0, 72.0, 94.0, 88.0, 62.0, 78.0, 80.0, 37.0, 54.0, 30.0, 32.0, 10.0, 11.0, 14.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0836181640625, -0.07875633239746094, -0.07389450073242188, -0.06903266906738281, -0.06417083740234375, -0.05930900573730469, -0.054447174072265625, -0.04958534240722656, -0.0447235107421875, -0.03986167907714844, -0.034999847412109375, -0.030138015747070312, -0.02527618408203125, -0.020414352416992188, -0.015552520751953125, -0.010690689086914062, -0.005828857421875, -0.0009670257568359375, 0.003894805908203125, 0.008756637573242188, 0.01361846923828125, 0.018480300903320312, 0.023342132568359375, 0.028203964233398438, 0.0330657958984375, 0.03792762756347656, 0.042789459228515625, 0.04765129089355469, 0.05251312255859375, 0.05737495422363281, 0.062236785888671875, 0.06709861755371094, 0.07196044921875, 0.07682228088378906, 0.08168411254882812, 0.08654594421386719, 0.09140777587890625, 0.09626960754394531, 0.10113143920898438, 0.10599327087402344, 0.1108551025390625, 0.11571693420410156, 0.12057876586914062, 0.1254405975341797, 0.13030242919921875, 0.1351642608642578, 0.14002609252929688, 0.14488792419433594, 0.149749755859375, 0.15461158752441406, 0.15947341918945312, 0.1643352508544922, 0.16919708251953125, 0.1740589141845703, 0.17892074584960938, 0.18378257751464844, 0.1886444091796875, 0.19350624084472656, 0.19836807250976562, 0.2032299041748047, 0.20809173583984375, 0.2129535675048828, 0.21781539916992188, 0.22267723083496094, 0.2275390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 10.0, 18.0, 31.0, 58.0, 147.0, 267.0, 569.0, 1209.0, 2588.0, 5894.0, 13536.0, 37689.0, 154211.0, 516203.0, 232454.0, 52556.0, 17745.0, 7321.0, 3226.0, 1444.0, 658.0, 343.0, 150.0, 84.0, 49.0, 34.0, 12.0, 8.0, 12.0, 2.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3935546875, -0.38027191162109375, -0.3669891357421875, -0.35370635986328125, -0.340423583984375, -0.32714080810546875, -0.3138580322265625, -0.30057525634765625, -0.28729248046875, -0.27400970458984375, -0.2607269287109375, -0.24744415283203125, -0.234161376953125, -0.22087860107421875, -0.2075958251953125, -0.19431304931640625, -0.1810302734375, -0.16774749755859375, -0.1544647216796875, -0.14118194580078125, -0.127899169921875, -0.11461639404296875, -0.1013336181640625, -0.08805084228515625, -0.07476806640625, -0.06148529052734375, -0.0482025146484375, -0.03491973876953125, -0.021636962890625, -0.00835418701171875, 0.0049285888671875, 0.01821136474609375, 0.031494140625, 0.04477691650390625, 0.0580596923828125, 0.07134246826171875, 0.084625244140625, 0.09790802001953125, 0.1111907958984375, 0.12447357177734375, 0.13775634765625, 0.15103912353515625, 0.1643218994140625, 0.17760467529296875, 0.190887451171875, 0.20417022705078125, 0.2174530029296875, 0.23073577880859375, 0.2440185546875, 0.25730133056640625, 0.2705841064453125, 0.28386688232421875, 0.297149658203125, 0.31043243408203125, 0.3237152099609375, 0.33699798583984375, 0.35028076171875, 0.36356353759765625, 0.3768463134765625, 0.39012908935546875, 0.403411865234375, 0.41669464111328125, 0.4299774169921875, 0.44326019287109375, 0.45654296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 4.0, 2.0, 8.0, 4.0, 4.0, 8.0, 16.0, 14.0, 18.0, 28.0, 29.0, 30.0, 30.0, 43.0, 49.0, 61.0, 60.0, 62.0, 67.0, 53.0, 70.0, 56.0, 39.0, 48.0, 44.0, 26.0, 31.0, 24.0, 21.0, 18.0, 11.0, 8.0, 5.0, 5.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40625, -0.39488983154296875, -0.3835296630859375, -0.37216949462890625, -0.360809326171875, -0.34944915771484375, -0.3380889892578125, -0.32672882080078125, -0.31536865234375, -0.30400848388671875, -0.2926483154296875, -0.28128814697265625, -0.269927978515625, -0.25856781005859375, -0.2472076416015625, -0.23584747314453125, -0.2244873046875, -0.21312713623046875, -0.2017669677734375, -0.19040679931640625, -0.179046630859375, -0.16768646240234375, -0.1563262939453125, -0.14496612548828125, -0.13360595703125, -0.12224578857421875, -0.1108856201171875, -0.09952545166015625, -0.088165283203125, -0.07680511474609375, -0.0654449462890625, -0.05408477783203125, -0.042724609375, -0.03136444091796875, -0.0200042724609375, -0.00864410400390625, 0.002716064453125, 0.01407623291015625, 0.0254364013671875, 0.03679656982421875, 0.04815673828125, 0.05951690673828125, 0.0708770751953125, 0.08223724365234375, 0.093597412109375, 0.10495758056640625, 0.1163177490234375, 0.12767791748046875, 0.1390380859375, 0.15039825439453125, 0.1617584228515625, 0.17311859130859375, 0.184478759765625, 0.19583892822265625, 0.2071990966796875, 0.21855926513671875, 0.22991943359375, 0.24127960205078125, 0.2526397705078125, 0.26399993896484375, 0.275360107421875, 0.28672027587890625, 0.2980804443359375, 0.30944061279296875, 0.32080078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 1.0, 7.0, 8.0, 17.0, 29.0, 35.0, 65.0, 95.0, 200.0, 366.0, 559.0, 1087.0, 2155.0, 4454.0, 9976.0, 23890.0, 62425.0, 230100.0, 483577.0, 150036.0, 46034.0, 18185.0, 7875.0, 3568.0, 1729.0, 911.0, 503.0, 291.0, 143.0, 94.0, 56.0, 31.0, 18.0, 8.0, 13.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2037353515625, -0.1967945098876953, -0.18985366821289062, -0.18291282653808594, -0.17597198486328125, -0.16903114318847656, -0.16209030151367188, -0.1551494598388672, -0.1482086181640625, -0.1412677764892578, -0.13432693481445312, -0.12738609313964844, -0.12044525146484375, -0.11350440979003906, -0.10656356811523438, -0.09962272644042969, -0.092681884765625, -0.08574104309082031, -0.07880020141601562, -0.07185935974121094, -0.06491851806640625, -0.05797767639160156, -0.051036834716796875, -0.04409599304199219, -0.0371551513671875, -0.030214309692382812, -0.023273468017578125, -0.016332626342773438, -0.00939178466796875, -0.0024509429931640625, 0.004489898681640625, 0.011430740356445312, 0.01837158203125, 0.025312423706054688, 0.032253265380859375, 0.03919410705566406, 0.04613494873046875, 0.05307579040527344, 0.060016632080078125, 0.06695747375488281, 0.0738983154296875, 0.08083915710449219, 0.08777999877929688, 0.09472084045410156, 0.10166168212890625, 0.10860252380371094, 0.11554336547851562, 0.12248420715332031, 0.129425048828125, 0.1363658905029297, 0.14330673217773438, 0.15024757385253906, 0.15718841552734375, 0.16412925720214844, 0.17107009887695312, 0.1780109405517578, 0.1849517822265625, 0.1918926239013672, 0.19883346557617188, 0.20577430725097656, 0.21271514892578125, 0.21965599060058594, 0.22659683227539062, 0.2335376739501953, 0.240478515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 14.0, 14.0, 13.0, 40.0, 41.0, 81.0, 150.0, 195.0, 152.0, 88.0, 54.0, 28.0, 30.0, 19.0, 12.0, 7.0, 8.0, 7.0, 4.0, 6.0, 2.0, 1.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.115436553955078e-05, -5.9567391872406006e-05, -5.798041820526123e-05, -5.6393444538116455e-05, -5.480647087097168e-05, -5.3219497203826904e-05, -5.163252353668213e-05, -5.0045549869537354e-05, -4.845857620239258e-05, -4.68716025352478e-05, -4.528462886810303e-05, -4.369765520095825e-05, -4.2110681533813477e-05, -4.05237078666687e-05, -3.8936734199523926e-05, -3.734976053237915e-05, -3.5762786865234375e-05, -3.41758131980896e-05, -3.2588839530944824e-05, -3.100186586380005e-05, -2.9414892196655273e-05, -2.7827918529510498e-05, -2.6240944862365723e-05, -2.4653971195220947e-05, -2.3066997528076172e-05, -2.1480023860931396e-05, -1.989305019378662e-05, -1.8306076526641846e-05, -1.671910285949707e-05, -1.5132129192352295e-05, -1.354515552520752e-05, -1.1958181858062744e-05, -1.0371208190917969e-05, -8.784234523773193e-06, -7.197260856628418e-06, -5.610287189483643e-06, -4.023313522338867e-06, -2.436339855194092e-06, -8.493661880493164e-07, 7.37607479095459e-07, 2.3245811462402344e-06, 3.91155481338501e-06, 5.498528480529785e-06, 7.0855021476745605e-06, 8.672475814819336e-06, 1.0259449481964111e-05, 1.1846423149108887e-05, 1.3433396816253662e-05, 1.5020370483398438e-05, 1.6607344150543213e-05, 1.8194317817687988e-05, 1.9781291484832764e-05, 2.136826515197754e-05, 2.2955238819122314e-05, 2.454221248626709e-05, 2.6129186153411865e-05, 2.771615982055664e-05, 2.9303133487701416e-05, 3.089010715484619e-05, 3.247708082199097e-05, 3.406405448913574e-05, 3.565102815628052e-05, 3.723800182342529e-05, 3.882497549057007e-05, 4.0411949157714844e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 12.0, 29.0, 27.0, 32.0, 60.0, 83.0, 118.0, 198.0, 283.0, 467.0, 810.0, 1356.0, 2462.0, 4757.0, 9826.0, 21418.0, 50857.0, 152410.0, 438092.0, 238782.0, 72236.0, 28272.0, 12579.0, 6119.0, 3086.0, 1638.0, 936.0, 575.0, 318.0, 209.0, 145.0, 104.0, 77.0, 44.0, 29.0, 28.0, 20.0, 13.0, 12.0, 4.0, 4.0, 2.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.17630958557128906, -0.17036819458007812, -0.1644268035888672, -0.15848541259765625, -0.1525440216064453, -0.14660263061523438, -0.14066123962402344, -0.1347198486328125, -0.12877845764160156, -0.12283706665039062, -0.11689567565917969, -0.11095428466796875, -0.10501289367675781, -0.09907150268554688, -0.09313011169433594, -0.087188720703125, -0.08124732971191406, -0.07530593872070312, -0.06936454772949219, -0.06342315673828125, -0.05748176574707031, -0.051540374755859375, -0.04559898376464844, -0.0396575927734375, -0.03371620178222656, -0.027774810791015625, -0.021833419799804688, -0.01589202880859375, -0.009950637817382812, -0.004009246826171875, 0.0019321441650390625, 0.00787353515625, 0.013814926147460938, 0.019756317138671875, 0.025697708129882812, 0.03163909912109375, 0.03758049011230469, 0.043521881103515625, 0.04946327209472656, 0.0554046630859375, 0.06134605407714844, 0.06728744506835938, 0.07322883605957031, 0.07917022705078125, 0.08511161804199219, 0.09105300903320312, 0.09699440002441406, 0.102935791015625, 0.10887718200683594, 0.11481857299804688, 0.12075996398925781, 0.12670135498046875, 0.1326427459716797, 0.13858413696289062, 0.14452552795410156, 0.1504669189453125, 0.15640830993652344, 0.16234970092773438, 0.1682910919189453, 0.17423248291015625, 0.1801738739013672, 0.18611526489257812, 0.19205665588378906, 0.197998046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 2.0, 5.0, 3.0, 11.0, 13.0, 22.0, 34.0, 57.0, 90.0, 121.0, 136.0, 142.0, 114.0, 70.0, 56.0, 37.0, 17.0, 10.0, 8.0, 10.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.288330078125, -0.28067588806152344, -0.2730216979980469, -0.2653675079345703, -0.25771331787109375, -0.2500591278076172, -0.24240493774414062, -0.23475074768066406, -0.2270965576171875, -0.21944236755371094, -0.21178817749023438, -0.2041339874267578, -0.19647979736328125, -0.1888256072998047, -0.18117141723632812, -0.17351722717285156, -0.165863037109375, -0.15820884704589844, -0.15055465698242188, -0.1429004669189453, -0.13524627685546875, -0.1275920867919922, -0.11993789672851562, -0.11228370666503906, -0.1046295166015625, -0.09697532653808594, -0.08932113647460938, -0.08166694641113281, -0.07401275634765625, -0.06635856628417969, -0.058704376220703125, -0.05105018615722656, -0.04339599609375, -0.03574180603027344, -0.028087615966796875, -0.020433425903320312, -0.01277923583984375, -0.0051250457763671875, 0.002529144287109375, 0.010183334350585938, 0.0178375244140625, 0.025491714477539062, 0.033145904541015625, 0.04080009460449219, 0.04845428466796875, 0.05610847473144531, 0.06376266479492188, 0.07141685485839844, 0.079071044921875, 0.08672523498535156, 0.09437942504882812, 0.10203361511230469, 0.10968780517578125, 0.11734199523925781, 0.12499618530273438, 0.13265037536621094, 0.1403045654296875, 0.14795875549316406, 0.15561294555664062, 0.1632671356201172, 0.17092132568359375, 0.1785755157470703, 0.18622970581054688, 0.19388389587402344, 0.2015380859375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 8.0, 9.0, 22.0, 36.0, 47.0, 75.0, 99.0, 104.0, 101.0, 115.0, 95.0, 93.0, 52.0, 50.0, 30.0, 19.0, 9.0, 14.0, 6.0, 2.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6127504110336304, -1.5591074228286743, -1.5054645538330078, -1.4518215656280518, -1.3981785774230957, -1.3445355892181396, -1.2908927202224731, -1.237249732017517, -1.1836068630218506, -1.1299638748168945, -1.076321005821228, -1.022678017616272, -0.9690350294113159, -0.9153921008110046, -0.8617491722106934, -0.8081061840057373, -0.7544631958007812, -0.70082026720047, -0.6471772789955139, -0.5935343503952026, -0.5398913621902466, -0.4862484335899353, -0.432605504989624, -0.37896254658699036, -0.3253195881843567, -0.271676629781723, -0.21803368628025055, -0.16439074277877808, -0.11074778437614441, -0.05710482597351074, -0.003461897373199463, 0.050181061029434204, 0.10382401943206787, 0.15746697783470154, 0.211109921336174, 0.2647528648376465, 0.31839582324028015, 0.3720387816429138, 0.4256817102432251, 0.47932466864585876, 0.5329676270484924, 0.5866105556488037, 0.6402535438537598, 0.693896472454071, 0.7475394010543823, 0.8011823892593384, 0.8548253178596497, 0.9084682464599609, 0.962111234664917, 1.015754222869873, 1.0693970918655396, 1.1230400800704956, 1.1766830682754517, 1.2303259372711182, 1.2839689254760742, 1.3376119136810303, 1.3912549018859863, 1.4448978900909424, 1.4985407590866089, 1.552183747291565, 1.605826735496521, 1.6594696044921875, 1.7131125926971436, 1.7667555809020996, 1.8203984498977661]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 8.0, 13.0, 6.0, 9.0, 10.0, 16.0, 20.0, 24.0, 18.0, 27.0, 40.0, 38.0, 30.0, 45.0, 33.0, 44.0, 34.0, 39.0, 51.0, 45.0, 47.0, 25.0, 35.0, 39.0, 31.0, 33.0, 31.0, 21.0, 27.0, 32.0, 23.0, 16.0, 21.0, 7.0, 14.0, 8.0, 9.0, 5.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8816020488739014, -0.853523313999176, -0.8254446387290955, -0.7973659038543701, -0.7692871689796448, -0.7412084341049194, -0.7131297588348389, -0.6850510239601135, -0.6569722890853882, -0.6288935542106628, -0.6008148789405823, -0.5727361440658569, -0.5446574091911316, -0.5165786743164062, -0.4884999990463257, -0.46042126417160034, -0.4323425590991974, -0.40426385402679443, -0.3761851191520691, -0.34810641407966614, -0.3200276792049408, -0.29194897413253784, -0.2638702392578125, -0.23579153418540955, -0.2077128142118454, -0.17963409423828125, -0.1515553742647171, -0.12347666174173355, -0.0953979417681694, -0.06731922924518585, -0.039240509271621704, -0.011161789298057556, 0.016916930675506592, 0.04499565064907074, 0.07307437062263489, 0.10115308314561844, 0.12923181056976318, 0.15731051564216614, 0.18538923561573029, 0.21346795558929443, 0.24154667556285858, 0.26962539553642273, 0.2977041006088257, 0.325782835483551, 0.353861540555954, 0.38194024562835693, 0.4100189805030823, 0.4380977153778076, 0.46617642045021057, 0.4942551255226135, 0.5223338603973389, 0.5504125952720642, 0.5784912705421448, 0.6065700054168701, 0.6346487402915955, 0.6627274751663208, 0.6908061504364014, 0.7188848853111267, 0.7469635605812073, 0.7750422954559326, 0.803121030330658, 0.8311997652053833, 0.8592784404754639, 0.8873571753501892, 0.9154359102249146]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 3.0, 15.0, 11.0, 27.0, 37.0, 45.0, 62.0, 124.0, 179.0, 348.0, 668.0, 1340.0, 3046.0, 8021.0, 24825.0, 102023.0, 726140.0, 2915070.0, 327792.0, 58374.0, 15902.0, 5471.0, 2260.0, 1076.0, 594.0, 292.0, 187.0, 107.0, 77.0, 45.0, 34.0, 20.0, 18.0, 14.0, 5.0, 8.0, 6.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.31640625, -0.306304931640625, -0.29620361328125, -0.286102294921875, -0.2760009765625, -0.265899658203125, -0.25579833984375, -0.245697021484375, -0.235595703125, -0.225494384765625, -0.21539306640625, -0.205291748046875, -0.1951904296875, -0.185089111328125, -0.17498779296875, -0.164886474609375, -0.15478515625, -0.144683837890625, -0.13458251953125, -0.124481201171875, -0.1143798828125, -0.104278564453125, -0.09417724609375, -0.084075927734375, -0.073974609375, -0.063873291015625, -0.05377197265625, -0.043670654296875, -0.0335693359375, -0.023468017578125, -0.01336669921875, -0.003265380859375, 0.0068359375, 0.016937255859375, 0.02703857421875, 0.037139892578125, 0.0472412109375, 0.057342529296875, 0.06744384765625, 0.077545166015625, 0.087646484375, 0.097747802734375, 0.10784912109375, 0.117950439453125, 0.1280517578125, 0.138153076171875, 0.14825439453125, 0.158355712890625, 0.16845703125, 0.178558349609375, 0.18865966796875, 0.198760986328125, 0.2088623046875, 0.218963623046875, 0.22906494140625, 0.239166259765625, 0.249267578125, 0.259368896484375, 0.26947021484375, 0.279571533203125, 0.2896728515625, 0.299774169921875, 0.30987548828125, 0.319976806640625, 0.330078125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 12.0, 21.0, 21.0, 32.0, 36.0, 38.0, 57.0, 63.0, 60.0, 65.0, 80.0, 67.0, 73.0, 67.0, 59.0, 59.0, 46.0, 50.0, 20.0, 21.0, 18.0, 14.0, 3.0, 9.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09344482421875, -0.08835506439208984, -0.08326530456542969, -0.07817554473876953, -0.07308578491210938, -0.06799602508544922, -0.06290626525878906, -0.057816505432128906, -0.05272674560546875, -0.047636985778808594, -0.04254722595214844, -0.03745746612548828, -0.032367706298828125, -0.02727794647216797, -0.022188186645507812, -0.017098426818847656, -0.0120086669921875, -0.006918907165527344, -0.0018291473388671875, 0.0032606124877929688, 0.008350372314453125, 0.013440132141113281, 0.018529891967773438, 0.023619651794433594, 0.02870941162109375, 0.033799171447753906, 0.03888893127441406, 0.04397869110107422, 0.049068450927734375, 0.05415821075439453, 0.05924797058105469, 0.06433773040771484, 0.069427490234375, 0.07451725006103516, 0.07960700988769531, 0.08469676971435547, 0.08978652954101562, 0.09487628936767578, 0.09996604919433594, 0.1050558090209961, 0.11014556884765625, 0.1152353286743164, 0.12032508850097656, 0.12541484832763672, 0.13050460815429688, 0.13559436798095703, 0.1406841278076172, 0.14577388763427734, 0.1508636474609375, 0.15595340728759766, 0.1610431671142578, 0.16613292694091797, 0.17122268676757812, 0.17631244659423828, 0.18140220642089844, 0.1864919662475586, 0.19158172607421875, 0.1966714859008789, 0.20176124572753906, 0.20685100555419922, 0.21194076538085938, 0.21703052520751953, 0.2221202850341797, 0.22721004486083984, 0.2322998046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 8.0, 8.0, 13.0, 12.0, 13.0, 34.0, 52.0, 93.0, 122.0, 199.0, 249.0, 451.0, 783.0, 1253.0, 2249.0, 4653.0, 10091.0, 24575.0, 71031.0, 249227.0, 1167616.0, 2062995.0, 424768.0, 111099.0, 36053.0, 13826.0, 5949.0, 2878.0, 1582.0, 900.0, 524.0, 332.0, 214.0, 146.0, 94.0, 54.0, 46.0, 28.0, 24.0, 6.0, 12.0, 10.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3359375, -0.32550048828125, -0.3150634765625, -0.30462646484375, -0.294189453125, -0.28375244140625, -0.2733154296875, -0.26287841796875, -0.25244140625, -0.24200439453125, -0.2315673828125, -0.22113037109375, -0.210693359375, -0.20025634765625, -0.1898193359375, -0.17938232421875, -0.1689453125, -0.15850830078125, -0.1480712890625, -0.13763427734375, -0.127197265625, -0.11676025390625, -0.1063232421875, -0.09588623046875, -0.08544921875, -0.07501220703125, -0.0645751953125, -0.05413818359375, -0.043701171875, -0.03326416015625, -0.0228271484375, -0.01239013671875, -0.001953125, 0.00848388671875, 0.0189208984375, 0.02935791015625, 0.039794921875, 0.05023193359375, 0.0606689453125, 0.07110595703125, 0.08154296875, 0.09197998046875, 0.1024169921875, 0.11285400390625, 0.123291015625, 0.13372802734375, 0.1441650390625, 0.15460205078125, 0.1650390625, 0.17547607421875, 0.1859130859375, 0.19635009765625, 0.206787109375, 0.21722412109375, 0.2276611328125, 0.23809814453125, 0.24853515625, 0.25897216796875, 0.2694091796875, 0.27984619140625, 0.290283203125, 0.30072021484375, 0.3111572265625, 0.32159423828125, 0.33203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 8.0, 10.0, 12.0, 22.0, 29.0, 45.0, 56.0, 95.0, 148.0, 219.0, 369.0, 587.0, 811.0, 612.0, 369.0, 224.0, 148.0, 103.0, 63.0, 35.0, 34.0, 19.0, 19.0, 12.0, 12.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24821853637695312, -0.23886871337890625, -0.22951889038085938, -0.2201690673828125, -0.21081924438476562, -0.20146942138671875, -0.19211959838867188, -0.182769775390625, -0.17341995239257812, -0.16407012939453125, -0.15472030639648438, -0.1453704833984375, -0.13602066040039062, -0.12667083740234375, -0.11732101440429688, -0.10797119140625, -0.09862136840820312, -0.08927154541015625, -0.07992172241210938, -0.0705718994140625, -0.061222076416015625, -0.05187225341796875, -0.042522430419921875, -0.033172607421875, -0.023822784423828125, -0.01447296142578125, -0.005123138427734375, 0.0042266845703125, 0.013576507568359375, 0.02292633056640625, 0.032276153564453125, 0.0416259765625, 0.050975799560546875, 0.06032562255859375, 0.06967544555664062, 0.0790252685546875, 0.08837509155273438, 0.09772491455078125, 0.10707473754882812, 0.116424560546875, 0.12577438354492188, 0.13512420654296875, 0.14447402954101562, 0.1538238525390625, 0.16317367553710938, 0.17252349853515625, 0.18187332153320312, 0.19122314453125, 0.20057296752929688, 0.20992279052734375, 0.21927261352539062, 0.2286224365234375, 0.23797225952148438, 0.24732208251953125, 0.2566719055175781, 0.266021728515625, 0.2753715515136719, 0.28472137451171875, 0.2940711975097656, 0.3034210205078125, 0.3127708435058594, 0.32212066650390625, 0.3314704895019531, 0.3408203125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 14.0, 15.0, 15.0, 28.0, 31.0, 42.0, 60.0, 63.0, 68.0, 81.0, 93.0, 79.0, 87.0, 74.0, 57.0, 41.0, 40.0, 27.0, 13.0, 14.0, 14.0, 12.0, 11.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2687612771987915, -1.2335816621780396, -1.198401927947998, -1.163222312927246, -1.1280426979064941, -1.0928629636764526, -1.0576833486557007, -1.0225036144256592, -0.9873239994049072, -0.9521443247795105, -0.9169646501541138, -0.8817850351333618, -0.8466053605079651, -0.8114256858825684, -0.7762460708618164, -0.7410663962364197, -0.705886721611023, -0.6707070469856262, -0.6355273723602295, -0.6003477573394775, -0.5651680827140808, -0.5299884080886841, -0.49480876326560974, -0.4596291184425354, -0.42444944381713867, -0.38926976919174194, -0.3540901243686676, -0.31891047954559326, -0.28373080492019653, -0.248551145195961, -0.21337148547172546, -0.17819182574748993, -0.1430121660232544, -0.10783250629901886, -0.07265284657478333, -0.03747318685054779, -0.002293527126312256, 0.03288613259792328, 0.06806579232215881, 0.10324545204639435, 0.13842511177062988, 0.17360477149486542, 0.20878443121910095, 0.2439640909433365, 0.279143750667572, 0.31432342529296875, 0.3495030701160431, 0.38468271493911743, 0.41986238956451416, 0.4550420641899109, 0.49022170901298523, 0.5254013538360596, 0.5605810284614563, 0.595760703086853, 0.630940318107605, 0.6661199927330017, 0.7012996673583984, 0.7364793419837952, 0.7716590166091919, 0.8068386316299438, 0.8420183062553406, 0.8771979808807373, 0.9123775959014893, 0.947557270526886, 0.9827369451522827]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 8.0, 12.0, 9.0, 16.0, 13.0, 12.0, 21.0, 18.0, 30.0, 21.0, 33.0, 26.0, 35.0, 48.0, 33.0, 37.0, 30.0, 45.0, 29.0, 38.0, 51.0, 35.0, 39.0, 31.0, 34.0, 31.0, 33.0, 27.0, 15.0, 22.0, 18.0, 19.0, 19.0, 13.0, 13.0, 17.0, 13.0, 4.0, 7.0, 9.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.669475793838501, -0.6492985486984253, -0.6291213631629944, -0.6089441180229187, -0.588766872882843, -0.5685896873474121, -0.5484124422073364, -0.5282351970672607, -0.5080579519271851, -0.48788073658943176, -0.4677034914493561, -0.4475262761116028, -0.4273490309715271, -0.4071718156337738, -0.3869946002960205, -0.3668173551559448, -0.3466401696205139, -0.3264629542827606, -0.30628570914268494, -0.28610849380493164, -0.26593124866485596, -0.24575403332710266, -0.22557681798934937, -0.20539958775043488, -0.18522235751152039, -0.1650451272726059, -0.1448678970336914, -0.12469068169593811, -0.10451345145702362, -0.08433622121810913, -0.06415899842977524, -0.043981775641441345, -0.023804545402526855, -0.003627318888902664, 0.016549907624721527, 0.03672713413834572, 0.05690436065196991, 0.0770815908908844, 0.09725881367921829, 0.11743603646755219, 0.13761326670646667, 0.15779049694538116, 0.17796772718429565, 0.19814494252204895, 0.21832217276096344, 0.23849940299987793, 0.2586766183376312, 0.2788538336753845, 0.2990310788154602, 0.3192082941532135, 0.3393855392932892, 0.3595627546310425, 0.37973999977111816, 0.39991721510887146, 0.42009443044662476, 0.44027167558670044, 0.46044889092445374, 0.48062610626220703, 0.5008033514022827, 0.5209805965423584, 0.5411577820777893, 0.561335027217865, 0.5815122723579407, 0.6016894578933716, 0.6218667030334473]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 9.0, 12.0, 15.0, 19.0, 39.0, 54.0, 68.0, 96.0, 184.0, 255.0, 431.0, 699.0, 1222.0, 2014.0, 3447.0, 6186.0, 10591.0, 19058.0, 35368.0, 72722.0, 171784.0, 336910.0, 210151.0, 85837.0, 41233.0, 21480.0, 12053.0, 6846.0, 3990.0, 2298.0, 1330.0, 793.0, 458.0, 287.0, 200.0, 125.0, 95.0, 60.0, 44.0, 29.0, 20.0, 14.0, 6.0, 5.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25830078125, -0.2503795623779297, -0.24245834350585938, -0.23453712463378906, -0.22661590576171875, -0.21869468688964844, -0.21077346801757812, -0.2028522491455078, -0.1949310302734375, -0.1870098114013672, -0.17908859252929688, -0.17116737365722656, -0.16324615478515625, -0.15532493591308594, -0.14740371704101562, -0.1394824981689453, -0.131561279296875, -0.12364006042480469, -0.11571884155273438, -0.10779762268066406, -0.09987640380859375, -0.09195518493652344, -0.08403396606445312, -0.07611274719238281, -0.0681915283203125, -0.06027030944824219, -0.052349090576171875, -0.04442787170410156, -0.03650665283203125, -0.028585433959960938, -0.020664215087890625, -0.012742996215820312, -0.00482177734375, 0.0030994415283203125, 0.011020660400390625, 0.018941879272460938, 0.02686309814453125, 0.03478431701660156, 0.042705535888671875, 0.05062675476074219, 0.0585479736328125, 0.06646919250488281, 0.07439041137695312, 0.08231163024902344, 0.09023284912109375, 0.09815406799316406, 0.10607528686523438, 0.11399650573730469, 0.121917724609375, 0.1298389434814453, 0.13776016235351562, 0.14568138122558594, 0.15360260009765625, 0.16152381896972656, 0.16944503784179688, 0.1773662567138672, 0.1852874755859375, 0.1932086944580078, 0.20112991333007812, 0.20905113220214844, 0.21697235107421875, 0.22489356994628906, 0.23281478881835938, 0.2407360076904297, 0.2486572265625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 14.0, 22.0, 19.0, 28.0, 27.0, 56.0, 44.0, 40.0, 53.0, 66.0, 80.0, 57.0, 68.0, 55.0, 50.0, 43.0, 62.0, 50.0, 38.0, 40.0, 16.0, 16.0, 12.0, 11.0, 10.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09765625, -0.09277534484863281, -0.08789443969726562, -0.08301353454589844, -0.07813262939453125, -0.07325172424316406, -0.06837081909179688, -0.06348991394042969, -0.0586090087890625, -0.05372810363769531, -0.048847198486328125, -0.04396629333496094, -0.03908538818359375, -0.03420448303222656, -0.029323577880859375, -0.024442672729492188, -0.019561767578125, -0.014680862426757812, -0.009799957275390625, -0.0049190521240234375, -3.814697265625e-05, 0.0048427581787109375, 0.009723663330078125, 0.014604568481445312, 0.0194854736328125, 0.024366378784179688, 0.029247283935546875, 0.03412818908691406, 0.03900909423828125, 0.04388999938964844, 0.048770904541015625, 0.05365180969238281, 0.05853271484375, 0.06341361999511719, 0.06829452514648438, 0.07317543029785156, 0.07805633544921875, 0.08293724060058594, 0.08781814575195312, 0.09269905090332031, 0.0975799560546875, 0.10246086120605469, 0.10734176635742188, 0.11222267150878906, 0.11710357666015625, 0.12198448181152344, 0.12686538696289062, 0.1317462921142578, 0.136627197265625, 0.1415081024169922, 0.14638900756835938, 0.15126991271972656, 0.15615081787109375, 0.16103172302246094, 0.16591262817382812, 0.1707935333251953, 0.1756744384765625, 0.1805553436279297, 0.18543624877929688, 0.19031715393066406, 0.19519805908203125, 0.20007896423339844, 0.20495986938476562, 0.2098407745361328, 0.2147216796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 17.0, 12.0, 24.0, 25.0, 34.0, 48.0, 53.0, 105.0, 156.0, 275.0, 465.0, 963.0, 1882.0, 3600.0, 7079.0, 14442.0, 30233.0, 69648.0, 202500.0, 422429.0, 177020.0, 63079.0, 27648.0, 13194.0, 6625.0, 3257.0, 1689.0, 901.0, 452.0, 250.0, 140.0, 89.0, 56.0, 33.0, 24.0, 26.0, 14.0, 8.0, 10.0, 9.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.310302734375, -0.3004341125488281, -0.29056549072265625, -0.2806968688964844, -0.2708282470703125, -0.2609596252441406, -0.25109100341796875, -0.24122238159179688, -0.231353759765625, -0.22148513793945312, -0.21161651611328125, -0.20174789428710938, -0.1918792724609375, -0.18201065063476562, -0.17214202880859375, -0.16227340698242188, -0.15240478515625, -0.14253616333007812, -0.13266754150390625, -0.12279891967773438, -0.1129302978515625, -0.10306167602539062, -0.09319305419921875, -0.08332443237304688, -0.073455810546875, -0.06358718872070312, -0.05371856689453125, -0.043849945068359375, -0.0339813232421875, -0.024112701416015625, -0.01424407958984375, -0.004375457763671875, 0.0054931640625, 0.015361785888671875, 0.02523040771484375, 0.035099029541015625, 0.0449676513671875, 0.054836273193359375, 0.06470489501953125, 0.07457351684570312, 0.084442138671875, 0.09431076049804688, 0.10417938232421875, 0.11404800415039062, 0.1239166259765625, 0.13378524780273438, 0.14365386962890625, 0.15352249145507812, 0.16339111328125, 0.17325973510742188, 0.18312835693359375, 0.19299697875976562, 0.2028656005859375, 0.21273422241210938, 0.22260284423828125, 0.23247146606445312, 0.242340087890625, 0.2522087097167969, 0.26207733154296875, 0.2719459533691406, 0.2818145751953125, 0.2916831970214844, 0.30155181884765625, 0.3114204406738281, 0.3212890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 10.0, 10.0, 18.0, 17.0, 11.0, 21.0, 29.0, 32.0, 38.0, 36.0, 48.0, 43.0, 49.0, 65.0, 48.0, 46.0, 46.0, 43.0, 45.0, 52.0, 40.0, 27.0, 20.0, 35.0, 21.0, 25.0, 12.0, 22.0, 12.0, 13.0, 12.0, 5.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.34228515625, -0.33154296875, -0.32080078125, -0.31005859375, -0.29931640625, -0.28857421875, -0.27783203125, -0.26708984375, -0.25634765625, -0.24560546875, -0.23486328125, -0.22412109375, -0.21337890625, -0.20263671875, -0.19189453125, -0.18115234375, -0.17041015625, -0.15966796875, -0.14892578125, -0.13818359375, -0.12744140625, -0.11669921875, -0.10595703125, -0.09521484375, -0.08447265625, -0.07373046875, -0.06298828125, -0.05224609375, -0.04150390625, -0.03076171875, -0.02001953125, -0.00927734375, 0.00146484375, 0.01220703125, 0.02294921875, 0.03369140625, 0.04443359375, 0.05517578125, 0.06591796875, 0.07666015625, 0.08740234375, 0.09814453125, 0.10888671875, 0.11962890625, 0.13037109375, 0.14111328125, 0.15185546875, 0.16259765625, 0.17333984375, 0.18408203125, 0.19482421875, 0.20556640625, 0.21630859375, 0.22705078125, 0.23779296875, 0.24853515625, 0.25927734375, 0.27001953125, 0.28076171875, 0.29150390625, 0.30224609375, 0.31298828125, 0.32373046875, 0.33447265625, 0.34521484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 17.0, 21.0, 65.0, 89.0, 150.0, 291.0, 447.0, 843.0, 1526.0, 2642.0, 4890.0, 8557.0, 15554.0, 27801.0, 53806.0, 134353.0, 373212.0, 251194.0, 85800.0, 39418.0, 21034.0, 11755.0, 6640.0, 3705.0, 2068.0, 1122.0, 652.0, 347.0, 222.0, 118.0, 77.0, 39.0, 34.0, 18.0, 9.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129150390625, -0.12450027465820312, -0.11985015869140625, -0.11520004272460938, -0.1105499267578125, -0.10589981079101562, -0.10124969482421875, -0.09659957885742188, -0.091949462890625, -0.08729934692382812, -0.08264923095703125, -0.07799911499023438, -0.0733489990234375, -0.06869888305664062, -0.06404876708984375, -0.059398651123046875, -0.05474853515625, -0.050098419189453125, -0.04544830322265625, -0.040798187255859375, -0.0361480712890625, -0.031497955322265625, -0.02684783935546875, -0.022197723388671875, -0.017547607421875, -0.012897491455078125, -0.00824737548828125, -0.003597259521484375, 0.0010528564453125, 0.005702972412109375, 0.01035308837890625, 0.015003204345703125, 0.0196533203125, 0.024303436279296875, 0.02895355224609375, 0.033603668212890625, 0.0382537841796875, 0.042903900146484375, 0.04755401611328125, 0.052204132080078125, 0.056854248046875, 0.061504364013671875, 0.06615447998046875, 0.07080459594726562, 0.0754547119140625, 0.08010482788085938, 0.08475494384765625, 0.08940505981445312, 0.09405517578125, 0.09870529174804688, 0.10335540771484375, 0.10800552368164062, 0.1126556396484375, 0.11730575561523438, 0.12195587158203125, 0.12660598754882812, 0.131256103515625, 0.13590621948242188, 0.14055633544921875, 0.14520645141601562, 0.1498565673828125, 0.15450668334960938, 0.15915679931640625, 0.16380691528320312, 0.16845703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 3.0, 8.0, 14.0, 10.0, 28.0, 26.0, 48.0, 51.0, 106.0, 174.0, 170.0, 117.0, 60.0, 54.0, 27.0, 26.0, 12.0, 10.0, 7.0, 11.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.601478576660156e-05, -4.463084042072296e-05, -4.324689507484436e-05, -4.186294972896576e-05, -4.047900438308716e-05, -3.909505903720856e-05, -3.7711113691329956e-05, -3.6327168345451355e-05, -3.4943222999572754e-05, -3.355927765369415e-05, -3.217533230781555e-05, -3.079138696193695e-05, -2.940744161605835e-05, -2.802349627017975e-05, -2.6639550924301147e-05, -2.5255605578422546e-05, -2.3871660232543945e-05, -2.2487714886665344e-05, -2.1103769540786743e-05, -1.9719824194908142e-05, -1.833587884902954e-05, -1.695193350315094e-05, -1.556798815727234e-05, -1.4184042811393738e-05, -1.2800097465515137e-05, -1.1416152119636536e-05, -1.0032206773757935e-05, -8.648261427879333e-06, -7.264316082000732e-06, -5.880370736122131e-06, -4.49642539024353e-06, -3.112480044364929e-06, -1.7285346984863281e-06, -3.4458935260772705e-07, 1.039355993270874e-06, 2.423301339149475e-06, 3.807246685028076e-06, 5.191192030906677e-06, 6.575137376785278e-06, 7.95908272266388e-06, 9.34302806854248e-06, 1.0726973414421082e-05, 1.2110918760299683e-05, 1.3494864106178284e-05, 1.4878809452056885e-05, 1.6262754797935486e-05, 1.7646700143814087e-05, 1.9030645489692688e-05, 2.041459083557129e-05, 2.179853618144989e-05, 2.318248152732849e-05, 2.4566426873207092e-05, 2.5950372219085693e-05, 2.7334317564964294e-05, 2.8718262910842896e-05, 3.0102208256721497e-05, 3.14861536026001e-05, 3.28700989484787e-05, 3.42540442943573e-05, 3.56379896402359e-05, 3.70219349861145e-05, 3.84058803319931e-05, 3.9789825677871704e-05, 4.1173771023750305e-05, 4.2557716369628906e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 16.0, 20.0, 35.0, 56.0, 121.0, 168.0, 449.0, 1126.0, 2721.0, 7231.0, 18793.0, 48660.0, 159540.0, 558463.0, 168911.0, 50108.0, 19670.0, 7491.0, 2900.0, 1125.0, 471.0, 205.0, 106.0, 62.0, 33.0, 36.0, 13.0, 7.0, 8.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2333984375, -0.22622108459472656, -0.21904373168945312, -0.2118663787841797, -0.20468902587890625, -0.1975116729736328, -0.19033432006835938, -0.18315696716308594, -0.1759796142578125, -0.16880226135253906, -0.16162490844726562, -0.1544475555419922, -0.14727020263671875, -0.1400928497314453, -0.13291549682617188, -0.12573814392089844, -0.118560791015625, -0.11138343811035156, -0.10420608520507812, -0.09702873229980469, -0.08985137939453125, -0.08267402648925781, -0.07549667358398438, -0.06831932067871094, -0.0611419677734375, -0.05396461486816406, -0.046787261962890625, -0.03960990905761719, -0.03243255615234375, -0.025255203247070312, -0.018077850341796875, -0.010900497436523438, -0.00372314453125, 0.0034542083740234375, 0.010631561279296875, 0.017808914184570312, 0.02498626708984375, 0.03216361999511719, 0.039340972900390625, 0.04651832580566406, 0.0536956787109375, 0.06087303161621094, 0.06805038452148438, 0.07522773742675781, 0.08240509033203125, 0.08958244323730469, 0.09675979614257812, 0.10393714904785156, 0.111114501953125, 0.11829185485839844, 0.12546920776367188, 0.1326465606689453, 0.13982391357421875, 0.1470012664794922, 0.15417861938476562, 0.16135597229003906, 0.1685333251953125, 0.17571067810058594, 0.18288803100585938, 0.1900653839111328, 0.19724273681640625, 0.2044200897216797, 0.21159744262695312, 0.21877479553222656, 0.2259521484375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 10.0, 9.0, 7.0, 7.0, 9.0, 13.0, 17.0, 15.0, 30.0, 35.0, 43.0, 62.0, 94.0, 107.0, 121.0, 94.0, 92.0, 44.0, 34.0, 26.0, 18.0, 15.0, 16.0, 17.0, 11.0, 9.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.162109375, -0.15708160400390625, -0.1520538330078125, -0.14702606201171875, -0.141998291015625, -0.13697052001953125, -0.1319427490234375, -0.12691497802734375, -0.12188720703125, -0.11685943603515625, -0.1118316650390625, -0.10680389404296875, -0.101776123046875, -0.09674835205078125, -0.0917205810546875, -0.08669281005859375, -0.0816650390625, -0.07663726806640625, -0.0716094970703125, -0.06658172607421875, -0.061553955078125, -0.05652618408203125, -0.0514984130859375, -0.04647064208984375, -0.04144287109375, -0.03641510009765625, -0.0313873291015625, -0.02635955810546875, -0.021331787109375, -0.01630401611328125, -0.0112762451171875, -0.00624847412109375, -0.001220703125, 0.00380706787109375, 0.0088348388671875, 0.01386260986328125, 0.018890380859375, 0.02391815185546875, 0.0289459228515625, 0.03397369384765625, 0.03900146484375, 0.04402923583984375, 0.0490570068359375, 0.05408477783203125, 0.059112548828125, 0.06414031982421875, 0.0691680908203125, 0.07419586181640625, 0.0792236328125, 0.08425140380859375, 0.0892791748046875, 0.09430694580078125, 0.099334716796875, 0.10436248779296875, 0.1093902587890625, 0.11441802978515625, 0.11944580078125, 0.12447357177734375, 0.1295013427734375, 0.13452911376953125, 0.139556884765625, 0.14458465576171875, 0.1496124267578125, 0.15464019775390625, 0.15966796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 27.0, 84.0, 163.0, 282.0, 257.0, 129.0, 49.0, 13.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1073641777038574, -0.9641190767288208, -0.8208739757537842, -0.6776288747787476, -0.5343837738037109, -0.3911386728286743, -0.2478935718536377, -0.10464847087860107, 0.03859663009643555, 0.18184173107147217, 0.3250868320465088, 0.4683319330215454, 0.611577033996582, 0.7548221349716187, 0.8980672359466553, 1.041312336921692, 1.1845574378967285, 1.3278025388717651, 1.4710476398468018, 1.6142927408218384, 1.757537841796875, 1.9007829427719116, 2.0440280437469482, 2.1872730255126953, 2.3305182456970215, 2.4737634658813477, 2.6170084476470947, 2.760253429412842, 2.903498649597168, 3.046743869781494, 3.189988851547241, 3.3332338333129883, 3.4764795303344727, 3.619724750518799, 3.762969732284546, 3.906214714050293, 4.049459934234619, 4.192705154418945, 4.335949897766113, 4.4791951179504395, 4.622440338134766, 4.765685558319092, 4.908930778503418, 5.052175521850586, 5.195420742034912, 5.338665962219238, 5.481910705566406, 5.625155925750732, 5.768401145935059, 5.911646366119385, 6.054891586303711, 6.198136329650879, 6.341381549835205, 6.484626770019531, 6.627871513366699, 6.771116733551025, 6.914361953735352, 7.057607173919678, 7.200852394104004, 7.344097137451172, 7.487342357635498, 7.630587577819824, 7.773832321166992, 7.917077541351318, 8.060322761535645]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 7.0, 6.0, 11.0, 13.0, 17.0, 21.0, 15.0, 9.0, 24.0, 27.0, 23.0, 21.0, 24.0, 43.0, 46.0, 36.0, 43.0, 28.0, 33.0, 38.0, 28.0, 44.0, 46.0, 40.0, 25.0, 38.0, 26.0, 40.0, 26.0, 20.0, 21.0, 23.0, 22.0, 24.0, 20.0, 6.0, 8.0, 10.0, 6.0, 8.0, 4.0, 7.0, 8.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8121540546417236, -0.783103883266449, -0.7540537118911743, -0.7250035405158997, -0.695953369140625, -0.6669031977653503, -0.6378530263900757, -0.6088029146194458, -0.5797526836395264, -0.5507025122642517, -0.521652340888977, -0.4926021695137024, -0.46355199813842773, -0.4345018267631531, -0.4054516851902008, -0.37640151381492615, -0.3473513722419739, -0.3183012008666992, -0.28925102949142456, -0.2602008581161499, -0.23115070164203644, -0.20210053026676178, -0.17305037379264832, -0.14400020241737366, -0.114950031042099, -0.08589985966682434, -0.05684969574213028, -0.027799531817436218, 0.00125063955783844, 0.030300810933113098, 0.05935096740722656, 0.08840113878250122, 0.11745131015777588, 0.14650148153305054, 0.1755516529083252, 0.20460180938243866, 0.23365198075771332, 0.26270216703414917, 0.29175230860710144, 0.3208024799823761, 0.34985265135765076, 0.3789028227329254, 0.4079529941082001, 0.43700313568115234, 0.466053307056427, 0.49510347843170166, 0.5241536498069763, 0.553203821182251, 0.5822539925575256, 0.6113041639328003, 0.640354335308075, 0.6694045066833496, 0.6984546780586243, 0.7275048494338989, 0.7565549612045288, 0.7856051921844482, 0.8146553039550781, 0.8437054753303528, 0.8727556467056274, 0.9018058180809021, 0.9308559894561768, 0.9599061608314514, 0.9889563322067261, 1.018006443977356, 1.0470566749572754]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 11.0, 14.0, 11.0, 20.0, 38.0, 52.0, 72.0, 84.0, 142.0, 222.0, 319.0, 497.0, 798.0, 1315.0, 2260.0, 4081.0, 8115.0, 16443.0, 35752.0, 85098.0, 228738.0, 840760.0, 2206996.0, 491301.0, 156436.0, 60987.0, 26436.0, 12615.0, 6436.0, 3248.0, 1828.0, 1144.0, 669.0, 434.0, 277.0, 195.0, 119.0, 110.0, 52.0, 37.0, 34.0, 24.0, 15.0, 14.0, 13.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.192626953125, -0.18627357482910156, -0.17992019653320312, -0.1735668182373047, -0.16721343994140625, -0.1608600616455078, -0.15450668334960938, -0.14815330505371094, -0.1417999267578125, -0.13544654846191406, -0.12909317016601562, -0.12273979187011719, -0.11638641357421875, -0.11003303527832031, -0.10367965698242188, -0.09732627868652344, -0.090972900390625, -0.08461952209472656, -0.07826614379882812, -0.07191276550292969, -0.06555938720703125, -0.05920600891113281, -0.052852630615234375, -0.04649925231933594, -0.0401458740234375, -0.03379249572753906, -0.027439117431640625, -0.021085739135742188, -0.01473236083984375, -0.008378982543945312, -0.002025604248046875, 0.0043277740478515625, 0.01068115234375, 0.017034530639648438, 0.023387908935546875, 0.029741287231445312, 0.03609466552734375, 0.04244804382324219, 0.048801422119140625, 0.05515480041503906, 0.0615081787109375, 0.06786155700683594, 0.07421493530273438, 0.08056831359863281, 0.08692169189453125, 0.09327507019042969, 0.09962844848632812, 0.10598182678222656, 0.112335205078125, 0.11868858337402344, 0.12504196166992188, 0.1313953399658203, 0.13774871826171875, 0.1441020965576172, 0.15045547485351562, 0.15680885314941406, 0.1631622314453125, 0.16951560974121094, 0.17586898803710938, 0.1822223663330078, 0.18857574462890625, 0.1949291229248047, 0.20128250122070312, 0.20763587951660156, 0.2139892578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 8.0, 11.0, 11.0, 22.0, 26.0, 29.0, 34.0, 37.0, 48.0, 61.0, 61.0, 62.0, 66.0, 53.0, 64.0, 57.0, 59.0, 38.0, 60.0, 37.0, 37.0, 27.0, 23.0, 15.0, 9.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.101318359375, -0.09636116027832031, -0.09140396118164062, -0.08644676208496094, -0.08148956298828125, -0.07653236389160156, -0.07157516479492188, -0.06661796569824219, -0.0616607666015625, -0.05670356750488281, -0.051746368408203125, -0.04678916931152344, -0.04183197021484375, -0.03687477111816406, -0.031917572021484375, -0.026960372924804688, -0.022003173828125, -0.017045974731445312, -0.012088775634765625, -0.0071315765380859375, -0.00217437744140625, 0.0027828216552734375, 0.007740020751953125, 0.012697219848632812, 0.0176544189453125, 0.022611618041992188, 0.027568817138671875, 0.03252601623535156, 0.03748321533203125, 0.04244041442871094, 0.047397613525390625, 0.05235481262207031, 0.05731201171875, 0.06226921081542969, 0.06722640991210938, 0.07218360900878906, 0.07714080810546875, 0.08209800720214844, 0.08705520629882812, 0.09201240539550781, 0.0969696044921875, 0.10192680358886719, 0.10688400268554688, 0.11184120178222656, 0.11679840087890625, 0.12175559997558594, 0.12671279907226562, 0.1316699981689453, 0.136627197265625, 0.1415843963623047, 0.14654159545898438, 0.15149879455566406, 0.15645599365234375, 0.16141319274902344, 0.16637039184570312, 0.1713275909423828, 0.1762847900390625, 0.1812419891357422, 0.18619918823242188, 0.19115638732910156, 0.19611358642578125, 0.20107078552246094, 0.20602798461914062, 0.2109851837158203, 0.2159423828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 14.0, 16.0, 24.0, 32.0, 44.0, 58.0, 81.0, 119.0, 151.0, 254.0, 397.0, 519.0, 816.0, 1334.0, 1961.0, 3466.0, 5898.0, 10932.0, 21002.0, 43153.0, 97026.0, 238522.0, 672722.0, 1842119.0, 779127.0, 267941.0, 107604.0, 48014.0, 22737.0, 11992.0, 6446.0, 3637.0, 2181.0, 1384.0, 849.0, 537.0, 354.0, 259.0, 162.0, 123.0, 74.0, 50.0, 44.0, 34.0, 17.0, 20.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2490234375, -0.240875244140625, -0.23272705078125, -0.224578857421875, -0.2164306640625, -0.208282470703125, -0.20013427734375, -0.191986083984375, -0.183837890625, -0.175689697265625, -0.16754150390625, -0.159393310546875, -0.1512451171875, -0.143096923828125, -0.13494873046875, -0.126800537109375, -0.11865234375, -0.110504150390625, -0.10235595703125, -0.094207763671875, -0.0860595703125, -0.077911376953125, -0.06976318359375, -0.061614990234375, -0.053466796875, -0.045318603515625, -0.03717041015625, -0.029022216796875, -0.0208740234375, -0.012725830078125, -0.00457763671875, 0.003570556640625, 0.01171875, 0.019866943359375, 0.02801513671875, 0.036163330078125, 0.0443115234375, 0.052459716796875, 0.06060791015625, 0.068756103515625, 0.076904296875, 0.085052490234375, 0.09320068359375, 0.101348876953125, 0.1094970703125, 0.117645263671875, 0.12579345703125, 0.133941650390625, 0.14208984375, 0.150238037109375, 0.15838623046875, 0.166534423828125, 0.1746826171875, 0.182830810546875, 0.19097900390625, 0.199127197265625, 0.207275390625, 0.215423583984375, 0.22357177734375, 0.231719970703125, 0.2398681640625, 0.248016357421875, 0.25616455078125, 0.264312744140625, 0.2724609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 1.0, 5.0, 12.0, 16.0, 10.0, 15.0, 21.0, 31.0, 35.0, 41.0, 70.0, 91.0, 146.0, 177.0, 253.0, 369.0, 527.0, 655.0, 464.0, 317.0, 232.0, 173.0, 104.0, 75.0, 56.0, 48.0, 26.0, 28.0, 15.0, 12.0, 6.0, 12.0, 7.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.281005859375, -0.2732830047607422, -0.2655601501464844, -0.25783729553222656, -0.25011444091796875, -0.24239158630371094, -0.23466873168945312, -0.2269458770751953, -0.2192230224609375, -0.2115001678466797, -0.20377731323242188, -0.19605445861816406, -0.18833160400390625, -0.18060874938964844, -0.17288589477539062, -0.1651630401611328, -0.157440185546875, -0.1497173309326172, -0.14199447631835938, -0.13427162170410156, -0.12654876708984375, -0.11882591247558594, -0.11110305786132812, -0.10338020324707031, -0.0956573486328125, -0.08793449401855469, -0.08021163940429688, -0.07248878479003906, -0.06476593017578125, -0.05704307556152344, -0.049320220947265625, -0.04159736633300781, -0.03387451171875, -0.026151657104492188, -0.018428802490234375, -0.010705947875976562, -0.00298309326171875, 0.0047397613525390625, 0.012462615966796875, 0.020185470581054688, 0.0279083251953125, 0.03563117980957031, 0.043354034423828125, 0.05107688903808594, 0.05879974365234375, 0.06652259826660156, 0.07424545288085938, 0.08196830749511719, 0.089691162109375, 0.09741401672363281, 0.10513687133789062, 0.11285972595214844, 0.12058258056640625, 0.12830543518066406, 0.13602828979492188, 0.1437511444091797, 0.1514739990234375, 0.1591968536376953, 0.16691970825195312, 0.17464256286621094, 0.18236541748046875, 0.19008827209472656, 0.19781112670898438, 0.2055339813232422, 0.2132568359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 6.0, 12.0, 29.0, 34.0, 53.0, 66.0, 79.0, 84.0, 75.0, 92.0, 99.0, 78.0, 70.0, 61.0, 42.0, 31.0, 28.0, 15.0, 11.0, 11.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6479687690734863, -1.604292392730713, -1.5606160163879395, -1.5169397592544556, -1.4732633829116821, -1.4295870065689087, -1.3859106302261353, -1.3422343730926514, -1.298557996749878, -1.2548816204071045, -1.211205244064331, -1.1675289869308472, -1.1238526105880737, -1.0801762342453003, -1.0364998579025269, -0.9928235411643982, -0.9491471648216248, -0.9054707884788513, -0.8617944717407227, -0.8181180953979492, -0.7744417786598206, -0.7307654023170471, -0.6870890855789185, -0.643412709236145, -0.5997363328933716, -0.5560599565505981, -0.5123836398124695, -0.46870726346969604, -0.4250309467315674, -0.38135457038879395, -0.3376782238483429, -0.29400187730789185, -0.2503255605697632, -0.20664921402931213, -0.16297286748886108, -0.11929650604724884, -0.07562015950679779, -0.03194381296634674, 0.011732548475265503, 0.05540889501571655, 0.0990852415561676, 0.14276158809661865, 0.1864379346370697, 0.23011429607868195, 0.2737906575202942, 0.31746697425842285, 0.3611433506011963, 0.40481969714164734, 0.4484960436820984, 0.49217239022254944, 0.5358487367630005, 0.5795251131057739, 0.6232014298439026, 0.666877806186676, 0.7105541229248047, 0.7542304992675781, 0.7979068756103516, 0.841583251953125, 0.8852595686912537, 0.9289359450340271, 0.9726122617721558, 1.0162886381149292, 1.0599650144577026, 1.1036412715911865, 1.14731764793396]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 5.0, 6.0, 4.0, 9.0, 12.0, 10.0, 20.0, 13.0, 24.0, 18.0, 19.0, 18.0, 31.0, 30.0, 23.0, 31.0, 45.0, 40.0, 30.0, 39.0, 36.0, 44.0, 33.0, 43.0, 47.0, 39.0, 27.0, 40.0, 30.0, 38.0, 34.0, 25.0, 14.0, 21.0, 15.0, 21.0, 22.0, 8.0, 8.0, 10.0, 5.0, 7.0, 3.0, 0.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7765210270881653, -0.7536066174507141, -0.7306922674179077, -0.7077778577804565, -0.6848634481430054, -0.661949098110199, -0.6390346884727478, -0.6161203384399414, -0.5932059288024902, -0.5702915191650391, -0.5473771691322327, -0.5244627594947815, -0.5015484094619751, -0.4786339998245239, -0.45571959018707275, -0.43280521035194397, -0.4098908305168152, -0.3869764506816864, -0.3640620708465576, -0.34114766120910645, -0.31823328137397766, -0.2953189015388489, -0.2724044919013977, -0.24949011206626892, -0.22657573223114014, -0.20366135239601135, -0.18074695765972137, -0.1578325629234314, -0.1349181830883026, -0.11200379580259323, -0.08908940851688385, -0.06617501378059387, -0.04326069355010986, -0.020346306264400482, 0.002568081021308899, 0.02548246830701828, 0.04839685559272766, 0.07131124287843704, 0.09422563016414642, 0.1171400249004364, 0.14005440473556519, 0.16296878457069397, 0.18588317930698395, 0.20879757404327393, 0.2317119538784027, 0.2546263337135315, 0.27754074335098267, 0.30045512318611145, 0.32336950302124023, 0.346283882856369, 0.3691982626914978, 0.392112672328949, 0.41502705216407776, 0.43794143199920654, 0.4608558416366577, 0.4837702214717865, 0.5066846013069153, 0.5295990109443665, 0.5525133609771729, 0.575427770614624, 0.5983421802520752, 0.6212565302848816, 0.6441709399223328, 0.6670852899551392, 0.6899996995925903]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 8.0, 12.0, 8.0, 21.0, 25.0, 31.0, 77.0, 84.0, 127.0, 199.0, 293.0, 489.0, 720.0, 1196.0, 1932.0, 2936.0, 4544.0, 7317.0, 11663.0, 18671.0, 29895.0, 49802.0, 83304.0, 136979.0, 192500.0, 185137.0, 126209.0, 75451.0, 45138.0, 27466.0, 17256.0, 10505.0, 6872.0, 4277.0, 2734.0, 1666.0, 984.0, 735.0, 435.0, 293.0, 163.0, 142.0, 86.0, 58.0, 45.0, 18.0, 14.0, 15.0, 7.0, 7.0, 1.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.16943359375, -0.16395187377929688, -0.15847015380859375, -0.15298843383789062, -0.1475067138671875, -0.14202499389648438, -0.13654327392578125, -0.13106155395507812, -0.125579833984375, -0.12009811401367188, -0.11461639404296875, -0.10913467407226562, -0.1036529541015625, -0.09817123413085938, -0.09268951416015625, -0.08720779418945312, -0.08172607421875, -0.07624435424804688, -0.07076263427734375, -0.06528091430664062, -0.0597991943359375, -0.054317474365234375, -0.04883575439453125, -0.043354034423828125, -0.037872314453125, -0.032390594482421875, -0.02690887451171875, -0.021427154541015625, -0.0159454345703125, -0.010463714599609375, -0.00498199462890625, 0.000499725341796875, 0.0059814453125, 0.011463165283203125, 0.01694488525390625, 0.022426605224609375, 0.0279083251953125, 0.033390045166015625, 0.03887176513671875, 0.044353485107421875, 0.049835205078125, 0.055316925048828125, 0.06079864501953125, 0.06628036499023438, 0.0717620849609375, 0.07724380493164062, 0.08272552490234375, 0.08820724487304688, 0.09368896484375, 0.09917068481445312, 0.10465240478515625, 0.11013412475585938, 0.1156158447265625, 0.12109756469726562, 0.12657928466796875, 0.13206100463867188, 0.137542724609375, 0.14302444458007812, 0.14850616455078125, 0.15398788452148438, 0.1594696044921875, 0.16495132446289062, 0.17043304443359375, 0.17591476440429688, 0.181396484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 11.0, 10.0, 11.0, 12.0, 26.0, 24.0, 33.0, 30.0, 45.0, 37.0, 47.0, 56.0, 64.0, 55.0, 67.0, 70.0, 62.0, 44.0, 44.0, 43.0, 37.0, 45.0, 26.0, 20.0, 21.0, 19.0, 17.0, 6.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.1123952865600586, -0.10693168640136719, -0.10146808624267578, -0.09600448608398438, -0.09054088592529297, -0.08507728576660156, -0.07961368560791016, -0.07415008544921875, -0.06868648529052734, -0.06322288513183594, -0.05775928497314453, -0.052295684814453125, -0.04683208465576172, -0.04136848449707031, -0.035904884338378906, -0.0304412841796875, -0.024977684020996094, -0.019514083862304688, -0.014050483703613281, -0.008586883544921875, -0.0031232833862304688, 0.0023403167724609375, 0.007803916931152344, 0.01326751708984375, 0.018731117248535156, 0.024194717407226562, 0.02965831756591797, 0.035121917724609375, 0.04058551788330078, 0.04604911804199219, 0.051512718200683594, 0.056976318359375, 0.062439918518066406, 0.06790351867675781, 0.07336711883544922, 0.07883071899414062, 0.08429431915283203, 0.08975791931152344, 0.09522151947021484, 0.10068511962890625, 0.10614871978759766, 0.11161231994628906, 0.11707592010498047, 0.12253952026367188, 0.12800312042236328, 0.1334667205810547, 0.1389303207397461, 0.1443939208984375, 0.1498575210571289, 0.1553211212158203, 0.16078472137451172, 0.16624832153320312, 0.17171192169189453, 0.17717552185058594, 0.18263912200927734, 0.18810272216796875, 0.19356632232666016, 0.19902992248535156, 0.20449352264404297, 0.20995712280273438, 0.21542072296142578, 0.2208843231201172, 0.2263479232788086, 0.2318115234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 12.0, 12.0, 24.0, 28.0, 47.0, 70.0, 122.0, 230.0, 561.0, 1263.0, 3647.0, 10277.0, 30220.0, 99236.0, 350242.0, 386133.0, 114194.0, 34157.0, 11436.0, 3983.0, 1493.0, 565.0, 248.0, 122.0, 58.0, 45.0, 29.0, 11.0, 21.0, 13.0, 9.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.425048828125, -0.4113616943359375, -0.397674560546875, -0.3839874267578125, -0.37030029296875, -0.3566131591796875, -0.342926025390625, -0.3292388916015625, -0.3155517578125, -0.3018646240234375, -0.288177490234375, -0.2744903564453125, -0.26080322265625, -0.2471160888671875, -0.233428955078125, -0.2197418212890625, -0.2060546875, -0.1923675537109375, -0.178680419921875, -0.1649932861328125, -0.15130615234375, -0.1376190185546875, -0.123931884765625, -0.1102447509765625, -0.0965576171875, -0.0828704833984375, -0.069183349609375, -0.0554962158203125, -0.04180908203125, -0.0281219482421875, -0.014434814453125, -0.0007476806640625, 0.012939453125, 0.0266265869140625, 0.040313720703125, 0.0540008544921875, 0.06768798828125, 0.0813751220703125, 0.095062255859375, 0.1087493896484375, 0.1224365234375, 0.1361236572265625, 0.149810791015625, 0.1634979248046875, 0.17718505859375, 0.1908721923828125, 0.204559326171875, 0.2182464599609375, 0.23193359375, 0.2456207275390625, 0.259307861328125, 0.2729949951171875, 0.28668212890625, 0.3003692626953125, 0.314056396484375, 0.3277435302734375, 0.3414306640625, 0.3551177978515625, 0.368804931640625, 0.3824920654296875, 0.39617919921875, 0.4098663330078125, 0.423553466796875, 0.4372406005859375, 0.450927734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 7.0, 8.0, 9.0, 20.0, 19.0, 18.0, 17.0, 27.0, 27.0, 28.0, 41.0, 59.0, 49.0, 36.0, 47.0, 58.0, 39.0, 43.0, 38.0, 48.0, 47.0, 45.0, 37.0, 37.0, 33.0, 36.0, 24.0, 17.0, 13.0, 12.0, 4.0, 6.0, 2.0, 7.0, 8.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.431396484375, -0.4179801940917969, -0.40456390380859375, -0.3911476135253906, -0.3777313232421875, -0.3643150329589844, -0.35089874267578125, -0.3374824523925781, -0.324066162109375, -0.3106498718261719, -0.29723358154296875, -0.2838172912597656, -0.2704010009765625, -0.2569847106933594, -0.24356842041015625, -0.23015213012695312, -0.21673583984375, -0.20331954956054688, -0.18990325927734375, -0.17648696899414062, -0.1630706787109375, -0.14965438842773438, -0.13623809814453125, -0.12282180786132812, -0.109405517578125, -0.09598922729492188, -0.08257293701171875, -0.06915664672851562, -0.0557403564453125, -0.042324066162109375, -0.02890777587890625, -0.015491485595703125, -0.0020751953125, 0.011341094970703125, 0.02475738525390625, 0.038173675537109375, 0.0515899658203125, 0.06500625610351562, 0.07842254638671875, 0.09183883666992188, 0.105255126953125, 0.11867141723632812, 0.13208770751953125, 0.14550399780273438, 0.1589202880859375, 0.17233657836914062, 0.18575286865234375, 0.19916915893554688, 0.21258544921875, 0.22600173950195312, 0.23941802978515625, 0.2528343200683594, 0.2662506103515625, 0.2796669006347656, 0.29308319091796875, 0.3064994812011719, 0.319915771484375, 0.3333320617675781, 0.34674835205078125, 0.3601646423339844, 0.3735809326171875, 0.3869972229003906, 0.40041351318359375, 0.4138298034667969, 0.42724609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 11.0, 12.0, 19.0, 21.0, 39.0, 44.0, 69.0, 105.0, 146.0, 288.0, 416.0, 788.0, 1425.0, 2600.0, 5169.0, 10262.0, 21629.0, 47171.0, 110137.0, 312352.0, 325625.0, 116226.0, 49385.0, 22500.0, 10638.0, 5262.0, 2646.0, 1529.0, 792.0, 451.0, 279.0, 171.0, 119.0, 65.0, 47.0, 32.0, 27.0, 20.0, 13.0, 4.0, 1.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.164306640625, -0.15883445739746094, -0.15336227416992188, -0.1478900909423828, -0.14241790771484375, -0.1369457244873047, -0.13147354125976562, -0.12600135803222656, -0.1205291748046875, -0.11505699157714844, -0.10958480834960938, -0.10411262512207031, -0.09864044189453125, -0.09316825866699219, -0.08769607543945312, -0.08222389221191406, -0.076751708984375, -0.07127952575683594, -0.06580734252929688, -0.06033515930175781, -0.05486297607421875, -0.04939079284667969, -0.043918609619140625, -0.03844642639160156, -0.0329742431640625, -0.027502059936523438, -0.022029876708984375, -0.016557693481445312, -0.01108551025390625, -0.0056133270263671875, -0.000141143798828125, 0.0053310394287109375, 0.01080322265625, 0.016275405883789062, 0.021747589111328125, 0.027219772338867188, 0.03269195556640625, 0.03816413879394531, 0.043636322021484375, 0.04910850524902344, 0.0545806884765625, 0.06005287170410156, 0.06552505493164062, 0.07099723815917969, 0.07646942138671875, 0.08194160461425781, 0.08741378784179688, 0.09288597106933594, 0.098358154296875, 0.10383033752441406, 0.10930252075195312, 0.11477470397949219, 0.12024688720703125, 0.1257190704345703, 0.13119125366210938, 0.13666343688964844, 0.1421356201171875, 0.14760780334472656, 0.15307998657226562, 0.1585521697998047, 0.16402435302734375, 0.1694965362548828, 0.17496871948242188, 0.18044090270996094, 0.1859130859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 16.0, 15.0, 15.0, 25.0, 38.0, 54.0, 99.0, 145.0, 203.0, 153.0, 64.0, 49.0, 35.0, 33.0, 16.0, 8.0, 9.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0187110900878906e-05, -4.820898175239563e-05, -4.6230852603912354e-05, -4.425272345542908e-05, -4.22745943069458e-05, -4.0296465158462524e-05, -3.831833600997925e-05, -3.634020686149597e-05, -3.4362077713012695e-05, -3.238394856452942e-05, -3.0405819416046143e-05, -2.8427690267562866e-05, -2.644956111907959e-05, -2.4471431970596313e-05, -2.2493302822113037e-05, -2.051517367362976e-05, -1.8537044525146484e-05, -1.6558915376663208e-05, -1.4580786228179932e-05, -1.2602657079696655e-05, -1.0624527931213379e-05, -8.646398782730103e-06, -6.668269634246826e-06, -4.69014048576355e-06, -2.7120113372802734e-06, -7.338821887969971e-07, 1.2442469596862793e-06, 3.2223761081695557e-06, 5.200505256652832e-06, 7.178634405136108e-06, 9.156763553619385e-06, 1.1134892702102661e-05, 1.3113021850585938e-05, 1.5091150999069214e-05, 1.706928014755249e-05, 1.9047409296035767e-05, 2.1025538444519043e-05, 2.300366759300232e-05, 2.4981796741485596e-05, 2.6959925889968872e-05, 2.893805503845215e-05, 3.0916184186935425e-05, 3.28943133354187e-05, 3.487244248390198e-05, 3.6850571632385254e-05, 3.882870078086853e-05, 4.080682992935181e-05, 4.278495907783508e-05, 4.476308822631836e-05, 4.6741217374801636e-05, 4.871934652328491e-05, 5.069747567176819e-05, 5.2675604820251465e-05, 5.465373396873474e-05, 5.663186311721802e-05, 5.8609992265701294e-05, 6.058812141418457e-05, 6.256625056266785e-05, 6.454437971115112e-05, 6.65225088596344e-05, 6.850063800811768e-05, 7.047876715660095e-05, 7.245689630508423e-05, 7.44350254535675e-05, 7.641315460205078e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 15.0, 9.0, 28.0, 40.0, 37.0, 73.0, 127.0, 185.0, 310.0, 508.0, 983.0, 1972.0, 4536.0, 11369.0, 31597.0, 93028.0, 375199.0, 380796.0, 95111.0, 32235.0, 11679.0, 4653.0, 1916.0, 920.0, 466.0, 245.0, 166.0, 122.0, 76.0, 39.0, 40.0, 24.0, 13.0, 7.0, 6.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.287353515625, -0.2795886993408203, -0.2718238830566406, -0.26405906677246094, -0.25629425048828125, -0.24852943420410156, -0.24076461791992188, -0.2329998016357422, -0.2252349853515625, -0.2174701690673828, -0.20970535278320312, -0.20194053649902344, -0.19417572021484375, -0.18641090393066406, -0.17864608764648438, -0.1708812713623047, -0.163116455078125, -0.1553516387939453, -0.14758682250976562, -0.13982200622558594, -0.13205718994140625, -0.12429237365722656, -0.11652755737304688, -0.10876274108886719, -0.1009979248046875, -0.09323310852050781, -0.08546829223632812, -0.07770347595214844, -0.06993865966796875, -0.06217384338378906, -0.054409027099609375, -0.04664421081542969, -0.03887939453125, -0.031114578247070312, -0.023349761962890625, -0.015584945678710938, -0.00782012939453125, -5.53131103515625e-05, 0.007709503173828125, 0.015474319458007812, 0.0232391357421875, 0.031003952026367188, 0.038768768310546875, 0.04653358459472656, 0.05429840087890625, 0.06206321716308594, 0.06982803344726562, 0.07759284973144531, 0.085357666015625, 0.09312248229980469, 0.10088729858398438, 0.10865211486816406, 0.11641693115234375, 0.12418174743652344, 0.13194656372070312, 0.1397113800048828, 0.1474761962890625, 0.1552410125732422, 0.16300582885742188, 0.17077064514160156, 0.17853546142578125, 0.18630027770996094, 0.19406509399414062, 0.2018299102783203, 0.2095947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 10.0, 17.0, 18.0, 25.0, 37.0, 64.0, 126.0, 162.0, 190.0, 109.0, 71.0, 41.0, 28.0, 22.0, 18.0, 19.0, 5.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.246337890625, -0.23785781860351562, -0.22937774658203125, -0.22089767456054688, -0.2124176025390625, -0.20393753051757812, -0.19545745849609375, -0.18697738647460938, -0.178497314453125, -0.17001724243164062, -0.16153717041015625, -0.15305709838867188, -0.1445770263671875, -0.13609695434570312, -0.12761688232421875, -0.11913681030273438, -0.11065673828125, -0.10217666625976562, -0.09369659423828125, -0.08521652221679688, -0.0767364501953125, -0.06825637817382812, -0.05977630615234375, -0.051296234130859375, -0.042816162109375, -0.034336090087890625, -0.02585601806640625, -0.017375946044921875, -0.0088958740234375, -0.000415802001953125, 0.00806427001953125, 0.016544342041015625, 0.0250244140625, 0.033504486083984375, 0.04198455810546875, 0.050464630126953125, 0.0589447021484375, 0.06742477416992188, 0.07590484619140625, 0.08438491821289062, 0.092864990234375, 0.10134506225585938, 0.10982513427734375, 0.11830520629882812, 0.1267852783203125, 0.13526535034179688, 0.14374542236328125, 0.15222549438476562, 0.16070556640625, 0.16918563842773438, 0.17766571044921875, 0.18614578247070312, 0.1946258544921875, 0.20310592651367188, 0.21158599853515625, 0.22006607055664062, 0.228546142578125, 0.23702621459960938, 0.24550628662109375, 0.2539863586425781, 0.2624664306640625, 0.2709465026855469, 0.27942657470703125, 0.2879066467285156, 0.29638671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 45.0, 266.0, 482.0, 193.0, 24.0, 2.0, 1.0], "bins": [-16.446990966796875, -16.1691837310791, -15.891377449035645, -15.613570213317871, -15.335763931274414, -15.05795669555664, -14.780150413513184, -14.50234317779541, -14.224536895751953, -13.94672966003418, -13.668923377990723, -13.39111614227295, -13.113309860229492, -12.835502624511719, -12.557696342468262, -12.279889106750488, -12.002082824707031, -11.724275588989258, -11.4464693069458, -11.168662071228027, -10.89085578918457, -10.613048553466797, -10.33524227142334, -10.057435035705566, -9.779627799987793, -9.50182056427002, -9.224014282226562, -8.946207046508789, -8.668400764465332, -8.390593528747559, -8.112787246704102, -7.834980010986328, -7.557173728942871, -7.279366970062256, -7.001560211181641, -6.723753452301025, -6.44594669342041, -6.168139934539795, -5.89033317565918, -5.612525939941406, -5.334719181060791, -5.056912422180176, -4.7791056632995605, -4.501298904418945, -4.22349214553833, -3.945685386657715, -3.6678783893585205, -3.3900716304779053, -3.112265110015869, -2.834458351135254, -2.5566515922546387, -2.2788448333740234, -2.001038074493408, -1.7232311964035034, -1.4454243183135986, -1.1676175594329834, -0.8898106813430786, -0.6120039224624634, -0.33419710397720337, -0.05639028549194336, 0.22141647338867188, 0.4992232322692871, 0.7770301103591919, 1.0548368692398071, 1.3326436281204224]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 14.0, 6.0, 5.0, 9.0, 24.0, 15.0, 28.0, 32.0, 28.0, 34.0, 33.0, 37.0, 38.0, 42.0, 53.0, 63.0, 67.0, 51.0, 44.0, 63.0, 54.0, 43.0, 31.0, 37.0, 29.0, 31.0, 23.0, 17.0, 11.0, 11.0, 10.0, 8.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.956747829914093, -0.9150879979133606, -0.873428225517273, -0.8317683935165405, -0.7901085615158081, -0.7484487295150757, -0.706788957118988, -0.6651291251182556, -0.623469352722168, -0.5818095207214355, -0.5401497483253479, -0.4984899163246155, -0.45683008432388306, -0.415170282125473, -0.373510479927063, -0.33185064792633057, -0.29019081592559814, -0.24853099882602692, -0.2068711817264557, -0.16521137952804565, -0.12355156242847443, -0.0818917453289032, -0.040231943130493164, 0.0014278888702392578, 0.04308769106864929, 0.08474750816822052, 0.12640732526779175, 0.16806712746620178, 0.209726944565773, 0.25138676166534424, 0.2930465638637543, 0.3347063958644867, 0.3763662576675415, 0.41802605986595154, 0.45968589186668396, 0.501345694065094, 0.5430055260658264, 0.5846652984619141, 0.6263251304626465, 0.6679849624633789, 0.7096447944641113, 0.7513046264648438, 0.7929643988609314, 0.8346242308616638, 0.8762840628623962, 0.9179438352584839, 0.9596036672592163, 1.0012634992599487, 1.0429232120513916, 1.084583044052124, 1.1262428760528564, 1.1679027080535889, 1.2095624208450317, 1.2512222528457642, 1.2928820848464966, 1.334541916847229, 1.3762017488479614, 1.4178615808486938, 1.4595214128494263, 1.5011811256408691, 1.5428409576416016, 1.584500789642334, 1.6261606216430664, 1.6678204536437988, 1.7094802856445312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 3.0, 9.0, 15.0, 14.0, 17.0, 19.0, 40.0, 58.0, 67.0, 113.0, 158.0, 214.0, 345.0, 580.0, 843.0, 1438.0, 2437.0, 4595.0, 9366.0, 19759.0, 46586.0, 122861.0, 399964.0, 1914837.0, 1238912.0, 273725.0, 90886.0, 35022.0, 15005.0, 7262.0, 3700.0, 2082.0, 1229.0, 697.0, 462.0, 294.0, 217.0, 136.0, 109.0, 63.0, 39.0, 26.0, 26.0, 9.0, 12.0, 12.0, 4.0, 4.0, 4.0, 1.0, 2.0, 6.0], "bins": [-0.290283203125, -0.28218650817871094, -0.2740898132324219, -0.2659931182861328, -0.25789642333984375, -0.2497997283935547, -0.24170303344726562, -0.23360633850097656, -0.2255096435546875, -0.21741294860839844, -0.20931625366210938, -0.2012195587158203, -0.19312286376953125, -0.1850261688232422, -0.17692947387695312, -0.16883277893066406, -0.160736083984375, -0.15263938903808594, -0.14454269409179688, -0.1364459991455078, -0.12834930419921875, -0.12025260925292969, -0.11215591430664062, -0.10405921936035156, -0.0959625244140625, -0.08786582946777344, -0.07976913452148438, -0.07167243957519531, -0.06357574462890625, -0.05547904968261719, -0.047382354736328125, -0.03928565979003906, -0.03118896484375, -0.023092269897460938, -0.014995574951171875, -0.0068988800048828125, 0.00119781494140625, 0.009294509887695312, 0.017391204833984375, 0.025487899780273438, 0.0335845947265625, 0.04168128967285156, 0.049777984619140625, 0.05787467956542969, 0.06597137451171875, 0.07406806945800781, 0.08216476440429688, 0.09026145935058594, 0.098358154296875, 0.10645484924316406, 0.11455154418945312, 0.12264823913574219, 0.13074493408203125, 0.1388416290283203, 0.14693832397460938, 0.15503501892089844, 0.1631317138671875, 0.17122840881347656, 0.17932510375976562, 0.1874217987060547, 0.19551849365234375, 0.2036151885986328, 0.21171188354492188, 0.21980857849121094, 0.2279052734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 13.0, 13.0, 14.0, 11.0, 24.0, 29.0, 27.0, 22.0, 44.0, 28.0, 49.0, 38.0, 47.0, 39.0, 38.0, 63.0, 62.0, 57.0, 43.0, 36.0, 44.0, 39.0, 49.0, 28.0, 25.0, 24.0, 17.0, 15.0, 16.0, 9.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10968017578125, -0.10486888885498047, -0.10005760192871094, -0.0952463150024414, -0.09043502807617188, -0.08562374114990234, -0.08081245422363281, -0.07600116729736328, -0.07118988037109375, -0.06637859344482422, -0.06156730651855469, -0.056756019592285156, -0.051944732666015625, -0.047133445739746094, -0.04232215881347656, -0.03751087188720703, -0.0326995849609375, -0.02788829803466797, -0.023077011108398438, -0.018265724182128906, -0.013454437255859375, -0.008643150329589844, -0.0038318634033203125, 0.0009794235229492188, 0.00579071044921875, 0.010601997375488281, 0.015413284301757812, 0.020224571228027344, 0.025035858154296875, 0.029847145080566406, 0.03465843200683594, 0.03946971893310547, 0.044281005859375, 0.04909229278564453, 0.05390357971191406, 0.058714866638183594, 0.06352615356445312, 0.06833744049072266, 0.07314872741699219, 0.07796001434326172, 0.08277130126953125, 0.08758258819580078, 0.09239387512207031, 0.09720516204833984, 0.10201644897460938, 0.1068277359008789, 0.11163902282714844, 0.11645030975341797, 0.1212615966796875, 0.12607288360595703, 0.13088417053222656, 0.1356954574584961, 0.14050674438476562, 0.14531803131103516, 0.1501293182373047, 0.15494060516357422, 0.15975189208984375, 0.16456317901611328, 0.1693744659423828, 0.17418575286865234, 0.17899703979492188, 0.1838083267211914, 0.18861961364746094, 0.19343090057373047, 0.1982421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 13.0, 21.0, 18.0, 34.0, 57.0, 73.0, 103.0, 172.0, 243.0, 379.0, 605.0, 940.0, 1576.0, 2720.0, 4943.0, 8935.0, 18084.0, 39448.0, 95700.0, 261971.0, 904187.0, 1954870.0, 579441.0, 186499.0, 70912.0, 30744.0, 14455.0, 7356.0, 3948.0, 2218.0, 1324.0, 829.0, 522.0, 325.0, 225.0, 150.0, 86.0, 58.0, 35.0, 24.0, 13.0, 9.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3173828125, -0.3072547912597656, -0.29712677001953125, -0.2869987487792969, -0.2768707275390625, -0.2667427062988281, -0.25661468505859375, -0.24648666381835938, -0.236358642578125, -0.22623062133789062, -0.21610260009765625, -0.20597457885742188, -0.1958465576171875, -0.18571853637695312, -0.17559051513671875, -0.16546249389648438, -0.15533447265625, -0.14520645141601562, -0.13507843017578125, -0.12495040893554688, -0.1148223876953125, -0.10469436645507812, -0.09456634521484375, -0.08443832397460938, -0.074310302734375, -0.06418228149414062, -0.05405426025390625, -0.043926239013671875, -0.0337982177734375, -0.023670196533203125, -0.01354217529296875, -0.003414154052734375, 0.0067138671875, 0.016841888427734375, 0.02696990966796875, 0.037097930908203125, 0.0472259521484375, 0.057353973388671875, 0.06748199462890625, 0.07761001586914062, 0.087738037109375, 0.09786605834960938, 0.10799407958984375, 0.11812210083007812, 0.1282501220703125, 0.13837814331054688, 0.14850616455078125, 0.15863418579101562, 0.16876220703125, 0.17889022827148438, 0.18901824951171875, 0.19914627075195312, 0.2092742919921875, 0.21940231323242188, 0.22953033447265625, 0.23965835571289062, 0.249786376953125, 0.2599143981933594, 0.27004241943359375, 0.2801704406738281, 0.2902984619140625, 0.3004264831542969, 0.31055450439453125, 0.3206825256347656, 0.330810546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 13.0, 10.0, 8.0, 15.0, 11.0, 22.0, 29.0, 39.0, 60.0, 85.0, 110.0, 166.0, 237.0, 360.0, 563.0, 745.0, 543.0, 330.0, 221.0, 158.0, 99.0, 73.0, 58.0, 35.0, 20.0, 13.0, 10.0, 8.0, 6.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34033203125, -0.3283576965332031, -0.31638336181640625, -0.3044090270996094, -0.2924346923828125, -0.2804603576660156, -0.26848602294921875, -0.2565116882324219, -0.244537353515625, -0.23256301879882812, -0.22058868408203125, -0.20861434936523438, -0.1966400146484375, -0.18466567993164062, -0.17269134521484375, -0.16071701049804688, -0.14874267578125, -0.13676834106445312, -0.12479400634765625, -0.11281967163085938, -0.1008453369140625, -0.08887100219726562, -0.07689666748046875, -0.06492233276367188, -0.052947998046875, -0.040973663330078125, -0.02899932861328125, -0.017024993896484375, -0.0050506591796875, 0.006923675537109375, 0.01889801025390625, 0.030872344970703125, 0.0428466796875, 0.054821014404296875, 0.06679534912109375, 0.07876968383789062, 0.0907440185546875, 0.10271835327148438, 0.11469268798828125, 0.12666702270507812, 0.138641357421875, 0.15061569213867188, 0.16259002685546875, 0.17456436157226562, 0.1865386962890625, 0.19851303100585938, 0.21048736572265625, 0.22246170043945312, 0.23443603515625, 0.24641036987304688, 0.25838470458984375, 0.2703590393066406, 0.2823333740234375, 0.2943077087402344, 0.30628204345703125, 0.3182563781738281, 0.330230712890625, 0.3422050476074219, 0.35417938232421875, 0.3661537170410156, 0.3781280517578125, 0.3901023864746094, 0.40207672119140625, 0.4140510559082031, 0.426025390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 6.0, 7.0, 10.0, 16.0, 20.0, 38.0, 38.0, 54.0, 62.0, 74.0, 99.0, 99.0, 80.0, 87.0, 71.0, 61.0, 48.0, 29.0, 28.0, 19.0, 18.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4691505432128906, -1.4128050804138184, -1.3564597368240356, -1.3001142740249634, -1.2437689304351807, -1.1874234676361084, -1.1310780048370361, -1.0747326612472534, -1.0183873176574707, -0.9620419144630432, -0.9056965112686157, -0.8493510484695435, -0.7930057048797607, -0.7366602420806885, -0.680314838886261, -0.6239694356918335, -0.5676239728927612, -0.5112785696983337, -0.45493316650390625, -0.39858773350715637, -0.3422423303127289, -0.2858969271183014, -0.2295514941215515, -0.17320609092712402, -0.11686068773269653, -0.060515277087688446, -0.004169866442680359, 0.052175551652908325, 0.10852095484733582, 0.1648663580417633, 0.22121179103851318, 0.2775571942329407, 0.33390259742736816, 0.39024800062179565, 0.44659340381622314, 0.5029388666152954, 0.5592842102050781, 0.6156296730041504, 0.6719750761985779, 0.7283204793930054, 0.7846658825874329, 0.8410112857818604, 0.8973566889762878, 0.9537020921707153, 1.0100475549697876, 1.0663928985595703, 1.1227383613586426, 1.1790838241577148, 1.2354291677474976, 1.2917746305465698, 1.3481199741363525, 1.4044654369354248, 1.4608107805252075, 1.5171562433242798, 1.5735015869140625, 1.6298470497131348, 1.686192512512207, 1.7425379753112793, 1.798883318901062, 1.8552287817001343, 1.911574125289917, 1.9679195880889893, 2.0242650508880615, 2.0806102752685547, 2.136955738067627]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 8.0, 10.0, 15.0, 9.0, 8.0, 13.0, 16.0, 18.0, 13.0, 28.0, 25.0, 23.0, 30.0, 40.0, 46.0, 41.0, 42.0, 41.0, 38.0, 48.0, 29.0, 40.0, 32.0, 39.0, 40.0, 31.0, 30.0, 25.0, 23.0, 37.0, 26.0, 17.0, 14.0, 13.0, 17.0, 12.0, 13.0, 10.0, 9.0, 5.0, 9.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0113821029663086, -0.9774859547615051, -0.9435898661613464, -0.909693717956543, -0.8757976293563843, -0.8419014811515808, -0.8080053329467773, -0.7741092443466187, -0.7402130961418152, -0.7063169479370117, -0.672420859336853, -0.6385247111320496, -0.6046285629272461, -0.5707324743270874, -0.5368363261222839, -0.5029401779174805, -0.4690440893173218, -0.4351479709148407, -0.4012518525123596, -0.36735570430755615, -0.3334595859050751, -0.299563467502594, -0.2656673192977905, -0.23177120089530945, -0.19787508249282837, -0.1639789640903473, -0.13008283078670502, -0.09618670493364334, -0.062290579080581665, -0.028394460678100586, 0.005501672625541687, 0.03939780592918396, 0.07329380512237549, 0.10718993097543716, 0.14108605682849884, 0.1749821901321411, 0.2088783085346222, 0.24277442693710327, 0.27667057514190674, 0.3105666935443878, 0.3444628119468689, 0.37835893034935, 0.41225504875183105, 0.4461511969566345, 0.4800473153591156, 0.5139434337615967, 0.5478395819664001, 0.5817357301712036, 0.6156318187713623, 0.6495279669761658, 0.6834240555763245, 0.7173202037811279, 0.7512162923812866, 0.7851124405860901, 0.8190085887908936, 0.8529046773910522, 0.8868008255958557, 0.9206969738006592, 0.9545930624008179, 0.9884892106056213, 1.0223853588104248, 1.0562814474105835, 1.0901775360107422, 1.1240737438201904, 1.1579698324203491]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 12.0, 17.0, 33.0, 48.0, 74.0, 123.0, 195.0, 342.0, 514.0, 768.0, 1303.0, 2020.0, 3343.0, 5304.0, 8951.0, 14898.0, 24758.0, 42582.0, 74987.0, 134257.0, 224607.0, 216027.0, 124478.0, 69838.0, 39841.0, 23395.0, 13794.0, 8434.0, 5176.0, 3241.0, 2025.0, 1179.0, 725.0, 472.0, 290.0, 178.0, 116.0, 70.0, 43.0, 36.0, 24.0, 11.0, 9.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.2555732727050781, -0.24674224853515625, -0.23791122436523438, -0.2290802001953125, -0.22024917602539062, -0.21141815185546875, -0.20258712768554688, -0.193756103515625, -0.18492507934570312, -0.17609405517578125, -0.16726303100585938, -0.1584320068359375, -0.14960098266601562, -0.14076995849609375, -0.13193893432617188, -0.12310791015625, -0.11427688598632812, -0.10544586181640625, -0.09661483764648438, -0.0877838134765625, -0.07895278930664062, -0.07012176513671875, -0.061290740966796875, -0.052459716796875, -0.043628692626953125, -0.03479766845703125, -0.025966644287109375, -0.0171356201171875, -0.008304595947265625, 0.00052642822265625, 0.009357452392578125, 0.0181884765625, 0.027019500732421875, 0.03585052490234375, 0.044681549072265625, 0.0535125732421875, 0.062343597412109375, 0.07117462158203125, 0.08000564575195312, 0.088836669921875, 0.09766769409179688, 0.10649871826171875, 0.11532974243164062, 0.1241607666015625, 0.13299179077148438, 0.14182281494140625, 0.15065383911132812, 0.15948486328125, 0.16831588745117188, 0.17714691162109375, 0.18597793579101562, 0.1948089599609375, 0.20363998413085938, 0.21247100830078125, 0.22130203247070312, 0.230133056640625, 0.23896408081054688, 0.24779510498046875, 0.2566261291503906, 0.2654571533203125, 0.2742881774902344, 0.28311920166015625, 0.2919502258300781, 0.30078125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 2.0, 10.0, 12.0, 9.0, 20.0, 21.0, 22.0, 30.0, 34.0, 33.0, 30.0, 35.0, 38.0, 36.0, 43.0, 65.0, 58.0, 47.0, 55.0, 55.0, 47.0, 43.0, 35.0, 34.0, 29.0, 45.0, 26.0, 12.0, 19.0, 12.0, 15.0, 10.0, 3.0, 2.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.13978004455566406, -0.13417434692382812, -0.1285686492919922, -0.12296295166015625, -0.11735725402832031, -0.11175155639648438, -0.10614585876464844, -0.1005401611328125, -0.09493446350097656, -0.08932876586914062, -0.08372306823730469, -0.07811737060546875, -0.07251167297363281, -0.06690597534179688, -0.06130027770996094, -0.055694580078125, -0.05008888244628906, -0.044483184814453125, -0.03887748718261719, -0.03327178955078125, -0.027666091918945312, -0.022060394287109375, -0.016454696655273438, -0.0108489990234375, -0.0052433013916015625, 0.000362396240234375, 0.0059680938720703125, 0.01157379150390625, 0.017179489135742188, 0.022785186767578125, 0.028390884399414062, 0.03399658203125, 0.03960227966308594, 0.045207977294921875, 0.05081367492675781, 0.05641937255859375, 0.06202507019042969, 0.06763076782226562, 0.07323646545410156, 0.0788421630859375, 0.08444786071777344, 0.09005355834960938, 0.09565925598144531, 0.10126495361328125, 0.10687065124511719, 0.11247634887695312, 0.11808204650878906, 0.123687744140625, 0.12929344177246094, 0.13489913940429688, 0.1405048370361328, 0.14611053466796875, 0.1517162322998047, 0.15732192993164062, 0.16292762756347656, 0.1685333251953125, 0.17413902282714844, 0.17974472045898438, 0.1853504180908203, 0.19095611572265625, 0.1965618133544922, 0.20216751098632812, 0.20777320861816406, 0.21337890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 1.0, 2.0, 10.0, 5.0, 9.0, 15.0, 9.0, 26.0, 34.0, 47.0, 61.0, 99.0, 164.0, 291.0, 534.0, 1105.0, 2192.0, 4787.0, 10175.0, 22268.0, 50259.0, 117993.0, 283950.0, 314697.0, 136008.0, 56607.0, 25328.0, 11459.0, 5237.0, 2495.0, 1176.0, 604.0, 336.0, 194.0, 112.0, 81.0, 49.0, 29.0, 20.0, 14.0, 15.0, 13.0, 8.0, 8.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.415771484375, -0.401947021484375, -0.38812255859375, -0.374298095703125, -0.3604736328125, -0.346649169921875, -0.33282470703125, -0.319000244140625, -0.30517578125, -0.291351318359375, -0.27752685546875, -0.263702392578125, -0.2498779296875, -0.236053466796875, -0.22222900390625, -0.208404541015625, -0.194580078125, -0.180755615234375, -0.16693115234375, -0.153106689453125, -0.1392822265625, -0.125457763671875, -0.11163330078125, -0.097808837890625, -0.083984375, -0.070159912109375, -0.05633544921875, -0.042510986328125, -0.0286865234375, -0.014862060546875, -0.00103759765625, 0.012786865234375, 0.026611328125, 0.040435791015625, 0.05426025390625, 0.068084716796875, 0.0819091796875, 0.095733642578125, 0.10955810546875, 0.123382568359375, 0.13720703125, 0.151031494140625, 0.16485595703125, 0.178680419921875, 0.1925048828125, 0.206329345703125, 0.22015380859375, 0.233978271484375, 0.247802734375, 0.261627197265625, 0.27545166015625, 0.289276123046875, 0.3031005859375, 0.316925048828125, 0.33074951171875, 0.344573974609375, 0.3583984375, 0.372222900390625, 0.38604736328125, 0.399871826171875, 0.4136962890625, 0.427520751953125, 0.44134521484375, 0.455169677734375, 0.468994140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 7.0, 9.0, 15.0, 17.0, 21.0, 14.0, 27.0, 26.0, 32.0, 40.0, 32.0, 33.0, 40.0, 39.0, 50.0, 60.0, 55.0, 44.0, 44.0, 38.0, 45.0, 32.0, 29.0, 29.0, 35.0, 29.0, 22.0, 15.0, 23.0, 19.0, 13.0, 12.0, 12.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5439453125, -0.5272445678710938, -0.5105438232421875, -0.49384307861328125, -0.477142333984375, -0.46044158935546875, -0.4437408447265625, -0.42704010009765625, -0.41033935546875, -0.39363861083984375, -0.3769378662109375, -0.36023712158203125, -0.343536376953125, -0.32683563232421875, -0.3101348876953125, -0.29343414306640625, -0.2767333984375, -0.26003265380859375, -0.2433319091796875, -0.22663116455078125, -0.209930419921875, -0.19322967529296875, -0.1765289306640625, -0.15982818603515625, -0.14312744140625, -0.12642669677734375, -0.1097259521484375, -0.09302520751953125, -0.076324462890625, -0.05962371826171875, -0.0429229736328125, -0.02622222900390625, -0.009521484375, 0.00717926025390625, 0.0238800048828125, 0.04058074951171875, 0.057281494140625, 0.07398223876953125, 0.0906829833984375, 0.10738372802734375, 0.12408447265625, 0.14078521728515625, 0.1574859619140625, 0.17418670654296875, 0.190887451171875, 0.20758819580078125, 0.2242889404296875, 0.24098968505859375, 0.2576904296875, 0.27439117431640625, 0.2910919189453125, 0.30779266357421875, 0.324493408203125, 0.34119415283203125, 0.3578948974609375, 0.37459564208984375, 0.39129638671875, 0.40799713134765625, 0.4246978759765625, 0.44139862060546875, 0.458099365234375, 0.47480010986328125, 0.4915008544921875, 0.5082015991210938, 0.52490234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 6.0, 9.0, 10.0, 31.0, 38.0, 66.0, 111.0, 162.0, 229.0, 386.0, 563.0, 1023.0, 1911.0, 3710.0, 7888.0, 17758.0, 41561.0, 107422.0, 307035.0, 349077.0, 123939.0, 47634.0, 19858.0, 8990.0, 4180.0, 2057.0, 1141.0, 659.0, 415.0, 249.0, 147.0, 104.0, 68.0, 41.0, 27.0, 17.0, 7.0, 2.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2432861328125, -0.2357006072998047, -0.22811508178710938, -0.22052955627441406, -0.21294403076171875, -0.20535850524902344, -0.19777297973632812, -0.1901874542236328, -0.1826019287109375, -0.1750164031982422, -0.16743087768554688, -0.15984535217285156, -0.15225982666015625, -0.14467430114746094, -0.13708877563476562, -0.1295032501220703, -0.121917724609375, -0.11433219909667969, -0.10674667358398438, -0.09916114807128906, -0.09157562255859375, -0.08399009704589844, -0.07640457153320312, -0.06881904602050781, -0.0612335205078125, -0.05364799499511719, -0.046062469482421875, -0.03847694396972656, -0.03089141845703125, -0.023305892944335938, -0.015720367431640625, -0.008134841918945312, -0.00054931640625, 0.0070362091064453125, 0.014621734619140625, 0.022207260131835938, 0.02979278564453125, 0.03737831115722656, 0.044963836669921875, 0.05254936218261719, 0.0601348876953125, 0.06772041320800781, 0.07530593872070312, 0.08289146423339844, 0.09047698974609375, 0.09806251525878906, 0.10564804077148438, 0.11323356628417969, 0.120819091796875, 0.1284046173095703, 0.13599014282226562, 0.14357566833496094, 0.15116119384765625, 0.15874671936035156, 0.16633224487304688, 0.1739177703857422, 0.1815032958984375, 0.1890888214111328, 0.19667434692382812, 0.20425987243652344, 0.21184539794921875, 0.21943092346191406, 0.22701644897460938, 0.2346019744873047, 0.2421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 13.0, 8.0, 16.0, 13.0, 17.0, 14.0, 27.0, 20.0, 32.0, 46.0, 57.0, 93.0, 106.0, 97.0, 84.0, 56.0, 47.0, 38.0, 32.0, 21.0, 25.0, 21.0, 13.0, 15.0, 13.0, 7.0, 5.0, 7.0, 7.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.684925079345703e-05, -4.543270915746689e-05, -4.4016167521476746e-05, -4.25996258854866e-05, -4.118308424949646e-05, -3.976654261350632e-05, -3.8350000977516174e-05, -3.693345934152603e-05, -3.551691770553589e-05, -3.4100376069545746e-05, -3.26838344335556e-05, -3.126729279756546e-05, -2.9850751161575317e-05, -2.8434209525585175e-05, -2.7017667889595032e-05, -2.560112625360489e-05, -2.4184584617614746e-05, -2.2768042981624603e-05, -2.135150134563446e-05, -1.9934959709644318e-05, -1.8518418073654175e-05, -1.7101876437664032e-05, -1.568533480167389e-05, -1.4268793165683746e-05, -1.2852251529693604e-05, -1.143570989370346e-05, -1.0019168257713318e-05, -8.602626621723175e-06, -7.186084985733032e-06, -5.769543349742889e-06, -4.353001713752747e-06, -2.9364600777626038e-06, -1.519918441772461e-06, -1.0337680578231812e-07, 1.3131648302078247e-06, 2.7297064661979675e-06, 4.14624810218811e-06, 5.562789738178253e-06, 6.979331374168396e-06, 8.395873010158539e-06, 9.812414646148682e-06, 1.1228956282138824e-05, 1.2645497918128967e-05, 1.406203955411911e-05, 1.5478581190109253e-05, 1.6895122826099396e-05, 1.831166446208954e-05, 1.972820609807968e-05, 2.1144747734069824e-05, 2.2561289370059967e-05, 2.397783100605011e-05, 2.5394372642040253e-05, 2.6810914278030396e-05, 2.822745591402054e-05, 2.964399755001068e-05, 3.1060539186000824e-05, 3.247708082199097e-05, 3.389362245798111e-05, 3.531016409397125e-05, 3.6726705729961395e-05, 3.814324736595154e-05, 3.955978900194168e-05, 4.0976330637931824e-05, 4.2392872273921967e-05, 4.380941390991211e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 5.0, 5.0, 11.0, 12.0, 30.0, 28.0, 57.0, 89.0, 141.0, 251.0, 495.0, 956.0, 2063.0, 4972.0, 13062.0, 35979.0, 106313.0, 329608.0, 366883.0, 121571.0, 41053.0, 14858.0, 5608.0, 2296.0, 1038.0, 475.0, 271.0, 151.0, 103.0, 49.0, 39.0, 35.0, 10.0, 12.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.206298828125, -0.19806671142578125, -0.1898345947265625, -0.18160247802734375, -0.173370361328125, -0.16513824462890625, -0.1569061279296875, -0.14867401123046875, -0.14044189453125, -0.13220977783203125, -0.1239776611328125, -0.11574554443359375, -0.107513427734375, -0.09928131103515625, -0.0910491943359375, -0.08281707763671875, -0.0745849609375, -0.06635284423828125, -0.0581207275390625, -0.04988861083984375, -0.041656494140625, -0.03342437744140625, -0.0251922607421875, -0.01696014404296875, -0.00872802734375, -0.00049591064453125, 0.0077362060546875, 0.01596832275390625, 0.024200439453125, 0.03243255615234375, 0.0406646728515625, 0.04889678955078125, 0.05712890625, 0.06536102294921875, 0.0735931396484375, 0.08182525634765625, 0.090057373046875, 0.09828948974609375, 0.1065216064453125, 0.11475372314453125, 0.12298583984375, 0.13121795654296875, 0.1394500732421875, 0.14768218994140625, 0.155914306640625, 0.16414642333984375, 0.1723785400390625, 0.18061065673828125, 0.1888427734375, 0.19707489013671875, 0.2053070068359375, 0.21353912353515625, 0.221771240234375, 0.23000335693359375, 0.2382354736328125, 0.24646759033203125, 0.25469970703125, 0.26293182373046875, 0.2711639404296875, 0.27939605712890625, 0.287628173828125, 0.29586029052734375, 0.3040924072265625, 0.31232452392578125, 0.320556640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 5.0, 7.0, 10.0, 22.0, 13.0, 22.0, 26.0, 50.0, 36.0, 55.0, 59.0, 77.0, 86.0, 85.0, 81.0, 57.0, 58.0, 49.0, 23.0, 34.0, 26.0, 27.0, 14.0, 8.0, 10.0, 12.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.1644916534423828, -0.15820693969726562, -0.15192222595214844, -0.14563751220703125, -0.13935279846191406, -0.13306808471679688, -0.1267833709716797, -0.1204986572265625, -0.11421394348144531, -0.10792922973632812, -0.10164451599121094, -0.09535980224609375, -0.08907508850097656, -0.08279037475585938, -0.07650566101074219, -0.070220947265625, -0.06393623352050781, -0.057651519775390625, -0.05136680603027344, -0.04508209228515625, -0.03879737854003906, -0.032512664794921875, -0.026227951049804688, -0.0199432373046875, -0.013658523559570312, -0.007373809814453125, -0.0010890960693359375, 0.00519561767578125, 0.011480331420898438, 0.017765045166015625, 0.024049758911132812, 0.03033447265625, 0.03661918640136719, 0.042903900146484375, 0.04918861389160156, 0.05547332763671875, 0.06175804138183594, 0.06804275512695312, 0.07432746887207031, 0.0806121826171875, 0.08689689636230469, 0.09318161010742188, 0.09946632385253906, 0.10575103759765625, 0.11203575134277344, 0.11832046508789062, 0.12460517883300781, 0.130889892578125, 0.1371746063232422, 0.14345932006835938, 0.14974403381347656, 0.15602874755859375, 0.16231346130371094, 0.16859817504882812, 0.1748828887939453, 0.1811676025390625, 0.1874523162841797, 0.19373703002929688, 0.20002174377441406, 0.20630645751953125, 0.21259117126464844, 0.21887588500976562, 0.2251605987548828, 0.2314453125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 28.0, 87.0, 186.0, 320.0, 233.0, 110.0, 39.0, 8.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1280171871185303, -1.8813002109527588, -1.6345831155776978, -1.3878660202026367, -1.1411490440368652, -0.8944320678710938, -0.6477149724960327, -0.4009978771209717, -0.1542809009552002, 0.09243613481521606, 0.3391531705856323, 0.5858702063560486, 0.8325872421264648, 1.0793042182922363, 1.3260213136672974, 1.5727384090423584, 1.8194553852081299, 2.0661723613739014, 2.312889575958252, 2.5596065521240234, 2.806323528289795, 3.0530405044555664, 3.299757480621338, 3.5464746952056885, 3.79319167137146, 4.0399088859558105, 4.286625862121582, 4.5333428382873535, 4.780059814453125, 5.0267767906188965, 5.273493766784668, 5.520211219787598, 5.766927719116211, 6.013644695281982, 6.260361671447754, 6.507078647613525, 6.753795623779297, 7.000513076782227, 7.247230052947998, 7.4939470291137695, 7.740664005279541, 7.9873809814453125, 8.234098434448242, 8.480814933776855, 8.727532386779785, 8.974248886108398, 9.220966339111328, 9.467683792114258, 9.714400291442871, 9.9611177444458, 10.207834243774414, 10.454551696777344, 10.701268196105957, 10.947985649108887, 11.1947021484375, 11.44141960144043, 11.68813705444336, 11.934854507446289, 12.181571006774902, 12.428288459777832, 12.675004959106445, 12.921722412109375, 13.168438911437988, 13.415156364440918, 13.661872863769531]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 11.0, 9.0, 18.0, 10.0, 16.0, 15.0, 24.0, 30.0, 22.0, 34.0, 37.0, 34.0, 48.0, 51.0, 36.0, 64.0, 50.0, 49.0, 54.0, 32.0, 37.0, 50.0, 47.0, 44.0, 19.0, 34.0, 16.0, 21.0, 17.0, 17.0, 10.0, 7.0, 8.0, 10.0, 7.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7428758144378662, -1.6881561279296875, -1.6334364414215088, -1.57871675491333, -1.5239969491958618, -1.469277262687683, -1.4145575761795044, -1.3598378896713257, -1.3051180839538574, -1.2503983974456787, -1.1956787109375, -1.1409590244293213, -1.086239218711853, -1.0315195322036743, -0.9767998456954956, -0.9220801591873169, -0.8673604726791382, -0.8126407861709595, -0.757921040058136, -0.7032013535499573, -0.6484816074371338, -0.5937619209289551, -0.5390422344207764, -0.48432251811027527, -0.42960280179977417, -0.37488308548927307, -0.320163369178772, -0.26544368267059326, -0.21072396636009216, -0.15600425004959106, -0.10128456354141235, -0.046564847230911255, 0.008154749870300293, 0.0628744587302208, 0.1175941675901413, 0.1723138689994812, 0.2270335853099823, 0.2817533016204834, 0.3364729881286621, 0.3911927044391632, 0.4459124207496643, 0.500632107257843, 0.5553518533706665, 0.6100715398788452, 0.6647912263870239, 0.7195109724998474, 0.7742306590080261, 0.8289504051208496, 0.8836700916290283, 0.938389778137207, 0.9931095242500305, 1.0478291511535645, 1.1025489568710327, 1.1572686433792114, 1.2119883298873901, 1.2667080163955688, 1.321427822113037, 1.3761475086212158, 1.4308671951293945, 1.4855868816375732, 1.5403066873550415, 1.5950263738632202, 1.649746060371399, 1.7044657468795776, 1.7591854333877563]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 11.0, 12.0, 15.0, 21.0, 24.0, 42.0, 54.0, 74.0, 107.0, 114.0, 194.0, 285.0, 453.0, 659.0, 1009.0, 1703.0, 2784.0, 4527.0, 7761.0, 13947.0, 24695.0, 47372.0, 95897.0, 212798.0, 588133.0, 1774509.0, 883003.0, 284104.0, 120847.0, 58708.0, 30572.0, 16627.0, 9272.0, 5508.0, 3078.0, 1906.0, 1100.0, 758.0, 519.0, 335.0, 210.0, 168.0, 92.0, 81.0, 61.0, 42.0, 36.0, 15.0, 16.0, 6.0, 12.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.2200927734375, -0.21314048767089844, -0.20618820190429688, -0.1992359161376953, -0.19228363037109375, -0.1853313446044922, -0.17837905883789062, -0.17142677307128906, -0.1644744873046875, -0.15752220153808594, -0.15056991577148438, -0.1436176300048828, -0.13666534423828125, -0.1297130584716797, -0.12276077270507812, -0.11580848693847656, -0.108856201171875, -0.10190391540527344, -0.09495162963867188, -0.08799934387207031, -0.08104705810546875, -0.07409477233886719, -0.06714248657226562, -0.06019020080566406, -0.0532379150390625, -0.04628562927246094, -0.039333343505859375, -0.03238105773925781, -0.02542877197265625, -0.018476486206054688, -0.011524200439453125, -0.0045719146728515625, 0.00238037109375, 0.009332656860351562, 0.016284942626953125, 0.023237228393554688, 0.03018951416015625, 0.03714179992675781, 0.044094085693359375, 0.05104637145996094, 0.0579986572265625, 0.06495094299316406, 0.07190322875976562, 0.07885551452636719, 0.08580780029296875, 0.09276008605957031, 0.09971237182617188, 0.10666465759277344, 0.113616943359375, 0.12056922912597656, 0.12752151489257812, 0.1344738006591797, 0.14142608642578125, 0.1483783721923828, 0.15533065795898438, 0.16228294372558594, 0.1692352294921875, 0.17618751525878906, 0.18313980102539062, 0.1900920867919922, 0.19704437255859375, 0.2039966583251953, 0.21094894409179688, 0.21790122985839844, 0.224853515625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 6.0, 8.0, 18.0, 14.0, 11.0, 14.0, 17.0, 15.0, 30.0, 28.0, 41.0, 36.0, 34.0, 41.0, 38.0, 39.0, 40.0, 43.0, 45.0, 46.0, 40.0, 53.0, 48.0, 51.0, 46.0, 32.0, 28.0, 28.0, 20.0, 22.0, 17.0, 12.0, 11.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.144073486328125, -0.13836669921875, -0.132659912109375, -0.126953125, -0.121246337890625, -0.11553955078125, -0.109832763671875, -0.1041259765625, -0.098419189453125, -0.09271240234375, -0.087005615234375, -0.081298828125, -0.075592041015625, -0.06988525390625, -0.064178466796875, -0.0584716796875, -0.052764892578125, -0.04705810546875, -0.041351318359375, -0.03564453125, -0.029937744140625, -0.02423095703125, -0.018524169921875, -0.0128173828125, -0.007110595703125, -0.00140380859375, 0.004302978515625, 0.010009765625, 0.015716552734375, 0.02142333984375, 0.027130126953125, 0.0328369140625, 0.038543701171875, 0.04425048828125, 0.049957275390625, 0.0556640625, 0.061370849609375, 0.06707763671875, 0.072784423828125, 0.0784912109375, 0.084197998046875, 0.08990478515625, 0.095611572265625, 0.101318359375, 0.107025146484375, 0.11273193359375, 0.118438720703125, 0.1241455078125, 0.129852294921875, 0.13555908203125, 0.141265869140625, 0.14697265625, 0.152679443359375, 0.15838623046875, 0.164093017578125, 0.1697998046875, 0.175506591796875, 0.18121337890625, 0.186920166015625, 0.192626953125, 0.198333740234375, 0.20404052734375, 0.209747314453125, 0.2154541015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 16.0, 28.0, 26.0, 42.0, 89.0, 116.0, 176.0, 276.0, 458.0, 784.0, 1488.0, 2672.0, 5139.0, 10101.0, 21547.0, 48353.0, 113634.0, 294526.0, 951151.0, 1844581.0, 558157.0, 195997.0, 78889.0, 34062.0, 15741.0, 7557.0, 3826.0, 2039.0, 1108.0, 611.0, 388.0, 225.0, 172.0, 109.0, 62.0, 41.0, 35.0, 19.0, 9.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389404296875, -0.3773460388183594, -0.36528778076171875, -0.3532295227050781, -0.3411712646484375, -0.3291130065917969, -0.31705474853515625, -0.3049964904785156, -0.292938232421875, -0.2808799743652344, -0.26882171630859375, -0.2567634582519531, -0.2447052001953125, -0.23264694213867188, -0.22058868408203125, -0.20853042602539062, -0.19647216796875, -0.18441390991210938, -0.17235565185546875, -0.16029739379882812, -0.1482391357421875, -0.13618087768554688, -0.12412261962890625, -0.11206436157226562, -0.100006103515625, -0.08794784545898438, -0.07588958740234375, -0.06383132934570312, -0.0517730712890625, -0.039714813232421875, -0.02765655517578125, -0.015598297119140625, -0.0035400390625, 0.008518218994140625, 0.02057647705078125, 0.032634735107421875, 0.0446929931640625, 0.056751251220703125, 0.06880950927734375, 0.08086776733398438, 0.092926025390625, 0.10498428344726562, 0.11704254150390625, 0.12910079956054688, 0.1411590576171875, 0.15321731567382812, 0.16527557373046875, 0.17733383178710938, 0.18939208984375, 0.20145034790039062, 0.21350860595703125, 0.22556686401367188, 0.2376251220703125, 0.24968338012695312, 0.26174163818359375, 0.2737998962402344, 0.285858154296875, 0.2979164123535156, 0.30997467041015625, 0.3220329284667969, 0.3340911865234375, 0.3461494445800781, 0.35820770263671875, 0.3702659606933594, 0.38232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 12.0, 11.0, 17.0, 24.0, 34.0, 43.0, 60.0, 102.0, 133.0, 159.0, 233.0, 373.0, 557.0, 734.0, 544.0, 309.0, 216.0, 147.0, 114.0, 71.0, 39.0, 37.0, 26.0, 23.0, 12.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.4130859375, -0.39794921875, -0.3828125, -0.36767578125, -0.3525390625, -0.33740234375, -0.322265625, -0.30712890625, -0.2919921875, -0.27685546875, -0.26171875, -0.24658203125, -0.2314453125, -0.21630859375, -0.201171875, -0.18603515625, -0.1708984375, -0.15576171875, -0.140625, -0.12548828125, -0.1103515625, -0.09521484375, -0.080078125, -0.06494140625, -0.0498046875, -0.03466796875, -0.01953125, -0.00439453125, 0.0107421875, 0.02587890625, 0.041015625, 0.05615234375, 0.0712890625, 0.08642578125, 0.1015625, 0.11669921875, 0.1318359375, 0.14697265625, 0.162109375, 0.17724609375, 0.1923828125, 0.20751953125, 0.22265625, 0.23779296875, 0.2529296875, 0.26806640625, 0.283203125, 0.29833984375, 0.3134765625, 0.32861328125, 0.34375, 0.35888671875, 0.3740234375, 0.38916015625, 0.404296875, 0.41943359375, 0.4345703125, 0.44970703125, 0.46484375, 0.47998046875, 0.4951171875, 0.51025390625, 0.525390625, 0.54052734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 12.0, 15.0, 27.0, 39.0, 52.0, 64.0, 75.0, 84.0, 120.0, 112.0, 91.0, 84.0, 63.0, 64.0, 35.0, 21.0, 15.0, 7.0, 11.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2121691703796387, -2.129901647567749, -2.0476343631744385, -1.9653668403625488, -1.8830993175506592, -1.800831913948059, -1.718564510345459, -1.6362969875335693, -1.5540295839309692, -1.4717621803283691, -1.3894946575164795, -1.3072272539138794, -1.2249598503112793, -1.1426923274993896, -1.0604249238967896, -0.9781574606895447, -0.8958899974822998, -0.8136225342750549, -0.7313550710678101, -0.64908766746521, -0.5668202042579651, -0.4845527410507202, -0.40228530764579773, -0.32001787424087524, -0.23775041103363037, -0.1554829627275467, -0.07321551442146301, 0.009051933884620667, 0.09131938219070435, 0.17358684539794922, 0.2558542788028717, 0.3381217122077942, 0.42038917541503906, 0.5026566386222839, 0.5849241018295288, 0.6671915054321289, 0.7494589686393738, 0.8317264318466187, 0.9139938354492188, 0.9962612986564636, 1.0785287618637085, 1.1607961654663086, 1.2430636882781982, 1.3253310918807983, 1.4075984954833984, 1.489866018295288, 1.5721334218978882, 1.6544008255004883, 1.736668348312378, 1.818935751914978, 1.9012032747268677, 1.9834706783294678, 2.0657382011413574, 2.148005485534668, 2.2302730083465576, 2.3125405311584473, 2.394807815551758, 2.4770753383636475, 2.559342622756958, 2.6416101455688477, 2.7238776683807373, 2.806145191192627, 2.8884124755859375, 2.970679998397827, 3.052947521209717]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 3.0, 8.0, 7.0, 7.0, 13.0, 12.0, 9.0, 10.0, 23.0, 18.0, 26.0, 19.0, 25.0, 18.0, 33.0, 34.0, 40.0, 50.0, 31.0, 41.0, 34.0, 27.0, 36.0, 39.0, 48.0, 37.0, 41.0, 40.0, 26.0, 30.0, 28.0, 24.0, 27.0, 31.0, 14.0, 14.0, 17.0, 15.0, 6.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1867331266403198, -1.146103024482727, -1.1054729223251343, -1.064842939376831, -1.0242128372192383, -0.9835827350616455, -0.9429526329040527, -0.90232253074646, -0.861692488193512, -0.8210623860359192, -0.7804323434829712, -0.7398022413253784, -0.6991721391677856, -0.6585420966148376, -0.6179119944572449, -0.5772819519042969, -0.5366518497467041, -0.4960217773914337, -0.45539170503616333, -0.41476160287857056, -0.37413153052330017, -0.3335014581680298, -0.292871356010437, -0.2522412836551666, -0.21161121129989624, -0.17098113894462585, -0.13035105168819427, -0.08972097188234329, -0.04909089207649231, -0.008460819721221924, 0.032169267535209656, 0.07279935479164124, 0.11342930793762207, 0.15405938029289246, 0.19468946754932404, 0.23531955480575562, 0.275949627161026, 0.3165796995162964, 0.35720980167388916, 0.39783987402915955, 0.43846994638442993, 0.4791000187397003, 0.5197300910949707, 0.5603601932525635, 0.6009902954101562, 0.6416203379631042, 0.682250440120697, 0.722880482673645, 0.7635105848312378, 0.8041406869888306, 0.8447707295417786, 0.8854008316993713, 0.9260308742523193, 0.9666609764099121, 1.0072910785675049, 1.0479211807250977, 1.0885512828826904, 1.1291813850402832, 1.169811487197876, 1.2104414701461792, 1.251071572303772, 1.2917016744613647, 1.3323317766189575, 1.3729618787765503, 1.4135918617248535]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 15.0, 16.0, 21.0, 18.0, 50.0, 58.0, 80.0, 134.0, 192.0, 296.0, 441.0, 536.0, 816.0, 1233.0, 1838.0, 2790.0, 4187.0, 6414.0, 10138.0, 16107.0, 27638.0, 50192.0, 103849.0, 235368.0, 288095.0, 144463.0, 65076.0, 34205.0, 19815.0, 12064.0, 7454.0, 4846.0, 3327.0, 2103.0, 1448.0, 997.0, 711.0, 489.0, 336.0, 218.0, 156.0, 102.0, 66.0, 51.0, 34.0, 22.0, 19.0, 11.0, 10.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.304443359375, -0.2949867248535156, -0.28553009033203125, -0.2760734558105469, -0.2666168212890625, -0.2571601867675781, -0.24770355224609375, -0.23824691772460938, -0.228790283203125, -0.21933364868164062, -0.20987701416015625, -0.20042037963867188, -0.1909637451171875, -0.18150711059570312, -0.17205047607421875, -0.16259384155273438, -0.15313720703125, -0.14368057250976562, -0.13422393798828125, -0.12476730346679688, -0.1153106689453125, -0.10585403442382812, -0.09639739990234375, -0.08694076538085938, -0.077484130859375, -0.06802749633789062, -0.05857086181640625, -0.049114227294921875, -0.0396575927734375, -0.030200958251953125, -0.02074432373046875, -0.011287689208984375, -0.0018310546875, 0.007625579833984375, 0.01708221435546875, 0.026538848876953125, 0.0359954833984375, 0.045452117919921875, 0.05490875244140625, 0.06436538696289062, 0.073822021484375, 0.08327865600585938, 0.09273529052734375, 0.10219192504882812, 0.1116485595703125, 0.12110519409179688, 0.13056182861328125, 0.14001846313476562, 0.14947509765625, 0.15893173217773438, 0.16838836669921875, 0.17784500122070312, 0.1873016357421875, 0.19675827026367188, 0.20621490478515625, 0.21567153930664062, 0.225128173828125, 0.23458480834960938, 0.24404144287109375, 0.2534980773925781, 0.2629547119140625, 0.2724113464355469, 0.28186798095703125, 0.2913246154785156, 0.30078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 6.0, 1.0, 2.0, 7.0, 2.0, 13.0, 9.0, 6.0, 12.0, 13.0, 21.0, 19.0, 20.0, 30.0, 19.0, 30.0, 37.0, 34.0, 44.0, 28.0, 32.0, 40.0, 39.0, 40.0, 40.0, 35.0, 51.0, 36.0, 43.0, 33.0, 28.0, 30.0, 22.0, 33.0, 26.0, 25.0, 20.0, 13.0, 21.0, 18.0, 8.0, 4.0, 6.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.162353515625, -0.15653228759765625, -0.1507110595703125, -0.14488983154296875, -0.139068603515625, -0.13324737548828125, -0.1274261474609375, -0.12160491943359375, -0.11578369140625, -0.10996246337890625, -0.1041412353515625, -0.09832000732421875, -0.092498779296875, -0.08667755126953125, -0.0808563232421875, -0.07503509521484375, -0.0692138671875, -0.06339263916015625, -0.0575714111328125, -0.05175018310546875, -0.045928955078125, -0.04010772705078125, -0.0342864990234375, -0.02846527099609375, -0.02264404296875, -0.01682281494140625, -0.0110015869140625, -0.00518035888671875, 0.000640869140625, 0.00646209716796875, 0.0122833251953125, 0.01810455322265625, 0.02392578125, 0.02974700927734375, 0.0355682373046875, 0.04138946533203125, 0.047210693359375, 0.05303192138671875, 0.0588531494140625, 0.06467437744140625, 0.07049560546875, 0.07631683349609375, 0.0821380615234375, 0.08795928955078125, 0.093780517578125, 0.09960174560546875, 0.1054229736328125, 0.11124420166015625, 0.1170654296875, 0.12288665771484375, 0.1287078857421875, 0.13452911376953125, 0.140350341796875, 0.14617156982421875, 0.1519927978515625, 0.15781402587890625, 0.16363525390625, 0.16945648193359375, 0.1752777099609375, 0.18109893798828125, 0.186920166015625, 0.19274139404296875, 0.1985626220703125, 0.20438385009765625, 0.210205078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 4.0, 17.0, 27.0, 32.0, 77.0, 117.0, 310.0, 575.0, 1106.0, 2540.0, 5614.0, 12924.0, 29043.0, 75276.0, 282311.0, 438623.0, 125656.0, 41711.0, 17912.0, 7827.0, 3683.0, 1676.0, 720.0, 360.0, 198.0, 87.0, 51.0, 24.0, 20.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65380859375, -0.6371345520019531, -0.6204605102539062, -0.6037864685058594, -0.5871124267578125, -0.5704383850097656, -0.5537643432617188, -0.5370903015136719, -0.520416259765625, -0.5037422180175781, -0.48706817626953125, -0.4703941345214844, -0.4537200927734375, -0.4370460510253906, -0.42037200927734375, -0.4036979675292969, -0.38702392578125, -0.3703498840332031, -0.35367584228515625, -0.3370018005371094, -0.3203277587890625, -0.3036537170410156, -0.28697967529296875, -0.2703056335449219, -0.253631591796875, -0.23695755004882812, -0.22028350830078125, -0.20360946655273438, -0.1869354248046875, -0.17026138305664062, -0.15358734130859375, -0.13691329956054688, -0.1202392578125, -0.10356521606445312, -0.08689117431640625, -0.07021713256835938, -0.0535430908203125, -0.036869049072265625, -0.02019500732421875, -0.003520965576171875, 0.013153076171875, 0.029827117919921875, 0.04650115966796875, 0.06317520141601562, 0.0798492431640625, 0.09652328491210938, 0.11319732666015625, 0.12987136840820312, 0.14654541015625, 0.16321945190429688, 0.17989349365234375, 0.19656753540039062, 0.2132415771484375, 0.22991561889648438, 0.24658966064453125, 0.2632637023925781, 0.279937744140625, 0.2966117858886719, 0.31328582763671875, 0.3299598693847656, 0.3466339111328125, 0.3633079528808594, 0.37998199462890625, 0.3966560363769531, 0.413330078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 6.0, 7.0, 6.0, 9.0, 1.0, 8.0, 18.0, 9.0, 13.0, 20.0, 25.0, 21.0, 27.0, 26.0, 30.0, 42.0, 38.0, 52.0, 38.0, 42.0, 46.0, 34.0, 39.0, 33.0, 38.0, 37.0, 48.0, 36.0, 32.0, 24.0, 26.0, 23.0, 16.0, 18.0, 13.0, 14.0, 12.0, 13.0, 11.0, 12.0, 5.0, 2.0, 7.0, 7.0, 8.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.5771484375, -0.5598907470703125, -0.542633056640625, -0.5253753662109375, -0.50811767578125, -0.4908599853515625, -0.473602294921875, -0.4563446044921875, -0.4390869140625, -0.4218292236328125, -0.404571533203125, -0.3873138427734375, -0.37005615234375, -0.3527984619140625, -0.335540771484375, -0.3182830810546875, -0.301025390625, -0.2837677001953125, -0.266510009765625, -0.2492523193359375, -0.23199462890625, -0.2147369384765625, -0.197479248046875, -0.1802215576171875, -0.1629638671875, -0.1457061767578125, -0.128448486328125, -0.1111907958984375, -0.09393310546875, -0.0766754150390625, -0.059417724609375, -0.0421600341796875, -0.02490234375, -0.0076446533203125, 0.009613037109375, 0.0268707275390625, 0.04412841796875, 0.0613861083984375, 0.078643798828125, 0.0959014892578125, 0.1131591796875, 0.1304168701171875, 0.147674560546875, 0.1649322509765625, 0.18218994140625, 0.1994476318359375, 0.216705322265625, 0.2339630126953125, 0.251220703125, 0.2684783935546875, 0.285736083984375, 0.3029937744140625, 0.32025146484375, 0.3375091552734375, 0.354766845703125, 0.3720245361328125, 0.3892822265625, 0.4065399169921875, 0.423797607421875, 0.4410552978515625, 0.45831298828125, 0.4755706787109375, 0.492828369140625, 0.5100860595703125, 0.52734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 17.0, 19.0, 17.0, 47.0, 67.0, 124.0, 181.0, 296.0, 553.0, 883.0, 1583.0, 2764.0, 4783.0, 8484.0, 14869.0, 26375.0, 47069.0, 89651.0, 210704.0, 324708.0, 154211.0, 71467.0, 39116.0, 21691.0, 12259.0, 7169.0, 3953.0, 2289.0, 1329.0, 764.0, 451.0, 251.0, 133.0, 91.0, 58.0, 48.0, 26.0, 21.0, 7.0, 11.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11358642578125, -0.10927295684814453, -0.10495948791503906, -0.1006460189819336, -0.09633255004882812, -0.09201908111572266, -0.08770561218261719, -0.08339214324951172, -0.07907867431640625, -0.07476520538330078, -0.07045173645019531, -0.06613826751708984, -0.061824798583984375, -0.057511329650878906, -0.05319786071777344, -0.04888439178466797, -0.0445709228515625, -0.04025745391845703, -0.03594398498535156, -0.031630516052246094, -0.027317047119140625, -0.023003578186035156, -0.018690109252929688, -0.014376640319824219, -0.01006317138671875, -0.005749702453613281, -0.0014362335205078125, 0.0028772354125976562, 0.007190704345703125, 0.011504173278808594, 0.015817642211914062, 0.02013111114501953, 0.024444580078125, 0.02875804901123047, 0.03307151794433594, 0.037384986877441406, 0.041698455810546875, 0.046011924743652344, 0.05032539367675781, 0.05463886260986328, 0.05895233154296875, 0.06326580047607422, 0.06757926940917969, 0.07189273834228516, 0.07620620727539062, 0.0805196762084961, 0.08483314514160156, 0.08914661407470703, 0.0934600830078125, 0.09777355194091797, 0.10208702087402344, 0.1064004898071289, 0.11071395874023438, 0.11502742767333984, 0.11934089660644531, 0.12365436553955078, 0.12796783447265625, 0.13228130340576172, 0.1365947723388672, 0.14090824127197266, 0.14522171020507812, 0.1495351791381836, 0.15384864807128906, 0.15816211700439453, 0.1624755859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 8.0, 3.0, 10.0, 4.0, 7.0, 9.0, 9.0, 11.0, 9.0, 26.0, 31.0, 40.0, 57.0, 106.0, 167.0, 149.0, 126.0, 62.0, 47.0, 39.0, 15.0, 11.0, 14.0, 9.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.435943603515625e-05, -5.260482430458069e-05, -5.085021257400513e-05, -4.9095600843429565e-05, -4.7340989112854004e-05, -4.558637738227844e-05, -4.383176565170288e-05, -4.207715392112732e-05, -4.032254219055176e-05, -3.8567930459976196e-05, -3.6813318729400635e-05, -3.505870699882507e-05, -3.330409526824951e-05, -3.154948353767395e-05, -2.979487180709839e-05, -2.8040260076522827e-05, -2.6285648345947266e-05, -2.4531036615371704e-05, -2.2776424884796143e-05, -2.102181315422058e-05, -1.926720142364502e-05, -1.7512589693069458e-05, -1.5757977962493896e-05, -1.4003366231918335e-05, -1.2248754501342773e-05, -1.0494142770767212e-05, -8.73953104019165e-06, -6.984919309616089e-06, -5.230307579040527e-06, -3.475695848464966e-06, -1.7210841178894043e-06, 3.3527612686157227e-08, 1.7881393432617188e-06, 3.5427510738372803e-06, 5.297362804412842e-06, 7.051974534988403e-06, 8.806586265563965e-06, 1.0561197996139526e-05, 1.2315809726715088e-05, 1.407042145729065e-05, 1.582503318786621e-05, 1.7579644918441772e-05, 1.9334256649017334e-05, 2.1088868379592896e-05, 2.2843480110168457e-05, 2.459809184074402e-05, 2.635270357131958e-05, 2.810731530189514e-05, 2.9861927032470703e-05, 3.1616538763046265e-05, 3.3371150493621826e-05, 3.512576222419739e-05, 3.688037395477295e-05, 3.863498568534851e-05, 4.038959741592407e-05, 4.2144209146499634e-05, 4.3898820877075195e-05, 4.565343260765076e-05, 4.740804433822632e-05, 4.916265606880188e-05, 5.091726779937744e-05, 5.2671879529953e-05, 5.4426491260528564e-05, 5.6181102991104126e-05, 5.793571472167969e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 16.0, 28.0, 46.0, 75.0, 107.0, 189.0, 416.0, 781.0, 1590.0, 3659.0, 7730.0, 17536.0, 40967.0, 103022.0, 319666.0, 355804.0, 115994.0, 45632.0, 19222.0, 8565.0, 3900.0, 1837.0, 844.0, 441.0, 205.0, 109.0, 67.0, 47.0, 27.0, 17.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2052001953125, -0.1991748809814453, -0.19314956665039062, -0.18712425231933594, -0.18109893798828125, -0.17507362365722656, -0.16904830932617188, -0.1630229949951172, -0.1569976806640625, -0.1509723663330078, -0.14494705200195312, -0.13892173767089844, -0.13289642333984375, -0.12687110900878906, -0.12084579467773438, -0.11482048034667969, -0.108795166015625, -0.10276985168457031, -0.09674453735351562, -0.09071922302246094, -0.08469390869140625, -0.07866859436035156, -0.07264328002929688, -0.06661796569824219, -0.0605926513671875, -0.05456733703613281, -0.048542022705078125, -0.04251670837402344, -0.03649139404296875, -0.030466079711914062, -0.024440765380859375, -0.018415451049804688, -0.01239013671875, -0.0063648223876953125, -0.000339508056640625, 0.0056858062744140625, 0.01171112060546875, 0.017736434936523438, 0.023761749267578125, 0.029787063598632812, 0.0358123779296875, 0.04183769226074219, 0.047863006591796875, 0.05388832092285156, 0.05991363525390625, 0.06593894958496094, 0.07196426391601562, 0.07798957824707031, 0.084014892578125, 0.09004020690917969, 0.09606552124023438, 0.10209083557128906, 0.10811614990234375, 0.11414146423339844, 0.12016677856445312, 0.1261920928955078, 0.1322174072265625, 0.1382427215576172, 0.14426803588867188, 0.15029335021972656, 0.15631866455078125, 0.16234397888183594, 0.16836929321289062, 0.1743946075439453, 0.180419921875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 15.0, 6.0, 19.0, 17.0, 21.0, 25.0, 35.0, 42.0, 46.0, 81.0, 75.0, 103.0, 101.0, 88.0, 61.0, 50.0, 36.0, 35.0, 18.0, 21.0, 20.0, 7.0, 8.0, 13.0, 6.0, 7.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1878662109375, -0.18215179443359375, -0.1764373779296875, -0.17072296142578125, -0.165008544921875, -0.15929412841796875, -0.1535797119140625, -0.14786529541015625, -0.14215087890625, -0.13643646240234375, -0.1307220458984375, -0.12500762939453125, -0.119293212890625, -0.11357879638671875, -0.1078643798828125, -0.10214996337890625, -0.096435546875, -0.09072113037109375, -0.0850067138671875, -0.07929229736328125, -0.073577880859375, -0.06786346435546875, -0.0621490478515625, -0.05643463134765625, -0.05072021484375, -0.04500579833984375, -0.0392913818359375, -0.03357696533203125, -0.027862548828125, -0.02214813232421875, -0.0164337158203125, -0.01071929931640625, -0.0050048828125, 0.00070953369140625, 0.0064239501953125, 0.01213836669921875, 0.017852783203125, 0.02356719970703125, 0.0292816162109375, 0.03499603271484375, 0.04071044921875, 0.04642486572265625, 0.0521392822265625, 0.05785369873046875, 0.063568115234375, 0.06928253173828125, 0.0749969482421875, 0.08071136474609375, 0.08642578125, 0.09214019775390625, 0.0978546142578125, 0.10356903076171875, 0.109283447265625, 0.11499786376953125, 0.1207122802734375, 0.12642669677734375, 0.13214111328125, 0.13785552978515625, 0.1435699462890625, 0.14928436279296875, 0.154998779296875, 0.16071319580078125, 0.1664276123046875, 0.17214202880859375, 0.1778564453125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 11.0, 11.0, 22.0, 29.0, 29.0, 74.0, 78.0, 102.0, 120.0, 125.0, 107.0, 87.0, 67.0, 45.0, 33.0, 26.0, 9.0, 16.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5914758443832397, -1.517104148864746, -1.442732334136963, -1.3683606386184692, -1.2939889430999756, -1.2196171283721924, -1.1452454328536987, -1.070873737335205, -0.9965019822120667, -0.9221302270889282, -0.8477585315704346, -0.7733867764472961, -0.6990150213241577, -0.6246433258056641, -0.5502715706825256, -0.475899875164032, -0.40152812004089355, -0.3271563947200775, -0.2527846693992615, -0.17841291427612305, -0.104041188955307, -0.029669463634490967, 0.04470229148864746, 0.11907398700714111, 0.19344574213027954, 0.2678174674510956, 0.3421891927719116, 0.41656094789505005, 0.4909326732158661, 0.5653043985366821, 0.6396761536598206, 0.7140478491783142, 0.7884194850921631, 0.8627912402153015, 0.9371629357337952, 1.0115346908569336, 1.0859063863754272, 1.160278081893921, 1.234649896621704, 1.3090215921401978, 1.3833932876586914, 1.457764983177185, 1.5321367979049683, 1.606508493423462, 1.6808801889419556, 1.7552518844604492, 1.8296236991882324, 1.903995394706726, 1.9783672094345093, 2.052738904953003, 2.127110719680786, 2.2014822959899902, 2.2758541107177734, 2.3502259254455566, 2.42459774017334, 2.498969316482544, 2.573341131210327, 2.6477129459381104, 2.7220845222473145, 2.7964563369750977, 2.870828151702881, 2.945199728012085, 3.019571542739868, 3.0939431190490723, 3.1683149337768555]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 7.0, 2.0, 2.0, 4.0, 10.0, 7.0, 5.0, 15.0, 11.0, 18.0, 15.0, 27.0, 30.0, 30.0, 30.0, 30.0, 30.0, 33.0, 33.0, 40.0, 46.0, 40.0, 39.0, 42.0, 33.0, 39.0, 48.0, 37.0, 37.0, 36.0, 30.0, 31.0, 29.0, 28.0, 14.0, 18.0, 17.0, 18.0, 19.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5477862358093262, -1.5011661052703857, -1.4545459747314453, -1.4079258441925049, -1.361305832862854, -1.3146857023239136, -1.2680655717849731, -1.2214454412460327, -1.1748254299163818, -1.1282052993774414, -1.081585168838501, -1.0349650382995605, -0.9883450269699097, -0.9417248964309692, -0.8951047658920288, -0.8484846353530884, -0.801864504814148, -0.7552443742752075, -0.7086243033409119, -0.6620041728019714, -0.6153841018676758, -0.5687639713287354, -0.5221438407897949, -0.4755237400531769, -0.42890363931655884, -0.3822835385799408, -0.33566343784332275, -0.2890433073043823, -0.24242320656776428, -0.19580310583114624, -0.1491829752922058, -0.10256287455558777, -0.05594289302825928, -0.009322784841060638, 0.037297323346138, 0.08391743898391724, 0.13053753972053528, 0.17715764045715332, 0.22377777099609375, 0.2703978717327118, 0.31701797246932983, 0.3636380732059479, 0.4102581739425659, 0.45687830448150635, 0.5034984350204468, 0.5501185059547424, 0.5967386364936829, 0.6433587074279785, 0.689978837966919, 0.7365989685058594, 0.783219039440155, 0.8298391699790955, 0.8764592409133911, 0.9230793714523315, 0.969699501991272, 1.0163196325302124, 1.0629396438598633, 1.1095597743988037, 1.1561799049377441, 1.2028000354766846, 1.2494200468063354, 1.2960401773452759, 1.3426603078842163, 1.3892804384231567, 1.4359005689620972]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 8.0, 5.0, 11.0, 21.0, 23.0, 27.0, 50.0, 71.0, 120.0, 189.0, 296.0, 476.0, 798.0, 1389.0, 2221.0, 4104.0, 7431.0, 13439.0, 26063.0, 52191.0, 112308.0, 284336.0, 1165929.0, 1848822.0, 398302.0, 142822.0, 64174.0, 31483.0, 16368.0, 8935.0, 4931.0, 2848.0, 1594.0, 1015.0, 576.0, 304.0, 221.0, 142.0, 89.0, 59.0, 27.0, 23.0, 15.0, 15.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.23386383056640625, -0.2245635986328125, -0.21526336669921875, -0.205963134765625, -0.19666290283203125, -0.1873626708984375, -0.17806243896484375, -0.16876220703125, -0.15946197509765625, -0.1501617431640625, -0.14086151123046875, -0.131561279296875, -0.12226104736328125, -0.1129608154296875, -0.10366058349609375, -0.0943603515625, -0.08506011962890625, -0.0757598876953125, -0.06645965576171875, -0.057159423828125, -0.04785919189453125, -0.0385589599609375, -0.02925872802734375, -0.01995849609375, -0.01065826416015625, -0.0013580322265625, 0.00794219970703125, 0.017242431640625, 0.02654266357421875, 0.0358428955078125, 0.04514312744140625, 0.054443359375, 0.06374359130859375, 0.0730438232421875, 0.08234405517578125, 0.091644287109375, 0.10094451904296875, 0.1102447509765625, 0.11954498291015625, 0.12884521484375, 0.13814544677734375, 0.1474456787109375, 0.15674591064453125, 0.166046142578125, 0.17534637451171875, 0.1846466064453125, 0.19394683837890625, 0.2032470703125, 0.21254730224609375, 0.2218475341796875, 0.23114776611328125, 0.240447998046875, 0.24974822998046875, 0.2590484619140625, 0.26834869384765625, 0.27764892578125, 0.28694915771484375, 0.2962493896484375, 0.30554962158203125, 0.314849853515625, 0.32415008544921875, 0.3334503173828125, 0.34275054931640625, 0.35205078125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 7.0, 4.0, 15.0, 5.0, 15.0, 15.0, 10.0, 8.0, 8.0, 19.0, 23.0, 28.0, 25.0, 30.0, 25.0, 46.0, 45.0, 42.0, 36.0, 42.0, 37.0, 38.0, 49.0, 26.0, 26.0, 39.0, 40.0, 29.0, 38.0, 34.0, 36.0, 18.0, 23.0, 20.0, 17.0, 23.0, 13.0, 14.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.16259765625, -0.15688133239746094, -0.15116500854492188, -0.1454486846923828, -0.13973236083984375, -0.1340160369873047, -0.12829971313476562, -0.12258338928222656, -0.1168670654296875, -0.11115074157714844, -0.10543441772460938, -0.09971809387207031, -0.09400177001953125, -0.08828544616699219, -0.08256912231445312, -0.07685279846191406, -0.071136474609375, -0.06542015075683594, -0.059703826904296875, -0.05398750305175781, -0.04827117919921875, -0.04255485534667969, -0.036838531494140625, -0.031122207641601562, -0.0254058837890625, -0.019689559936523438, -0.013973236083984375, -0.008256912231445312, -0.00254058837890625, 0.0031757354736328125, 0.008892059326171875, 0.014608383178710938, 0.02032470703125, 0.026041030883789062, 0.031757354736328125, 0.03747367858886719, 0.04319000244140625, 0.04890632629394531, 0.054622650146484375, 0.06033897399902344, 0.0660552978515625, 0.07177162170410156, 0.07748794555664062, 0.08320426940917969, 0.08892059326171875, 0.09463691711425781, 0.10035324096679688, 0.10606956481933594, 0.111785888671875, 0.11750221252441406, 0.12321853637695312, 0.1289348602294922, 0.13465118408203125, 0.1403675079345703, 0.14608383178710938, 0.15180015563964844, 0.1575164794921875, 0.16323280334472656, 0.16894912719726562, 0.1746654510498047, 0.18038177490234375, 0.1860980987548828, 0.19181442260742188, 0.19753074645996094, 0.2032470703125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 11.0, 17.0, 21.0, 22.0, 49.0, 71.0, 134.0, 206.0, 377.0, 522.0, 921.0, 1622.0, 2781.0, 4959.0, 9256.0, 17475.0, 34203.0, 69954.0, 150748.0, 368608.0, 1351184.0, 1479493.0, 393931.0, 159926.0, 72549.0, 35599.0, 18001.0, 9597.0, 5184.0, 2900.0, 1613.0, 949.0, 565.0, 335.0, 179.0, 117.0, 67.0, 50.0, 45.0, 10.0, 11.0, 10.0, 6.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.3676719665527344, -0.35619354248046875, -0.3447151184082031, -0.3332366943359375, -0.3217582702636719, -0.31027984619140625, -0.2988014221191406, -0.287322998046875, -0.2758445739746094, -0.26436614990234375, -0.2528877258300781, -0.2414093017578125, -0.22993087768554688, -0.21845245361328125, -0.20697402954101562, -0.19549560546875, -0.18401718139648438, -0.17253875732421875, -0.16106033325195312, -0.1495819091796875, -0.13810348510742188, -0.12662506103515625, -0.11514663696289062, -0.103668212890625, -0.09218978881835938, -0.08071136474609375, -0.06923294067382812, -0.0577545166015625, -0.046276092529296875, -0.03479766845703125, -0.023319244384765625, -0.0118408203125, -0.000362396240234375, 0.01111602783203125, 0.022594451904296875, 0.0340728759765625, 0.045551300048828125, 0.05702972412109375, 0.06850814819335938, 0.079986572265625, 0.09146499633789062, 0.10294342041015625, 0.11442184448242188, 0.1259002685546875, 0.13737869262695312, 0.14885711669921875, 0.16033554077148438, 0.17181396484375, 0.18329238891601562, 0.19477081298828125, 0.20624923706054688, 0.2177276611328125, 0.22920608520507812, 0.24068450927734375, 0.2521629333496094, 0.263641357421875, 0.2751197814941406, 0.28659820556640625, 0.2980766296386719, 0.3095550537109375, 0.3210334777832031, 0.33251190185546875, 0.3439903259277344, 0.35546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 6.0, 3.0, 10.0, 19.0, 19.0, 24.0, 32.0, 32.0, 43.0, 58.0, 94.0, 114.0, 190.0, 228.0, 379.0, 683.0, 757.0, 458.0, 283.0, 164.0, 138.0, 101.0, 62.0, 42.0, 29.0, 22.0, 25.0, 24.0, 13.0, 9.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416015625, -0.40006256103515625, -0.3841094970703125, -0.36815643310546875, -0.352203369140625, -0.33625030517578125, -0.3202972412109375, -0.30434417724609375, -0.28839111328125, -0.27243804931640625, -0.2564849853515625, -0.24053192138671875, -0.224578857421875, -0.20862579345703125, -0.1926727294921875, -0.17671966552734375, -0.1607666015625, -0.14481353759765625, -0.1288604736328125, -0.11290740966796875, -0.096954345703125, -0.08100128173828125, -0.0650482177734375, -0.04909515380859375, -0.03314208984375, -0.01718902587890625, -0.0012359619140625, 0.01471710205078125, 0.030670166015625, 0.04662322998046875, 0.0625762939453125, 0.07852935791015625, 0.094482421875, 0.11043548583984375, 0.1263885498046875, 0.14234161376953125, 0.158294677734375, 0.17424774169921875, 0.1902008056640625, 0.20615386962890625, 0.22210693359375, 0.23805999755859375, 0.2540130615234375, 0.26996612548828125, 0.285919189453125, 0.30187225341796875, 0.3178253173828125, 0.33377838134765625, 0.3497314453125, 0.36568450927734375, 0.3816375732421875, 0.39759063720703125, 0.413543701171875, 0.42949676513671875, 0.4454498291015625, 0.46140289306640625, 0.47735595703125, 0.49330902099609375, 0.5092620849609375, 0.5252151489257812, 0.541168212890625, 0.5571212768554688, 0.5730743408203125, 0.5890274047851562, 0.60498046875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 15.0, 17.0, 43.0, 45.0, 75.0, 100.0, 126.0, 139.0, 112.0, 119.0, 68.0, 56.0, 37.0, 27.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9155347347259521, -1.808927297592163, -1.702319860458374, -1.595712423324585, -1.489104986190796, -1.3824975490570068, -1.2758902311325073, -1.1692827939987183, -1.0626753568649292, -0.9560679197311401, -0.8494604825973511, -0.7428531050682068, -0.6362456679344177, -0.5296382308006287, -0.4230308532714844, -0.3164234161376953, -0.20981597900390625, -0.10320855677127838, 0.0033988654613494873, 0.11000627279281616, 0.21661370992660522, 0.3232211470603943, 0.4298285245895386, 0.5364359617233276, 0.6430433988571167, 0.7496508359909058, 0.8562582731246948, 0.9628656506538391, 1.0694730281829834, 1.1760804653167725, 1.2826879024505615, 1.3892953395843506, 1.4959025382995605, 1.6025099754333496, 1.7091174125671387, 1.8157248497009277, 1.9223322868347168, 2.028939723968506, 2.135547161102295, 2.242154598236084, 2.348762035369873, 2.455369472503662, 2.561976909637451, 2.6685843467712402, 2.7751917839050293, 2.8817992210388184, 2.9884066581726074, 3.0950140953063965, 3.2016212940216064, 3.3082287311553955, 3.4148361682891846, 3.5214436054229736, 3.6280510425567627, 3.7346584796905518, 3.8412656784057617, 3.947873115539551, 4.05448055267334, 4.161087989807129, 4.267695426940918, 4.374302864074707, 4.480910301208496, 4.587517738342285, 4.694125175476074, 4.800732612609863, 4.907340049743652]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 11.0, 3.0, 9.0, 7.0, 11.0, 20.0, 20.0, 21.0, 27.0, 35.0, 24.0, 24.0, 37.0, 40.0, 39.0, 50.0, 48.0, 37.0, 45.0, 44.0, 52.0, 49.0, 50.0, 21.0, 33.0, 28.0, 27.0, 35.0, 23.0, 19.0, 22.0, 14.0, 12.0, 6.0, 9.0, 10.0, 4.0, 7.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.650313377380371, -1.6048355102539062, -1.5593576431274414, -1.5138797760009766, -1.4684019088745117, -1.4229241609573364, -1.3774462938308716, -1.3319684267044067, -1.286490559577942, -1.241012692451477, -1.1955348253250122, -1.1500569581985474, -1.104579210281372, -1.0591013431549072, -1.0136234760284424, -0.9681456089019775, -0.9226677417755127, -0.8771898746490479, -0.831712007522583, -0.7862342000007629, -0.7407563328742981, -0.6952784657478333, -0.6498006582260132, -0.6043227910995483, -0.5588449239730835, -0.5133670568466187, -0.4678892195224762, -0.42241138219833374, -0.3769335150718689, -0.33145564794540405, -0.2859778106212616, -0.24049997329711914, -0.19502222537994385, -0.1495443731546402, -0.10406652092933655, -0.0585886687040329, -0.013110816478729248, 0.0323670357465744, 0.07784488797187805, 0.12332272529602051, 0.16880059242248535, 0.214278444647789, 0.25975629687309265, 0.3052341341972351, 0.35071200132369995, 0.3961898684501648, 0.44166770577430725, 0.4871455430984497, 0.5326234102249146, 0.5781012773513794, 0.6235791444778442, 0.6690569519996643, 0.7145348191261292, 0.760012686252594, 0.8054904937744141, 0.8509683609008789, 0.8964462280273438, 0.9419240951538086, 0.9874019622802734, 1.0328798294067383, 1.0783576965332031, 1.1238354444503784, 1.1693133115768433, 1.214791178703308, 1.260269045829773]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 10.0, 4.0, 5.0, 19.0, 32.0, 39.0, 56.0, 117.0, 137.0, 219.0, 352.0, 550.0, 852.0, 1275.0, 2068.0, 3244.0, 5019.0, 8698.0, 14597.0, 26270.0, 53375.0, 117249.0, 235056.0, 272600.0, 156582.0, 71105.0, 33901.0, 18064.0, 10396.0, 6055.0, 3887.0, 2373.0, 1589.0, 961.0, 639.0, 407.0, 261.0, 184.0, 116.0, 63.0, 40.0, 24.0, 22.0, 18.0, 9.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.334716796875, -0.3246307373046875, -0.314544677734375, -0.3044586181640625, -0.29437255859375, -0.2842864990234375, -0.274200439453125, -0.2641143798828125, -0.2540283203125, -0.2439422607421875, -0.233856201171875, -0.2237701416015625, -0.21368408203125, -0.2035980224609375, -0.193511962890625, -0.1834259033203125, -0.17333984375, -0.1632537841796875, -0.153167724609375, -0.1430816650390625, -0.13299560546875, -0.1229095458984375, -0.112823486328125, -0.1027374267578125, -0.0926513671875, -0.0825653076171875, -0.072479248046875, -0.0623931884765625, -0.05230712890625, -0.0422210693359375, -0.032135009765625, -0.0220489501953125, -0.011962890625, -0.0018768310546875, 0.008209228515625, 0.0182952880859375, 0.02838134765625, 0.0384674072265625, 0.048553466796875, 0.0586395263671875, 0.0687255859375, 0.0788116455078125, 0.088897705078125, 0.0989837646484375, 0.10906982421875, 0.1191558837890625, 0.129241943359375, 0.1393280029296875, 0.1494140625, 0.1595001220703125, 0.169586181640625, 0.1796722412109375, 0.18975830078125, 0.1998443603515625, 0.209930419921875, 0.2200164794921875, 0.2301025390625, 0.2401885986328125, 0.250274658203125, 0.2603607177734375, 0.27044677734375, 0.2805328369140625, 0.290618896484375, 0.3007049560546875, 0.310791015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 5.0, 6.0, 2.0, 11.0, 14.0, 13.0, 12.0, 18.0, 20.0, 16.0, 23.0, 32.0, 31.0, 37.0, 28.0, 38.0, 39.0, 41.0, 42.0, 41.0, 50.0, 40.0, 42.0, 40.0, 54.0, 41.0, 25.0, 31.0, 36.0, 25.0, 27.0, 28.0, 15.0, 15.0, 12.0, 9.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.2099609375, -0.20343589782714844, -0.19691085815429688, -0.1903858184814453, -0.18386077880859375, -0.1773357391357422, -0.17081069946289062, -0.16428565979003906, -0.1577606201171875, -0.15123558044433594, -0.14471054077148438, -0.1381855010986328, -0.13166046142578125, -0.1251354217529297, -0.11861038208007812, -0.11208534240722656, -0.105560302734375, -0.09903526306152344, -0.09251022338867188, -0.08598518371582031, -0.07946014404296875, -0.07293510437011719, -0.06641006469726562, -0.05988502502441406, -0.0533599853515625, -0.04683494567871094, -0.040309906005859375, -0.03378486633300781, -0.02725982666015625, -0.020734786987304688, -0.014209747314453125, -0.0076847076416015625, -0.00115966796875, 0.0053653717041015625, 0.011890411376953125, 0.018415451049804688, 0.02494049072265625, 0.03146553039550781, 0.037990570068359375, 0.04451560974121094, 0.0510406494140625, 0.05756568908691406, 0.06409072875976562, 0.07061576843261719, 0.07714080810546875, 0.08366584777832031, 0.09019088745117188, 0.09671592712402344, 0.103240966796875, 0.10976600646972656, 0.11629104614257812, 0.12281608581542969, 0.12934112548828125, 0.1358661651611328, 0.14239120483398438, 0.14891624450683594, 0.1554412841796875, 0.16196632385253906, 0.16849136352539062, 0.1750164031982422, 0.18154144287109375, 0.1880664825439453, 0.19459152221679688, 0.20111656188964844, 0.2076416015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 14.0, 28.0, 30.0, 60.0, 105.0, 167.0, 402.0, 879.0, 2149.0, 5420.0, 13867.0, 39467.0, 137298.0, 435619.0, 295228.0, 77170.0, 24939.0, 9244.0, 3672.0, 1508.0, 616.0, 290.0, 121.0, 88.0, 53.0, 40.0, 19.0, 13.0, 13.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6494140625, -0.6317596435546875, -0.614105224609375, -0.5964508056640625, -0.57879638671875, -0.5611419677734375, -0.543487548828125, -0.5258331298828125, -0.5081787109375, -0.4905242919921875, -0.472869873046875, -0.4552154541015625, -0.43756103515625, -0.4199066162109375, -0.402252197265625, -0.3845977783203125, -0.366943359375, -0.3492889404296875, -0.331634521484375, -0.3139801025390625, -0.29632568359375, -0.2786712646484375, -0.261016845703125, -0.2433624267578125, -0.2257080078125, -0.2080535888671875, -0.190399169921875, -0.1727447509765625, -0.15509033203125, -0.1374359130859375, -0.119781494140625, -0.1021270751953125, -0.08447265625, -0.0668182373046875, -0.049163818359375, -0.0315093994140625, -0.01385498046875, 0.0037994384765625, 0.021453857421875, 0.0391082763671875, 0.0567626953125, 0.0744171142578125, 0.092071533203125, 0.1097259521484375, 0.12738037109375, 0.1450347900390625, 0.162689208984375, 0.1803436279296875, 0.197998046875, 0.2156524658203125, 0.233306884765625, 0.2509613037109375, 0.26861572265625, 0.2862701416015625, 0.303924560546875, 0.3215789794921875, 0.3392333984375, 0.3568878173828125, 0.374542236328125, 0.3921966552734375, 0.40985107421875, 0.4275054931640625, 0.445159912109375, 0.4628143310546875, 0.48046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 9.0, 9.0, 5.0, 9.0, 13.0, 16.0, 19.0, 16.0, 26.0, 23.0, 25.0, 37.0, 35.0, 46.0, 40.0, 38.0, 44.0, 46.0, 52.0, 41.0, 43.0, 48.0, 37.0, 40.0, 34.0, 41.0, 39.0, 26.0, 24.0, 22.0, 15.0, 14.0, 18.0, 10.0, 8.0, 8.0, 10.0, 5.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.67822265625, -0.6588134765625, -0.639404296875, -0.6199951171875, -0.6005859375, -0.5811767578125, -0.561767578125, -0.5423583984375, -0.52294921875, -0.5035400390625, -0.484130859375, -0.4647216796875, -0.4453125, -0.4259033203125, -0.406494140625, -0.3870849609375, -0.36767578125, -0.3482666015625, -0.328857421875, -0.3094482421875, -0.2900390625, -0.2706298828125, -0.251220703125, -0.2318115234375, -0.21240234375, -0.1929931640625, -0.173583984375, -0.1541748046875, -0.134765625, -0.1153564453125, -0.095947265625, -0.0765380859375, -0.05712890625, -0.0377197265625, -0.018310546875, 0.0010986328125, 0.0205078125, 0.0399169921875, 0.059326171875, 0.0787353515625, 0.09814453125, 0.1175537109375, 0.136962890625, 0.1563720703125, 0.17578125, 0.1951904296875, 0.214599609375, 0.2340087890625, 0.25341796875, 0.2728271484375, 0.292236328125, 0.3116455078125, 0.3310546875, 0.3504638671875, 0.369873046875, 0.3892822265625, 0.40869140625, 0.4281005859375, 0.447509765625, 0.4669189453125, 0.486328125, 0.5057373046875, 0.525146484375, 0.5445556640625, 0.56396484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 15.0, 21.0, 35.0, 48.0, 70.0, 119.0, 169.0, 306.0, 506.0, 971.0, 1844.0, 3608.0, 7151.0, 15089.0, 32620.0, 71192.0, 164916.0, 310309.0, 240949.0, 108055.0, 47624.0, 22055.0, 10332.0, 5025.0, 2486.0, 1335.0, 665.0, 372.0, 223.0, 140.0, 109.0, 52.0, 36.0, 36.0, 15.0, 12.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.17333984375, -0.16820335388183594, -0.16306686401367188, -0.1579303741455078, -0.15279388427734375, -0.1476573944091797, -0.14252090454101562, -0.13738441467285156, -0.1322479248046875, -0.12711143493652344, -0.12197494506835938, -0.11683845520019531, -0.11170196533203125, -0.10656547546386719, -0.10142898559570312, -0.09629249572753906, -0.091156005859375, -0.08601951599121094, -0.08088302612304688, -0.07574653625488281, -0.07061004638671875, -0.06547355651855469, -0.060337066650390625, -0.05520057678222656, -0.0500640869140625, -0.04492759704589844, -0.039791107177734375, -0.03465461730957031, -0.02951812744140625, -0.024381637573242188, -0.019245147705078125, -0.014108657836914062, -0.00897216796875, -0.0038356781005859375, 0.001300811767578125, 0.0064373016357421875, 0.01157379150390625, 0.016710281372070312, 0.021846771240234375, 0.026983261108398438, 0.0321197509765625, 0.03725624084472656, 0.042392730712890625, 0.04752922058105469, 0.05266571044921875, 0.05780220031738281, 0.06293869018554688, 0.06807518005371094, 0.073211669921875, 0.07834815979003906, 0.08348464965820312, 0.08862113952636719, 0.09375762939453125, 0.09889411926269531, 0.10403060913085938, 0.10916709899902344, 0.1143035888671875, 0.11944007873535156, 0.12457656860351562, 0.1297130584716797, 0.13484954833984375, 0.1399860382080078, 0.14512252807617188, 0.15025901794433594, 0.1553955078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 7.0, 8.0, 12.0, 13.0, 12.0, 26.0, 24.0, 68.0, 76.0, 109.0, 140.0, 146.0, 121.0, 58.0, 40.0, 34.0, 34.0, 13.0, 8.0, 8.0, 4.0, 3.0, 11.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7637691497802734e-05, -5.577504634857178e-05, -5.391240119934082e-05, -5.204975605010986e-05, -5.0187110900878906e-05, -4.832446575164795e-05, -4.646182060241699e-05, -4.4599175453186035e-05, -4.273653030395508e-05, -4.087388515472412e-05, -3.9011240005493164e-05, -3.714859485626221e-05, -3.528594970703125e-05, -3.342330455780029e-05, -3.1560659408569336e-05, -2.969801425933838e-05, -2.7835369110107422e-05, -2.5972723960876465e-05, -2.4110078811645508e-05, -2.224743366241455e-05, -2.0384788513183594e-05, -1.8522143363952637e-05, -1.665949821472168e-05, -1.4796853065490723e-05, -1.2934207916259766e-05, -1.1071562767028809e-05, -9.208917617797852e-06, -7.3462724685668945e-06, -5.4836273193359375e-06, -3.6209821701049805e-06, -1.7583370208740234e-06, 1.043081283569336e-07, 1.9669532775878906e-06, 3.829598426818848e-06, 5.692243576049805e-06, 7.554888725280762e-06, 9.417533874511719e-06, 1.1280179023742676e-05, 1.3142824172973633e-05, 1.500546932220459e-05, 1.6868114471435547e-05, 1.8730759620666504e-05, 2.059340476989746e-05, 2.2456049919128418e-05, 2.4318695068359375e-05, 2.6181340217590332e-05, 2.804398536682129e-05, 2.9906630516052246e-05, 3.17692756652832e-05, 3.363192081451416e-05, 3.549456596374512e-05, 3.7357211112976074e-05, 3.921985626220703e-05, 4.108250141143799e-05, 4.2945146560668945e-05, 4.48077917098999e-05, 4.667043685913086e-05, 4.8533082008361816e-05, 5.0395727157592773e-05, 5.225837230682373e-05, 5.412101745605469e-05, 5.5983662605285645e-05, 5.78463077545166e-05, 5.970895290374756e-05, 6.157159805297852e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 5.0, 9.0, 16.0, 24.0, 45.0, 71.0, 106.0, 164.0, 321.0, 602.0, 1084.0, 2124.0, 4580.0, 10466.0, 26325.0, 69021.0, 188991.0, 360267.0, 237548.0, 89252.0, 33358.0, 13131.0, 5726.0, 2605.0, 1170.0, 640.0, 367.0, 193.0, 135.0, 79.0, 43.0, 30.0, 21.0, 12.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.1690654754638672, -0.16271591186523438, -0.15636634826660156, -0.15001678466796875, -0.14366722106933594, -0.13731765747070312, -0.1309680938720703, -0.1246185302734375, -0.11826896667480469, -0.11191940307617188, -0.10556983947753906, -0.09922027587890625, -0.09287071228027344, -0.08652114868164062, -0.08017158508300781, -0.073822021484375, -0.06747245788574219, -0.061122894287109375, -0.05477333068847656, -0.04842376708984375, -0.04207420349121094, -0.035724639892578125, -0.029375076293945312, -0.0230255126953125, -0.016675949096679688, -0.010326385498046875, -0.0039768218994140625, 0.00237274169921875, 0.008722305297851562, 0.015071868896484375, 0.021421432495117188, 0.02777099609375, 0.03412055969238281, 0.040470123291015625, 0.04681968688964844, 0.05316925048828125, 0.05951881408691406, 0.06586837768554688, 0.07221794128417969, 0.0785675048828125, 0.08491706848144531, 0.09126663208007812, 0.09761619567871094, 0.10396575927734375, 0.11031532287597656, 0.11666488647460938, 0.12301445007324219, 0.129364013671875, 0.1357135772705078, 0.14206314086914062, 0.14841270446777344, 0.15476226806640625, 0.16111183166503906, 0.16746139526367188, 0.1738109588623047, 0.1801605224609375, 0.1865100860595703, 0.19285964965820312, 0.19920921325683594, 0.20555877685546875, 0.21190834045410156, 0.21825790405273438, 0.2246074676513672, 0.23095703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 14.0, 11.0, 21.0, 23.0, 31.0, 40.0, 52.0, 48.0, 70.0, 96.0, 100.0, 74.0, 79.0, 59.0, 38.0, 55.0, 36.0, 33.0, 26.0, 13.0, 16.0, 17.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2095947265625, -0.20334815979003906, -0.19710159301757812, -0.1908550262451172, -0.18460845947265625, -0.1783618927001953, -0.17211532592773438, -0.16586875915527344, -0.1596221923828125, -0.15337562561035156, -0.14712905883789062, -0.1408824920654297, -0.13463592529296875, -0.1283893585205078, -0.12214279174804688, -0.11589622497558594, -0.109649658203125, -0.10340309143066406, -0.09715652465820312, -0.09090995788574219, -0.08466339111328125, -0.07841682434082031, -0.07217025756835938, -0.06592369079589844, -0.0596771240234375, -0.05343055725097656, -0.047183990478515625, -0.04093742370605469, -0.03469085693359375, -0.028444290161132812, -0.022197723388671875, -0.015951156616210938, -0.00970458984375, -0.0034580230712890625, 0.002788543701171875, 0.009035110473632812, 0.01528167724609375, 0.021528244018554688, 0.027774810791015625, 0.03402137756347656, 0.0402679443359375, 0.04651451110839844, 0.052761077880859375, 0.05900764465332031, 0.06525421142578125, 0.07150077819824219, 0.07774734497070312, 0.08399391174316406, 0.090240478515625, 0.09648704528808594, 0.10273361206054688, 0.10898017883300781, 0.11522674560546875, 0.12147331237792969, 0.12771987915039062, 0.13396644592285156, 0.1402130126953125, 0.14645957946777344, 0.15270614624023438, 0.1589527130126953, 0.16519927978515625, 0.1714458465576172, 0.17769241333007812, 0.18393898010253906, 0.190185546875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 11.0, 21.0, 31.0, 43.0, 71.0, 102.0, 134.0, 145.0, 135.0, 113.0, 85.0, 47.0, 20.0, 23.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9292144775390625, -2.8419816493988037, -2.754748821258545, -2.667515993118286, -2.5802831649780273, -2.4930505752563477, -2.405817747116089, -2.31858491897583, -2.2313520908355713, -2.1441192626953125, -2.0568864345550537, -1.9696537256240845, -1.8824208974838257, -1.795188069343567, -1.7079553604125977, -1.6207225322723389, -1.53348970413208, -1.4462568759918213, -1.3590240478515625, -1.2717913389205933, -1.1845585107803345, -1.0973256826400757, -1.0100929737091064, -0.9228601455688477, -0.8356273174285889, -0.7483944892883301, -0.6611617207527161, -0.573928952217102, -0.48669612407684326, -0.39946332573890686, -0.31223052740097046, -0.22499775886535645, -0.13776516914367676, -0.050532370805740356, 0.036700427532196045, 0.12393322587013245, 0.21116602420806885, 0.29839882254600525, 0.38563162088394165, 0.47286438941955566, 0.5600972175598145, 0.6473300457000732, 0.7345628142356873, 0.8217955827713013, 0.9090284109115601, 0.9962612390518188, 1.083493947982788, 1.1707267761230469, 1.2579596042633057, 1.3451924324035645, 1.4324252605438232, 1.5196579694747925, 1.6068907976150513, 1.69412362575531, 1.7813563346862793, 1.868589162826538, 1.9558219909667969, 2.0430548191070557, 2.1302876472473145, 2.2175204753875732, 2.304753303527832, 2.3919858932495117, 2.4792187213897705, 2.5664515495300293, 2.653684377670288]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 6.0, 5.0, 3.0, 12.0, 14.0, 10.0, 11.0, 15.0, 19.0, 26.0, 15.0, 24.0, 29.0, 21.0, 40.0, 37.0, 30.0, 35.0, 50.0, 44.0, 29.0, 33.0, 41.0, 39.0, 48.0, 50.0, 36.0, 33.0, 39.0, 33.0, 33.0, 17.0, 19.0, 18.0, 17.0, 8.0, 11.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4986697435379028, -1.4501937627792358, -1.4017176628112793, -1.3532416820526123, -1.3047655820846558, -1.2562896013259888, -1.2078135013580322, -1.1593375205993652, -1.1108615398406982, -1.0623855590820312, -1.0139094591140747, -0.9654334783554077, -0.9169573783874512, -0.8684813976287842, -0.8200053572654724, -0.7715293169021606, -0.7230532169342041, -0.6745771765708923, -0.6261011362075806, -0.5776251554489136, -0.529149055480957, -0.48067304491996765, -0.43219703435897827, -0.3837209939956665, -0.33524495363235474, -0.28676891326904297, -0.2382928878068924, -0.18981686234474182, -0.14134082198143005, -0.09286478161811829, -0.044388771057128906, 0.004087269306182861, 0.05256319046020508, 0.10103922337293625, 0.14951525628566742, 0.197991281747818, 0.24646732211112976, 0.29494336247444153, 0.3434193730354309, 0.3918954133987427, 0.44037145376205444, 0.4888474941253662, 0.537323534488678, 0.5857995748519897, 0.6342755556106567, 0.6827516555786133, 0.7312276363372803, 0.779703676700592, 0.8281797170639038, 0.8766557574272156, 0.9251317977905273, 0.9736077785491943, 1.0220838785171509, 1.0705598592758179, 1.1190359592437744, 1.1675119400024414, 1.2159879207611084, 1.2644639015197754, 1.312940001487732, 1.361415982246399, 1.4098920822143555, 1.4583680629730225, 1.5068440437316895, 1.555320143699646, 1.6037962436676025]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 7.0, 4.0, 13.0, 14.0, 37.0, 46.0, 86.0, 152.0, 280.0, 557.0, 1205.0, 2498.0, 5504.0, 13562.0, 34655.0, 98162.0, 333721.0, 1727240.0, 1531983.0, 299338.0, 90327.0, 32559.0, 12626.0, 5258.0, 2314.0, 1085.0, 499.0, 253.0, 144.0, 70.0, 43.0, 17.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302978515625, -0.2885246276855469, -0.27407073974609375, -0.2596168518066406, -0.2451629638671875, -0.23070907592773438, -0.21625518798828125, -0.20180130004882812, -0.187347412109375, -0.17289352416992188, -0.15843963623046875, -0.14398574829101562, -0.1295318603515625, -0.11507797241210938, -0.10062408447265625, -0.08617019653320312, -0.07171630859375, -0.057262420654296875, -0.04280853271484375, -0.028354644775390625, -0.0139007568359375, 0.000553131103515625, 0.01500701904296875, 0.029460906982421875, 0.043914794921875, 0.058368682861328125, 0.07282257080078125, 0.08727645874023438, 0.1017303466796875, 0.11618423461914062, 0.13063812255859375, 0.14509201049804688, 0.1595458984375, 0.17399978637695312, 0.18845367431640625, 0.20290756225585938, 0.2173614501953125, 0.23181533813476562, 0.24626922607421875, 0.2607231140136719, 0.275177001953125, 0.2896308898925781, 0.30408477783203125, 0.3185386657714844, 0.3329925537109375, 0.3474464416503906, 0.36190032958984375, 0.3763542175292969, 0.39080810546875, 0.4052619934082031, 0.41971588134765625, 0.4341697692871094, 0.4486236572265625, 0.4630775451660156, 0.47753143310546875, 0.4919853210449219, 0.506439208984375, 0.5208930969238281, 0.5353469848632812, 0.5498008728027344, 0.5642547607421875, 0.5787086486816406, 0.5931625366210938, 0.6076164245605469, 0.6220703125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 14.0, 6.0, 8.0, 19.0, 20.0, 23.0, 32.0, 22.0, 22.0, 29.0, 28.0, 38.0, 35.0, 45.0, 52.0, 41.0, 43.0, 40.0, 37.0, 43.0, 48.0, 36.0, 33.0, 33.0, 48.0, 28.0, 23.0, 16.0, 16.0, 21.0, 17.0, 12.0, 14.0, 12.0, 9.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2109375, -0.20439720153808594, -0.19785690307617188, -0.1913166046142578, -0.18477630615234375, -0.1782360076904297, -0.17169570922851562, -0.16515541076660156, -0.1586151123046875, -0.15207481384277344, -0.14553451538085938, -0.1389942169189453, -0.13245391845703125, -0.1259136199951172, -0.11937332153320312, -0.11283302307128906, -0.106292724609375, -0.09975242614746094, -0.09321212768554688, -0.08667182922363281, -0.08013153076171875, -0.07359123229980469, -0.06705093383789062, -0.06051063537597656, -0.0539703369140625, -0.04743003845214844, -0.040889739990234375, -0.03434944152832031, -0.02780914306640625, -0.021268844604492188, -0.014728546142578125, -0.008188247680664062, -0.00164794921875, 0.0048923492431640625, 0.011432647705078125, 0.017972946166992188, 0.02451324462890625, 0.031053543090820312, 0.037593841552734375, 0.04413414001464844, 0.0506744384765625, 0.05721473693847656, 0.06375503540039062, 0.07029533386230469, 0.07683563232421875, 0.08337593078613281, 0.08991622924804688, 0.09645652770996094, 0.102996826171875, 0.10953712463378906, 0.11607742309570312, 0.12261772155761719, 0.12915802001953125, 0.1356983184814453, 0.14223861694335938, 0.14877891540527344, 0.1553192138671875, 0.16185951232910156, 0.16839981079101562, 0.1749401092529297, 0.18148040771484375, 0.1880207061767578, 0.19456100463867188, 0.20110130310058594, 0.2076416015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 12.0, 18.0, 18.0, 29.0, 39.0, 70.0, 105.0, 180.0, 260.0, 390.0, 626.0, 971.0, 1671.0, 2777.0, 4819.0, 8580.0, 15861.0, 29616.0, 58013.0, 117262.0, 255245.0, 644477.0, 1653106.0, 817601.0, 303061.0, 137127.0, 66672.0, 34300.0, 17972.0, 9854.0, 5457.0, 3173.0, 1907.0, 1157.0, 678.0, 399.0, 277.0, 176.0, 114.0, 69.0, 50.0, 28.0, 23.0, 15.0, 10.0, 9.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.309326171875, -0.2998390197753906, -0.29035186767578125, -0.2808647155761719, -0.2713775634765625, -0.2618904113769531, -0.25240325927734375, -0.24291610717773438, -0.233428955078125, -0.22394180297851562, -0.21445465087890625, -0.20496749877929688, -0.1954803466796875, -0.18599319458007812, -0.17650604248046875, -0.16701889038085938, -0.15753173828125, -0.14804458618164062, -0.13855743408203125, -0.12907028198242188, -0.1195831298828125, -0.11009597778320312, -0.10060882568359375, -0.09112167358398438, -0.081634521484375, -0.07214736938476562, -0.06266021728515625, -0.053173065185546875, -0.0436859130859375, -0.034198760986328125, -0.02471160888671875, -0.015224456787109375, -0.0057373046875, 0.003749847412109375, 0.01323699951171875, 0.022724151611328125, 0.0322113037109375, 0.041698455810546875, 0.05118560791015625, 0.060672760009765625, 0.070159912109375, 0.07964706420898438, 0.08913421630859375, 0.09862136840820312, 0.1081085205078125, 0.11759567260742188, 0.12708282470703125, 0.13656997680664062, 0.14605712890625, 0.15554428100585938, 0.16503143310546875, 0.17451858520507812, 0.1840057373046875, 0.19349288940429688, 0.20298004150390625, 0.21246719360351562, 0.221954345703125, 0.23144149780273438, 0.24092864990234375, 0.2504158020019531, 0.2599029541015625, 0.2693901062011719, 0.27887725830078125, 0.2883644104003906, 0.2978515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 9.0, 4.0, 11.0, 16.0, 19.0, 14.0, 18.0, 30.0, 32.0, 44.0, 49.0, 77.0, 71.0, 124.0, 164.0, 199.0, 270.0, 383.0, 506.0, 513.0, 405.0, 242.0, 189.0, 171.0, 94.0, 106.0, 60.0, 56.0, 48.0, 24.0, 37.0, 17.0, 14.0, 11.0, 7.0, 8.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.413330078125, -0.4004058837890625, -0.387481689453125, -0.3745574951171875, -0.36163330078125, -0.3487091064453125, -0.335784912109375, -0.3228607177734375, -0.3099365234375, -0.2970123291015625, -0.284088134765625, -0.2711639404296875, -0.25823974609375, -0.2453155517578125, -0.232391357421875, -0.2194671630859375, -0.20654296875, -0.1936187744140625, -0.180694580078125, -0.1677703857421875, -0.15484619140625, -0.1419219970703125, -0.128997802734375, -0.1160736083984375, -0.1031494140625, -0.0902252197265625, -0.077301025390625, -0.0643768310546875, -0.05145263671875, -0.0385284423828125, -0.025604248046875, -0.0126800537109375, 0.000244140625, 0.0131683349609375, 0.026092529296875, 0.0390167236328125, 0.05194091796875, 0.0648651123046875, 0.077789306640625, 0.0907135009765625, 0.1036376953125, 0.1165618896484375, 0.129486083984375, 0.1424102783203125, 0.15533447265625, 0.1682586669921875, 0.181182861328125, 0.1941070556640625, 0.20703125, 0.2199554443359375, 0.232879638671875, 0.2458038330078125, 0.25872802734375, 0.2716522216796875, 0.284576416015625, 0.2975006103515625, 0.3104248046875, 0.3233489990234375, 0.336273193359375, 0.3491973876953125, 0.36212158203125, 0.3750457763671875, 0.387969970703125, 0.4008941650390625, 0.413818359375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 10.0, 19.0, 28.0, 45.0, 52.0, 71.0, 86.0, 104.0, 111.0, 108.0, 91.0, 86.0, 46.0, 41.0, 37.0, 19.0, 9.0, 13.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.197746515274048, -2.1109507083892822, -2.0241551399230957, -1.93735933303833, -1.8505635261535645, -1.7637677192687988, -1.6769720315933228, -1.5901763439178467, -1.503380537033081, -1.4165847301483154, -1.3297890424728394, -1.2429933547973633, -1.1561975479125977, -1.069401741027832, -0.982606053352356, -0.8958103060722351, -0.8090145587921143, -0.7222188115119934, -0.6354230642318726, -0.5486273169517517, -0.46183156967163086, -0.37503582239151, -0.28824007511138916, -0.2014443278312683, -0.11464858055114746, -0.02785283327102661, 0.05894291400909424, 0.1457386612892151, 0.23253440856933594, 0.3193301558494568, 0.40612590312957764, 0.4929216504096985, 0.5797173976898193, 0.6665131449699402, 0.753308892250061, 0.8401046395301819, 0.9269003868103027, 1.0136961936950684, 1.1004918813705444, 1.1872875690460205, 1.2740833759307861, 1.3608791828155518, 1.4476748704910278, 1.534470558166504, 1.6212663650512695, 1.7080621719360352, 1.7948578596115112, 1.8816535472869873, 1.968449354171753, 2.0552451610565186, 2.142040729522705, 2.2288365364074707, 2.3156323432922363, 2.402428150177002, 2.4892239570617676, 2.576019525527954, 2.6628153324127197, 2.7496111392974854, 2.836406707763672, 2.9232025146484375, 3.009998321533203, 3.0967941284179688, 3.1835899353027344, 3.270385503768921, 3.3571813106536865]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 5.0, 5.0, 11.0, 8.0, 11.0, 8.0, 13.0, 12.0, 23.0, 18.0, 18.0, 22.0, 23.0, 23.0, 38.0, 32.0, 45.0, 32.0, 36.0, 35.0, 48.0, 42.0, 39.0, 29.0, 45.0, 38.0, 30.0, 44.0, 31.0, 23.0, 30.0, 35.0, 32.0, 16.0, 10.0, 14.0, 16.0, 12.0, 8.0, 13.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4809997081756592, -1.435689091682434, -1.3903785943984985, -1.3450679779052734, -1.299757480621338, -1.2544468641281128, -1.2091363668441772, -1.1638257503509521, -1.1185152530670166, -1.0732046365737915, -1.027894139289856, -0.9825835824012756, -0.9372730255126953, -0.891962468624115, -0.8466519117355347, -0.8013412952423096, -0.7560307383537292, -0.7107201814651489, -0.6654096245765686, -0.6200990676879883, -0.574788510799408, -0.5294779539108276, -0.4841673672199249, -0.4388568103313446, -0.3935462534427643, -0.34823569655418396, -0.30292513966560364, -0.2576145529747009, -0.2123040109872818, -0.16699345409870148, -0.12168288230895996, -0.07637232542037964, -0.031061768531799316, 0.014248792082071304, 0.059559352695941925, 0.10486991703510284, 0.15018047392368317, 0.1954910308122635, 0.240801602602005, 0.2861121594905853, 0.33142271637916565, 0.37673327326774597, 0.4220438301563263, 0.467354416847229, 0.5126649737358093, 0.5579755306243896, 0.60328608751297, 0.6485966444015503, 0.6939072012901306, 0.7392177581787109, 0.7845283150672913, 0.8298388719558716, 0.8751494288444519, 0.9204599857330322, 0.9657706022262573, 1.0110810995101929, 1.056391716003418, 1.101702332496643, 1.1470128297805786, 1.1923234462738037, 1.2376339435577393, 1.2829445600509644, 1.3282550573349, 1.373565673828125, 1.4188761711120605]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 17.0, 16.0, 27.0, 35.0, 102.0, 126.0, 160.0, 256.0, 453.0, 599.0, 839.0, 1257.0, 1839.0, 2667.0, 3816.0, 5422.0, 8403.0, 13210.0, 22587.0, 44179.0, 105154.0, 257661.0, 306881.0, 143294.0, 57211.0, 27384.0, 15533.0, 9405.0, 6205.0, 4301.0, 3001.0, 2065.0, 1484.0, 967.0, 654.0, 496.0, 284.0, 195.0, 130.0, 77.0, 53.0, 46.0, 28.0, 9.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0], "bins": [-0.44775390625, -0.43537139892578125, -0.4229888916015625, -0.41060638427734375, -0.398223876953125, -0.38584136962890625, -0.3734588623046875, -0.36107635498046875, -0.34869384765625, -0.33631134033203125, -0.3239288330078125, -0.31154632568359375, -0.299163818359375, -0.28678131103515625, -0.2743988037109375, -0.26201629638671875, -0.2496337890625, -0.23725128173828125, -0.2248687744140625, -0.21248626708984375, -0.200103759765625, -0.18772125244140625, -0.1753387451171875, -0.16295623779296875, -0.15057373046875, -0.13819122314453125, -0.1258087158203125, -0.11342620849609375, -0.101043701171875, -0.08866119384765625, -0.0762786865234375, -0.06389617919921875, -0.051513671875, -0.03913116455078125, -0.0267486572265625, -0.01436614990234375, -0.001983642578125, 0.01039886474609375, 0.0227813720703125, 0.03516387939453125, 0.04754638671875, 0.05992889404296875, 0.0723114013671875, 0.08469390869140625, 0.097076416015625, 0.10945892333984375, 0.1218414306640625, 0.13422393798828125, 0.1466064453125, 0.15898895263671875, 0.1713714599609375, 0.18375396728515625, 0.196136474609375, 0.20851898193359375, 0.2209014892578125, 0.23328399658203125, 0.24566650390625, 0.25804901123046875, 0.2704315185546875, 0.28281402587890625, 0.295196533203125, 0.30757904052734375, 0.3199615478515625, 0.33234405517578125, 0.3447265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 12.0, 7.0, 8.0, 10.0, 8.0, 18.0, 18.0, 18.0, 22.0, 19.0, 24.0, 38.0, 35.0, 33.0, 38.0, 37.0, 35.0, 42.0, 35.0, 30.0, 39.0, 42.0, 40.0, 39.0, 49.0, 35.0, 37.0, 36.0, 28.0, 20.0, 26.0, 27.0, 18.0, 15.0, 17.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.204833984375, -0.19839096069335938, -0.19194793701171875, -0.18550491333007812, -0.1790618896484375, -0.17261886596679688, -0.16617584228515625, -0.15973281860351562, -0.153289794921875, -0.14684677124023438, -0.14040374755859375, -0.13396072387695312, -0.1275177001953125, -0.12107467651367188, -0.11463165283203125, -0.10818862915039062, -0.10174560546875, -0.09530258178710938, -0.08885955810546875, -0.08241653442382812, -0.0759735107421875, -0.06953048706054688, -0.06308746337890625, -0.056644439697265625, -0.050201416015625, -0.043758392333984375, -0.03731536865234375, -0.030872344970703125, -0.0244293212890625, -0.017986297607421875, -0.01154327392578125, -0.005100250244140625, 0.0013427734375, 0.007785797119140625, 0.01422882080078125, 0.020671844482421875, 0.0271148681640625, 0.033557891845703125, 0.04000091552734375, 0.046443939208984375, 0.052886962890625, 0.059329986572265625, 0.06577301025390625, 0.07221603393554688, 0.0786590576171875, 0.08510208129882812, 0.09154510498046875, 0.09798812866210938, 0.10443115234375, 0.11087417602539062, 0.11731719970703125, 0.12376022338867188, 0.1302032470703125, 0.13664627075195312, 0.14308929443359375, 0.14953231811523438, 0.155975341796875, 0.16241836547851562, 0.16886138916015625, 0.17530441284179688, 0.1817474365234375, 0.18819046020507812, 0.19463348388671875, 0.20107650756835938, 0.20751953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 12.0, 13.0, 17.0, 17.0, 38.0, 58.0, 81.0, 109.0, 182.0, 262.0, 545.0, 1092.0, 2226.0, 4922.0, 11396.0, 25914.0, 68499.0, 267720.0, 464745.0, 128306.0, 41023.0, 17099.0, 7417.0, 3465.0, 1575.0, 760.0, 390.0, 200.0, 141.0, 88.0, 64.0, 52.0, 27.0, 25.0, 14.0, 21.0, 7.0, 7.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.70654296875, -0.6865005493164062, -0.6664581298828125, -0.6464157104492188, -0.626373291015625, -0.6063308715820312, -0.5862884521484375, -0.5662460327148438, -0.54620361328125, -0.5261611938476562, -0.5061187744140625, -0.48607635498046875, -0.466033935546875, -0.44599151611328125, -0.4259490966796875, -0.40590667724609375, -0.3858642578125, -0.36582183837890625, -0.3457794189453125, -0.32573699951171875, -0.305694580078125, -0.28565216064453125, -0.2656097412109375, -0.24556732177734375, -0.22552490234375, -0.20548248291015625, -0.1854400634765625, -0.16539764404296875, -0.145355224609375, -0.12531280517578125, -0.1052703857421875, -0.08522796630859375, -0.065185546875, -0.04514312744140625, -0.0251007080078125, -0.00505828857421875, 0.014984130859375, 0.03502655029296875, 0.0550689697265625, 0.07511138916015625, 0.09515380859375, 0.11519622802734375, 0.1352386474609375, 0.15528106689453125, 0.175323486328125, 0.19536590576171875, 0.2154083251953125, 0.23545074462890625, 0.2554931640625, 0.27553558349609375, 0.2955780029296875, 0.31562042236328125, 0.335662841796875, 0.35570526123046875, 0.3757476806640625, 0.39579010009765625, 0.41583251953125, 0.43587493896484375, 0.4559173583984375, 0.47595977783203125, 0.496002197265625, 0.5160446166992188, 0.5360870361328125, 0.5561294555664062, 0.576171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 7.0, 6.0, 6.0, 9.0, 9.0, 12.0, 10.0, 17.0, 25.0, 35.0, 27.0, 40.0, 28.0, 32.0, 34.0, 31.0, 56.0, 42.0, 46.0, 32.0, 44.0, 42.0, 38.0, 42.0, 47.0, 28.0, 35.0, 34.0, 36.0, 16.0, 23.0, 16.0, 19.0, 12.0, 11.0, 9.0, 11.0, 4.0, 6.0, 5.0, 2.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57568359375, -0.5565032958984375, -0.537322998046875, -0.5181427001953125, -0.49896240234375, -0.4797821044921875, -0.460601806640625, -0.4414215087890625, -0.4222412109375, -0.4030609130859375, -0.383880615234375, -0.3647003173828125, -0.34552001953125, -0.3263397216796875, -0.307159423828125, -0.2879791259765625, -0.268798828125, -0.2496185302734375, -0.230438232421875, -0.2112579345703125, -0.19207763671875, -0.1728973388671875, -0.153717041015625, -0.1345367431640625, -0.1153564453125, -0.0961761474609375, -0.076995849609375, -0.0578155517578125, -0.03863525390625, -0.0194549560546875, -0.000274658203125, 0.0189056396484375, 0.0380859375, 0.0572662353515625, 0.076446533203125, 0.0956268310546875, 0.11480712890625, 0.1339874267578125, 0.153167724609375, 0.1723480224609375, 0.1915283203125, 0.2107086181640625, 0.229888916015625, 0.2490692138671875, 0.26824951171875, 0.2874298095703125, 0.306610107421875, 0.3257904052734375, 0.344970703125, 0.3641510009765625, 0.383331298828125, 0.4025115966796875, 0.42169189453125, 0.4408721923828125, 0.460052490234375, 0.4792327880859375, 0.4984130859375, 0.5175933837890625, 0.536773681640625, 0.5559539794921875, 0.57513427734375, 0.5943145751953125, 0.613494873046875, 0.6326751708984375, 0.65185546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 7.0, 7.0, 4.0, 16.0, 20.0, 29.0, 27.0, 45.0, 82.0, 121.0, 195.0, 310.0, 516.0, 858.0, 1359.0, 2040.0, 3258.0, 5313.0, 9259.0, 17039.0, 36104.0, 83861.0, 212199.0, 337122.0, 191449.0, 76356.0, 33076.0, 15713.0, 8600.0, 5079.0, 3124.0, 2031.0, 1239.0, 742.0, 506.0, 293.0, 187.0, 126.0, 87.0, 57.0, 29.0, 21.0, 13.0, 14.0, 3.0, 6.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.144775390625, -0.14017105102539062, -0.13556671142578125, -0.13096237182617188, -0.1263580322265625, -0.12175369262695312, -0.11714935302734375, -0.11254501342773438, -0.107940673828125, -0.10333633422851562, -0.09873199462890625, -0.09412765502929688, -0.0895233154296875, -0.08491897583007812, -0.08031463623046875, -0.07571029663085938, -0.07110595703125, -0.06650161743164062, -0.06189727783203125, -0.057292938232421875, -0.0526885986328125, -0.048084259033203125, -0.04347991943359375, -0.038875579833984375, -0.034271240234375, -0.029666900634765625, -0.02506256103515625, -0.020458221435546875, -0.0158538818359375, -0.011249542236328125, -0.00664520263671875, -0.002040863037109375, 0.0025634765625, 0.007167816162109375, 0.01177215576171875, 0.016376495361328125, 0.0209808349609375, 0.025585174560546875, 0.03018951416015625, 0.034793853759765625, 0.039398193359375, 0.044002532958984375, 0.04860687255859375, 0.053211212158203125, 0.0578155517578125, 0.062419891357421875, 0.06702423095703125, 0.07162857055664062, 0.07623291015625, 0.08083724975585938, 0.08544158935546875, 0.09004592895507812, 0.0946502685546875, 0.09925460815429688, 0.10385894775390625, 0.10846328735351562, 0.113067626953125, 0.11767196655273438, 0.12227630615234375, 0.12688064575195312, 0.1314849853515625, 0.13608932495117188, 0.14069366455078125, 0.14529800415039062, 0.14990234375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 10.0, 30.0, 21.0, 42.0, 70.0, 155.0, 250.0, 184.0, 83.0, 39.0, 31.0, 9.0, 11.0, 10.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.202957153320312e-05, -8.91275703907013e-05, -8.622556924819946e-05, -8.332356810569763e-05, -8.04215669631958e-05, -7.751956582069397e-05, -7.461756467819214e-05, -7.171556353569031e-05, -6.881356239318848e-05, -6.591156125068665e-05, -6.300956010818481e-05, -6.0107558965682983e-05, -5.720555782318115e-05, -5.430355668067932e-05, -5.140155553817749e-05, -4.849955439567566e-05, -4.559755325317383e-05, -4.2695552110672e-05, -3.9793550968170166e-05, -3.6891549825668335e-05, -3.3989548683166504e-05, -3.108754754066467e-05, -2.8185546398162842e-05, -2.528354525566101e-05, -2.238154411315918e-05, -1.947954297065735e-05, -1.6577541828155518e-05, -1.3675540685653687e-05, -1.0773539543151855e-05, -7.871538400650024e-06, -4.969537258148193e-06, -2.0675361156463623e-06, 8.344650268554688e-07, 3.7364661693573e-06, 6.638467311859131e-06, 9.540468454360962e-06, 1.2442469596862793e-05, 1.5344470739364624e-05, 1.8246471881866455e-05, 2.1148473024368286e-05, 2.4050474166870117e-05, 2.6952475309371948e-05, 2.985447645187378e-05, 3.275647759437561e-05, 3.565847873687744e-05, 3.856047987937927e-05, 4.1462481021881104e-05, 4.4364482164382935e-05, 4.7266483306884766e-05, 5.01684844493866e-05, 5.307048559188843e-05, 5.597248673439026e-05, 5.887448787689209e-05, 6.177648901939392e-05, 6.467849016189575e-05, 6.758049130439758e-05, 7.048249244689941e-05, 7.338449358940125e-05, 7.628649473190308e-05, 7.918849587440491e-05, 8.209049701690674e-05, 8.499249815940857e-05, 8.78944993019104e-05, 9.079650044441223e-05, 9.369850158691406e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 1.0, 5.0, 9.0, 10.0, 15.0, 10.0, 16.0, 23.0, 28.0, 45.0, 59.0, 73.0, 121.0, 222.0, 339.0, 531.0, 980.0, 1841.0, 3415.0, 6898.0, 13962.0, 31131.0, 75787.0, 187912.0, 323670.0, 230435.0, 97139.0, 39221.0, 17121.0, 8376.0, 4085.0, 2181.0, 1113.0, 680.0, 394.0, 243.0, 144.0, 90.0, 72.0, 40.0, 38.0, 22.0, 21.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1424560546875, -0.13780593872070312, -0.13315582275390625, -0.12850570678710938, -0.1238555908203125, -0.11920547485351562, -0.11455535888671875, -0.10990524291992188, -0.105255126953125, -0.10060501098632812, -0.09595489501953125, -0.09130477905273438, -0.0866546630859375, -0.08200454711914062, -0.07735443115234375, -0.07270431518554688, -0.06805419921875, -0.06340408325195312, -0.05875396728515625, -0.054103851318359375, -0.0494537353515625, -0.044803619384765625, -0.04015350341796875, -0.035503387451171875, -0.030853271484375, -0.026203155517578125, -0.02155303955078125, -0.016902923583984375, -0.0122528076171875, -0.007602691650390625, -0.00295257568359375, 0.001697540283203125, 0.00634765625, 0.010997772216796875, 0.01564788818359375, 0.020298004150390625, 0.0249481201171875, 0.029598236083984375, 0.03424835205078125, 0.038898468017578125, 0.043548583984375, 0.048198699951171875, 0.05284881591796875, 0.057498931884765625, 0.0621490478515625, 0.06679916381835938, 0.07144927978515625, 0.07609939575195312, 0.08074951171875, 0.08539962768554688, 0.09004974365234375, 0.09469985961914062, 0.0993499755859375, 0.10400009155273438, 0.10865020751953125, 0.11330032348632812, 0.117950439453125, 0.12260055541992188, 0.12725067138671875, 0.13190078735351562, 0.1365509033203125, 0.14120101928710938, 0.14585113525390625, 0.15050125122070312, 0.1551513671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 10.0, 15.0, 14.0, 11.0, 23.0, 35.0, 36.0, 48.0, 77.0, 83.0, 107.0, 107.0, 93.0, 84.0, 61.0, 53.0, 37.0, 24.0, 14.0, 22.0, 9.0, 9.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2103271484375, -0.20372772216796875, -0.1971282958984375, -0.19052886962890625, -0.183929443359375, -0.17733001708984375, -0.1707305908203125, -0.16413116455078125, -0.15753173828125, -0.15093231201171875, -0.1443328857421875, -0.13773345947265625, -0.131134033203125, -0.12453460693359375, -0.1179351806640625, -0.11133575439453125, -0.104736328125, -0.09813690185546875, -0.0915374755859375, -0.08493804931640625, -0.078338623046875, -0.07173919677734375, -0.0651397705078125, -0.05854034423828125, -0.05194091796875, -0.04534149169921875, -0.0387420654296875, -0.03214263916015625, -0.025543212890625, -0.01894378662109375, -0.0123443603515625, -0.00574493408203125, 0.0008544921875, 0.00745391845703125, 0.0140533447265625, 0.02065277099609375, 0.027252197265625, 0.03385162353515625, 0.0404510498046875, 0.04705047607421875, 0.05364990234375, 0.06024932861328125, 0.0668487548828125, 0.07344818115234375, 0.080047607421875, 0.08664703369140625, 0.0932464599609375, 0.09984588623046875, 0.1064453125, 0.11304473876953125, 0.1196441650390625, 0.12624359130859375, 0.132843017578125, 0.13944244384765625, 0.1460418701171875, 0.15264129638671875, 0.15924072265625, 0.16584014892578125, 0.1724395751953125, 0.17903900146484375, 0.185638427734375, 0.19223785400390625, 0.1988372802734375, 0.20543670654296875, 0.2120361328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 17.0, 21.0, 33.0, 51.0, 68.0, 88.0, 70.0, 81.0, 103.0, 79.0, 90.0, 81.0, 56.0, 42.0, 36.0, 25.0, 11.0, 12.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.058450222015381, -1.9919641017913818, -1.9254779815673828, -1.8589919805526733, -1.7925058603286743, -1.7260197401046753, -1.6595337390899658, -1.5930476188659668, -1.5265614986419678, -1.4600753784179688, -1.3935892581939697, -1.3271032571792603, -1.2606171369552612, -1.1941310167312622, -1.1276450157165527, -1.0611588954925537, -0.9946727752685547, -0.9281866550445557, -0.8617005944252014, -0.7952145338058472, -0.7287284135818481, -0.6622422933578491, -0.5957562327384949, -0.5292701721191406, -0.4627840518951416, -0.39629796147346497, -0.32981187105178833, -0.2633257806301117, -0.19683969020843506, -0.13035359978675842, -0.06386750936508179, 0.0026185810565948486, 0.06910467147827148, 0.13559076189994812, 0.20207685232162476, 0.2685629427433014, 0.335049033164978, 0.40153512358665466, 0.4680212140083313, 0.5345072746276855, 0.6009933948516846, 0.6674795150756836, 0.7339655756950378, 0.8004516363143921, 0.8669377565383911, 0.9334238767623901, 0.9999099373817444, 1.0663959980010986, 1.1328821182250977, 1.1993682384490967, 1.2658543586730957, 1.3323403596878052, 1.3988264799118042, 1.4653126001358032, 1.5317986011505127, 1.5982847213745117, 1.6647708415985107, 1.7312569618225098, 1.7977430820465088, 1.8642290830612183, 1.9307152032852173, 1.9972013235092163, 2.063687324523926, 2.130173444747925, 2.196659564971924]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 8.0, 5.0, 11.0, 12.0, 7.0, 16.0, 19.0, 16.0, 17.0, 17.0, 19.0, 25.0, 37.0, 28.0, 30.0, 45.0, 31.0, 40.0, 43.0, 38.0, 60.0, 50.0, 38.0, 35.0, 35.0, 43.0, 35.0, 33.0, 24.0, 28.0, 29.0, 20.0, 16.0, 18.0, 12.0, 7.0, 9.0, 7.0, 6.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4276683330535889, -1.3805620670318604, -1.3334559202194214, -1.2863496541976929, -1.2392433881759644, -1.1921372413635254, -1.1450309753417969, -1.0979247093200684, -1.0508184432983398, -1.0037121772766113, -0.9566059708595276, -0.9094997644424438, -0.8623934984207153, -0.8152872920036316, -0.7681810855865479, -0.7210748195648193, -0.6739686727523804, -0.6268624663352966, -0.5797562003135681, -0.5326499938964844, -0.48554375767707825, -0.4384375214576721, -0.3913313150405884, -0.34422507882118225, -0.2971188426017761, -0.25001260638237, -0.20290638506412506, -0.15580016374588013, -0.108693927526474, -0.06158769130706787, -0.01448148488998413, 0.032624751329422, 0.07973098754882812, 0.12683722376823425, 0.1739434450864792, 0.22104966640472412, 0.26815590262413025, 0.3152621388435364, 0.3623683452606201, 0.40947458148002625, 0.4565808176994324, 0.5036870241165161, 0.5507932901382446, 0.5978994965553284, 0.6450057029724121, 0.6921119689941406, 0.7392181754112244, 0.7863243818283081, 0.8334306478500366, 0.8805368542671204, 0.9276431202888489, 0.9747493267059326, 1.0218555927276611, 1.0689618587493896, 1.1160680055618286, 1.1631742715835571, 1.210280418395996, 1.2573866844177246, 1.3044928312301636, 1.351599097251892, 1.3987053632736206, 1.4458115100860596, 1.492917776107788, 1.5400240421295166, 1.5871303081512451]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 8.0, 13.0, 20.0, 37.0, 54.0, 78.0, 154.0, 236.0, 414.0, 867.0, 1632.0, 3209.0, 7231.0, 16718.0, 40968.0, 108778.0, 354673.0, 1707446.0, 1481594.0, 307568.0, 97087.0, 37012.0, 15480.0, 6618.0, 3043.0, 1526.0, 821.0, 437.0, 217.0, 124.0, 79.0, 55.0, 40.0, 25.0, 6.0, 11.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.266845703125, -0.2546882629394531, -0.24253082275390625, -0.23037338256835938, -0.2182159423828125, -0.20605850219726562, -0.19390106201171875, -0.18174362182617188, -0.169586181640625, -0.15742874145507812, -0.14527130126953125, -0.13311386108398438, -0.1209564208984375, -0.10879898071289062, -0.09664154052734375, -0.08448410034179688, -0.07232666015625, -0.060169219970703125, -0.04801177978515625, -0.035854339599609375, -0.0236968994140625, -0.011539459228515625, 0.00061798095703125, 0.012775421142578125, 0.024932861328125, 0.037090301513671875, 0.04924774169921875, 0.061405181884765625, 0.0735626220703125, 0.08572006225585938, 0.09787750244140625, 0.11003494262695312, 0.1221923828125, 0.13434982299804688, 0.14650726318359375, 0.15866470336914062, 0.1708221435546875, 0.18297958374023438, 0.19513702392578125, 0.20729446411132812, 0.219451904296875, 0.23160934448242188, 0.24376678466796875, 0.2559242248535156, 0.2680816650390625, 0.2802391052246094, 0.29239654541015625, 0.3045539855957031, 0.31671142578125, 0.3288688659667969, 0.34102630615234375, 0.3531837463378906, 0.3653411865234375, 0.3774986267089844, 0.38965606689453125, 0.4018135070800781, 0.413970947265625, 0.4261283874511719, 0.43828582763671875, 0.4504432678222656, 0.4626007080078125, 0.4747581481933594, 0.48691558837890625, 0.4990730285644531, 0.51123046875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 4.0, 11.0, 7.0, 13.0, 11.0, 15.0, 11.0, 17.0, 15.0, 22.0, 23.0, 22.0, 19.0, 34.0, 36.0, 39.0, 41.0, 29.0, 45.0, 41.0, 38.0, 32.0, 44.0, 39.0, 48.0, 34.0, 34.0, 33.0, 20.0, 24.0, 20.0, 23.0, 28.0, 16.0, 12.0, 17.0, 19.0, 6.0, 11.0, 12.0, 7.0, 6.0, 4.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.16796875, -0.16219329833984375, -0.1564178466796875, -0.15064239501953125, -0.144866943359375, -0.13909149169921875, -0.1333160400390625, -0.12754058837890625, -0.12176513671875, -0.11598968505859375, -0.1102142333984375, -0.10443878173828125, -0.098663330078125, -0.09288787841796875, -0.0871124267578125, -0.08133697509765625, -0.0755615234375, -0.06978607177734375, -0.0640106201171875, -0.05823516845703125, -0.052459716796875, -0.04668426513671875, -0.0409088134765625, -0.03513336181640625, -0.02935791015625, -0.02358245849609375, -0.0178070068359375, -0.01203155517578125, -0.006256103515625, -0.00048065185546875, 0.0052947998046875, 0.01107025146484375, 0.016845703125, 0.02262115478515625, 0.0283966064453125, 0.03417205810546875, 0.039947509765625, 0.04572296142578125, 0.0514984130859375, 0.05727386474609375, 0.06304931640625, 0.06882476806640625, 0.0746002197265625, 0.08037567138671875, 0.086151123046875, 0.09192657470703125, 0.0977020263671875, 0.10347747802734375, 0.1092529296875, 0.11502838134765625, 0.1208038330078125, 0.12657928466796875, 0.132354736328125, 0.13813018798828125, 0.1439056396484375, 0.14968109130859375, 0.15545654296875, 0.16123199462890625, 0.1670074462890625, 0.17278289794921875, 0.178558349609375, 0.18433380126953125, 0.1901092529296875, 0.19588470458984375, 0.20166015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 17.0, 24.0, 35.0, 54.0, 105.0, 127.0, 229.0, 355.0, 601.0, 1220.0, 2417.0, 5924.0, 15520.0, 46205.0, 153358.0, 692175.0, 2538330.0, 544356.0, 129757.0, 39734.0, 13636.0, 5265.0, 2297.0, 1114.0, 562.0, 328.0, 205.0, 114.0, 89.0, 37.0, 28.0, 24.0, 6.0, 6.0, 4.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.56982421875, -0.5527801513671875, -0.535736083984375, -0.5186920166015625, -0.50164794921875, -0.4846038818359375, -0.467559814453125, -0.4505157470703125, -0.4334716796875, -0.4164276123046875, -0.399383544921875, -0.3823394775390625, -0.36529541015625, -0.3482513427734375, -0.331207275390625, -0.3141632080078125, -0.297119140625, -0.2800750732421875, -0.263031005859375, -0.2459869384765625, -0.22894287109375, -0.2118988037109375, -0.194854736328125, -0.1778106689453125, -0.1607666015625, -0.1437225341796875, -0.126678466796875, -0.1096343994140625, -0.09259033203125, -0.0755462646484375, -0.058502197265625, -0.0414581298828125, -0.0244140625, -0.0073699951171875, 0.009674072265625, 0.0267181396484375, 0.04376220703125, 0.0608062744140625, 0.077850341796875, 0.0948944091796875, 0.1119384765625, 0.1289825439453125, 0.146026611328125, 0.1630706787109375, 0.18011474609375, 0.1971588134765625, 0.214202880859375, 0.2312469482421875, 0.248291015625, 0.2653350830078125, 0.282379150390625, 0.2994232177734375, 0.31646728515625, 0.3335113525390625, 0.350555419921875, 0.3675994873046875, 0.3846435546875, 0.4016876220703125, 0.418731689453125, 0.4357757568359375, 0.45281982421875, 0.4698638916015625, 0.486907958984375, 0.5039520263671875, 0.52099609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 10.0, 6.0, 13.0, 13.0, 19.0, 24.0, 34.0, 49.0, 61.0, 64.0, 88.0, 148.0, 188.0, 308.0, 465.0, 628.0, 626.0, 378.0, 262.0, 156.0, 126.0, 100.0, 77.0, 56.0, 31.0, 31.0, 26.0, 16.0, 13.0, 13.0, 12.0, 6.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.552734375, -0.536865234375, -0.52099609375, -0.505126953125, -0.4892578125, -0.473388671875, -0.45751953125, -0.441650390625, -0.42578125, -0.409912109375, -0.39404296875, -0.378173828125, -0.3623046875, -0.346435546875, -0.33056640625, -0.314697265625, -0.298828125, -0.282958984375, -0.26708984375, -0.251220703125, -0.2353515625, -0.219482421875, -0.20361328125, -0.187744140625, -0.171875, -0.156005859375, -0.14013671875, -0.124267578125, -0.1083984375, -0.092529296875, -0.07666015625, -0.060791015625, -0.044921875, -0.029052734375, -0.01318359375, 0.002685546875, 0.0185546875, 0.034423828125, 0.05029296875, 0.066162109375, 0.08203125, 0.097900390625, 0.11376953125, 0.129638671875, 0.1455078125, 0.161376953125, 0.17724609375, 0.193115234375, 0.208984375, 0.224853515625, 0.24072265625, 0.256591796875, 0.2724609375, 0.288330078125, 0.30419921875, 0.320068359375, 0.3359375, 0.351806640625, 0.36767578125, 0.383544921875, 0.3994140625, 0.415283203125, 0.43115234375, 0.447021484375, 0.462890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 18.0, 30.0, 64.0, 92.0, 136.0, 153.0, 153.0, 141.0, 89.0, 50.0, 33.0, 19.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.621156692504883, -5.490445613861084, -5.359734535217285, -5.229023456573486, -5.0983123779296875, -4.967601776123047, -4.83689022064209, -4.706179618835449, -4.57546854019165, -4.444757461547852, -4.314046382904053, -4.183335304260254, -4.052624225616455, -3.9219133853912354, -3.7912023067474365, -3.6604912281036377, -3.529780149459839, -3.39906907081604, -3.268357992172241, -3.1376471519470215, -3.0069360733032227, -2.876224994659424, -2.745513916015625, -2.614802837371826, -2.4840917587280273, -2.3533806800842285, -2.2226696014404297, -2.091958522796631, -1.9612476825714111, -1.8305366039276123, -1.6998255252838135, -1.5691144466400146, -1.4384033679962158, -1.307692289352417, -1.1769813299179077, -1.0462702512741089, -0.9155592322349548, -0.7848482131958008, -0.654137134552002, -0.5234261155128479, -0.39271509647369385, -0.2620040774345398, -0.13129302859306335, -0.0005819797515869141, 0.13012903928756714, 0.2608400583267212, 0.39155113697052, 0.5222621560096741, 0.6529731750488281, 0.7836841940879822, 0.9143952131271362, 1.045106291770935, 1.1758172512054443, 1.3065283298492432, 1.437239408493042, 1.5679504871368408, 1.69866144657135, 1.829372525215149, 1.9600834846496582, 2.090794563293457, 2.221505641937256, 2.3522167205810547, 2.4829277992248535, 2.6136386394500732, 2.744349718093872]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 9.0, 7.0, 7.0, 11.0, 7.0, 12.0, 14.0, 18.0, 19.0, 31.0, 28.0, 28.0, 28.0, 27.0, 43.0, 46.0, 43.0, 45.0, 51.0, 35.0, 29.0, 42.0, 42.0, 53.0, 34.0, 43.0, 39.0, 32.0, 33.0, 14.0, 21.0, 14.0, 12.0, 15.0, 6.0, 19.0, 9.0, 8.0, 11.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5673120021820068, -1.5174849033355713, -1.4676578044891357, -1.4178305864334106, -1.368003487586975, -1.3181763887405396, -1.2683491706848145, -1.218522071838379, -1.1686949729919434, -1.1188678741455078, -1.0690407752990723, -1.0192135572433472, -0.9693864583969116, -0.9195593595504761, -0.8697322010993958, -0.8199050426483154, -0.7700779438018799, -0.7202508449554443, -0.670423686504364, -0.6205965280532837, -0.5707694292068481, -0.5209423303604126, -0.4711151719093323, -0.42128804326057434, -0.3714609146118164, -0.32163378596305847, -0.27180665731430054, -0.2219795286655426, -0.17215240001678467, -0.12232527136802673, -0.0724981427192688, -0.022671014070510864, 0.02715611457824707, 0.076983243227005, 0.12681037187576294, 0.17663750052452087, 0.2264646291732788, 0.27629175782203674, 0.3261188864707947, 0.3759460151195526, 0.42577314376831055, 0.4756002724170685, 0.5254274010658264, 0.5752545595169067, 0.6250816583633423, 0.6749087572097778, 0.7247359156608582, 0.7745630741119385, 0.824390172958374, 0.8742172718048096, 0.9240444302558899, 0.9738715887069702, 1.0236986875534058, 1.0735257863998413, 1.1233530044555664, 1.173180103302002, 1.2230072021484375, 1.272834300994873, 1.3226613998413086, 1.3724886178970337, 1.4223157167434692, 1.4721428155899048, 1.5219700336456299, 1.5717971324920654, 1.621624231338501]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 9.0, 11.0, 20.0, 34.0, 46.0, 87.0, 126.0, 215.0, 285.0, 535.0, 816.0, 1253.0, 2042.0, 2976.0, 4698.0, 7168.0, 11502.0, 18714.0, 33136.0, 68169.0, 162104.0, 296028.0, 230345.0, 100438.0, 45011.0, 23682.0, 14027.0, 9014.0, 5738.0, 3733.0, 2395.0, 1554.0, 947.0, 608.0, 437.0, 244.0, 166.0, 96.0, 66.0, 29.0, 11.0, 17.0, 9.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34375, -0.3317832946777344, -0.31981658935546875, -0.3078498840332031, -0.2958831787109375, -0.2839164733886719, -0.27194976806640625, -0.2599830627441406, -0.248016357421875, -0.23604965209960938, -0.22408294677734375, -0.21211624145507812, -0.2001495361328125, -0.18818283081054688, -0.17621612548828125, -0.16424942016601562, -0.15228271484375, -0.14031600952148438, -0.12834930419921875, -0.11638259887695312, -0.1044158935546875, -0.09244918823242188, -0.08048248291015625, -0.06851577758789062, -0.056549072265625, -0.044582366943359375, -0.03261566162109375, -0.020648956298828125, -0.0086822509765625, 0.003284454345703125, 0.01525115966796875, 0.027217864990234375, 0.0391845703125, 0.051151275634765625, 0.06311798095703125, 0.07508468627929688, 0.0870513916015625, 0.09901809692382812, 0.11098480224609375, 0.12295150756835938, 0.134918212890625, 0.14688491821289062, 0.15885162353515625, 0.17081832885742188, 0.1827850341796875, 0.19475173950195312, 0.20671844482421875, 0.21868515014648438, 0.23065185546875, 0.24261856079101562, 0.25458526611328125, 0.2665519714355469, 0.2785186767578125, 0.2904853820800781, 0.30245208740234375, 0.3144187927246094, 0.326385498046875, 0.3383522033691406, 0.35031890869140625, 0.3622856140136719, 0.3742523193359375, 0.3862190246582031, 0.39818572998046875, 0.4101524353027344, 0.422119140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 11.0, 16.0, 14.0, 18.0, 16.0, 21.0, 21.0, 26.0, 26.0, 33.0, 33.0, 37.0, 42.0, 42.0, 33.0, 43.0, 36.0, 45.0, 42.0, 41.0, 39.0, 44.0, 36.0, 35.0, 30.0, 27.0, 25.0, 27.0, 17.0, 16.0, 16.0, 16.0, 16.0, 8.0, 6.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2113037109375, -0.2046833038330078, -0.19806289672851562, -0.19144248962402344, -0.18482208251953125, -0.17820167541503906, -0.17158126831054688, -0.1649608612060547, -0.1583404541015625, -0.1517200469970703, -0.14509963989257812, -0.13847923278808594, -0.13185882568359375, -0.12523841857910156, -0.11861801147460938, -0.11199760437011719, -0.105377197265625, -0.09875679016113281, -0.09213638305664062, -0.08551597595214844, -0.07889556884765625, -0.07227516174316406, -0.06565475463867188, -0.05903434753417969, -0.0524139404296875, -0.04579353332519531, -0.039173126220703125, -0.03255271911621094, -0.02593231201171875, -0.019311904907226562, -0.012691497802734375, -0.0060710906982421875, 0.00054931640625, 0.0071697235107421875, 0.013790130615234375, 0.020410537719726562, 0.02703094482421875, 0.03365135192871094, 0.040271759033203125, 0.04689216613769531, 0.0535125732421875, 0.06013298034667969, 0.06675338745117188, 0.07337379455566406, 0.07999420166015625, 0.08661460876464844, 0.09323501586914062, 0.09985542297363281, 0.106475830078125, 0.11309623718261719, 0.11971664428710938, 0.12633705139160156, 0.13295745849609375, 0.13957786560058594, 0.14619827270507812, 0.1528186798095703, 0.1594390869140625, 0.1660594940185547, 0.17267990112304688, 0.17930030822753906, 0.18592071533203125, 0.19254112243652344, 0.19916152954101562, 0.2057819366455078, 0.21240234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 7.0, 7.0, 8.0, 11.0, 10.0, 18.0, 37.0, 25.0, 50.0, 63.0, 90.0, 128.0, 208.0, 345.0, 627.0, 1252.0, 2535.0, 5695.0, 13849.0, 36563.0, 121051.0, 476892.0, 281936.0, 66568.0, 23310.0, 9378.0, 3973.0, 1796.0, 877.0, 463.0, 259.0, 166.0, 102.0, 66.0, 49.0, 38.0, 28.0, 25.0, 13.0, 19.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.8447265625, -0.8217544555664062, -0.7987823486328125, -0.7758102416992188, -0.752838134765625, -0.7298660278320312, -0.7068939208984375, -0.6839218139648438, -0.66094970703125, -0.6379776000976562, -0.6150054931640625, -0.5920333862304688, -0.569061279296875, -0.5460891723632812, -0.5231170654296875, -0.5001449584960938, -0.4771728515625, -0.45420074462890625, -0.4312286376953125, -0.40825653076171875, -0.385284423828125, -0.36231231689453125, -0.3393402099609375, -0.31636810302734375, -0.29339599609375, -0.27042388916015625, -0.2474517822265625, -0.22447967529296875, -0.201507568359375, -0.17853546142578125, -0.1555633544921875, -0.13259124755859375, -0.109619140625, -0.08664703369140625, -0.0636749267578125, -0.04070281982421875, -0.017730712890625, 0.00524139404296875, 0.0282135009765625, 0.05118560791015625, 0.07415771484375, 0.09712982177734375, 0.1201019287109375, 0.14307403564453125, 0.166046142578125, 0.18901824951171875, 0.2119903564453125, 0.23496246337890625, 0.2579345703125, 0.28090667724609375, 0.3038787841796875, 0.32685089111328125, 0.349822998046875, 0.37279510498046875, 0.3957672119140625, 0.41873931884765625, 0.44171142578125, 0.46468353271484375, 0.4876556396484375, 0.5106277465820312, 0.533599853515625, 0.5565719604492188, 0.5795440673828125, 0.6025161743164062, 0.62548828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 8.0, 9.0, 17.0, 12.0, 23.0, 29.0, 31.0, 43.0, 40.0, 54.0, 51.0, 60.0, 67.0, 68.0, 62.0, 63.0, 53.0, 59.0, 52.0, 33.0, 33.0, 31.0, 20.0, 26.0, 15.0, 13.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.224609375, -1.1919937133789062, -1.1593780517578125, -1.1267623901367188, -1.094146728515625, -1.0615310668945312, -1.0289154052734375, -0.9962997436523438, -0.96368408203125, -0.9310684204101562, -0.8984527587890625, -0.8658370971679688, -0.833221435546875, -0.8006057739257812, -0.7679901123046875, -0.7353744506835938, -0.7027587890625, -0.6701431274414062, -0.6375274658203125, -0.6049118041992188, -0.572296142578125, -0.5396804809570312, -0.5070648193359375, -0.47444915771484375, -0.44183349609375, -0.40921783447265625, -0.3766021728515625, -0.34398651123046875, -0.311370849609375, -0.27875518798828125, -0.2461395263671875, -0.21352386474609375, -0.180908203125, -0.14829254150390625, -0.1156768798828125, -0.08306121826171875, -0.050445556640625, -0.01782989501953125, 0.0147857666015625, 0.04740142822265625, 0.08001708984375, 0.11263275146484375, 0.1452484130859375, 0.17786407470703125, 0.210479736328125, 0.24309539794921875, 0.2757110595703125, 0.30832672119140625, 0.3409423828125, 0.37355804443359375, 0.4061737060546875, 0.43878936767578125, 0.471405029296875, 0.5040206909179688, 0.5366363525390625, 0.5692520141601562, 0.60186767578125, 0.6344833374023438, 0.6670989990234375, 0.6997146606445312, 0.732330322265625, 0.7649459838867188, 0.7975616455078125, 0.8301773071289062, 0.86279296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 8.0, 2.0, 8.0, 6.0, 7.0, 7.0, 29.0, 17.0, 39.0, 57.0, 92.0, 165.0, 247.0, 427.0, 708.0, 1307.0, 2413.0, 4724.0, 9615.0, 19942.0, 44618.0, 114098.0, 342489.0, 321636.0, 105531.0, 42368.0, 19090.0, 9163.0, 4408.0, 2359.0, 1236.0, 713.0, 365.0, 243.0, 133.0, 85.0, 56.0, 34.0, 26.0, 21.0, 17.0, 14.0, 6.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.20068359375, -0.1945953369140625, -0.188507080078125, -0.1824188232421875, -0.17633056640625, -0.1702423095703125, -0.164154052734375, -0.1580657958984375, -0.1519775390625, -0.1458892822265625, -0.139801025390625, -0.1337127685546875, -0.12762451171875, -0.1215362548828125, -0.115447998046875, -0.1093597412109375, -0.103271484375, -0.0971832275390625, -0.091094970703125, -0.0850067138671875, -0.07891845703125, -0.0728302001953125, -0.066741943359375, -0.0606536865234375, -0.0545654296875, -0.0484771728515625, -0.042388916015625, -0.0363006591796875, -0.03021240234375, -0.0241241455078125, -0.018035888671875, -0.0119476318359375, -0.005859375, 0.0002288818359375, 0.006317138671875, 0.0124053955078125, 0.01849365234375, 0.0245819091796875, 0.030670166015625, 0.0367584228515625, 0.0428466796875, 0.0489349365234375, 0.055023193359375, 0.0611114501953125, 0.06719970703125, 0.0732879638671875, 0.079376220703125, 0.0854644775390625, 0.091552734375, 0.0976409912109375, 0.103729248046875, 0.1098175048828125, 0.11590576171875, 0.1219940185546875, 0.128082275390625, 0.1341705322265625, 0.1402587890625, 0.1463470458984375, 0.152435302734375, 0.1585235595703125, 0.16461181640625, 0.1707000732421875, 0.176788330078125, 0.1828765869140625, 0.18896484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 9.0, 2.0, 16.0, 10.0, 22.0, 26.0, 38.0, 80.0, 139.0, 186.0, 178.0, 104.0, 54.0, 27.0, 13.0, 19.0, 16.0, 9.0, 11.0, 10.0, 0.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00010943412780761719, -0.00010660570114850998, -0.00010377727448940277, -0.00010094884783029556, -9.812042117118835e-05, -9.529199451208115e-05, -9.246356785297394e-05, -8.963514119386673e-05, -8.680671453475952e-05, -8.397828787565231e-05, -8.11498612165451e-05, -7.83214345574379e-05, -7.549300789833069e-05, -7.266458123922348e-05, -6.983615458011627e-05, -6.700772792100906e-05, -6.417930126190186e-05, -6.135087460279465e-05, -5.852244794368744e-05, -5.569402128458023e-05, -5.286559462547302e-05, -5.0037167966365814e-05, -4.7208741307258606e-05, -4.43803146481514e-05, -4.155188798904419e-05, -3.872346132993698e-05, -3.589503467082977e-05, -3.3066608011722565e-05, -3.0238181352615356e-05, -2.7409754693508148e-05, -2.458132803440094e-05, -2.175290137529373e-05, -1.8924474716186523e-05, -1.6096048057079315e-05, -1.3267621397972107e-05, -1.0439194738864899e-05, -7.6107680797576904e-06, -4.782341420650482e-06, -1.953914761543274e-06, 8.745118975639343e-07, 3.7029385566711426e-06, 6.531365215778351e-06, 9.359791874885559e-06, 1.2188218533992767e-05, 1.5016645193099976e-05, 1.7845071852207184e-05, 2.0673498511314392e-05, 2.35019251704216e-05, 2.633035182952881e-05, 2.9158778488636017e-05, 3.1987205147743225e-05, 3.481563180685043e-05, 3.764405846595764e-05, 4.047248512506485e-05, 4.330091178417206e-05, 4.6129338443279266e-05, 4.8957765102386475e-05, 5.178619176149368e-05, 5.461461842060089e-05, 5.74430450797081e-05, 6.027147173881531e-05, 6.309989839792252e-05, 6.592832505702972e-05, 6.875675171613693e-05, 7.158517837524414e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 6.0, 9.0, 13.0, 16.0, 21.0, 24.0, 33.0, 50.0, 65.0, 92.0, 142.0, 198.0, 320.0, 465.0, 893.0, 1681.0, 3525.0, 7903.0, 18641.0, 45373.0, 116221.0, 321300.0, 329039.0, 120657.0, 46512.0, 19540.0, 8040.0, 3732.0, 1700.0, 883.0, 490.0, 292.0, 206.0, 138.0, 84.0, 62.0, 62.0, 41.0, 28.0, 23.0, 13.0, 11.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20263671875, -0.19684982299804688, -0.19106292724609375, -0.18527603149414062, -0.1794891357421875, -0.17370223999023438, -0.16791534423828125, -0.16212844848632812, -0.156341552734375, -0.15055465698242188, -0.14476776123046875, -0.13898086547851562, -0.1331939697265625, -0.12740707397460938, -0.12162017822265625, -0.11583328247070312, -0.11004638671875, -0.10425949096679688, -0.09847259521484375, -0.09268569946289062, -0.0868988037109375, -0.08111190795898438, -0.07532501220703125, -0.06953811645507812, -0.063751220703125, -0.057964324951171875, -0.05217742919921875, -0.046390533447265625, -0.0406036376953125, -0.034816741943359375, -0.02902984619140625, -0.023242950439453125, -0.0174560546875, -0.011669158935546875, -0.00588226318359375, -9.5367431640625e-05, 0.0056915283203125, 0.011478424072265625, 0.01726531982421875, 0.023052215576171875, 0.028839111328125, 0.034626007080078125, 0.04041290283203125, 0.046199798583984375, 0.0519866943359375, 0.057773590087890625, 0.06356048583984375, 0.06934738159179688, 0.07513427734375, 0.08092117309570312, 0.08670806884765625, 0.09249496459960938, 0.0982818603515625, 0.10406875610351562, 0.10985565185546875, 0.11564254760742188, 0.121429443359375, 0.12721633911132812, 0.13300323486328125, 0.13879013061523438, 0.1445770263671875, 0.15036392211914062, 0.15615081787109375, 0.16193771362304688, 0.167724609375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 10.0, 7.0, 12.0, 14.0, 22.0, 25.0, 25.0, 28.0, 38.0, 41.0, 55.0, 62.0, 75.0, 78.0, 86.0, 73.0, 53.0, 49.0, 34.0, 34.0, 32.0, 14.0, 20.0, 15.0, 13.0, 11.0, 15.0, 7.0, 8.0, 5.0, 5.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.1500244140625, -0.14404296875, -0.1380615234375, -0.132080078125, -0.1260986328125, -0.1201171875, -0.1141357421875, -0.108154296875, -0.1021728515625, -0.09619140625, -0.0902099609375, -0.084228515625, -0.0782470703125, -0.072265625, -0.0662841796875, -0.060302734375, -0.0543212890625, -0.04833984375, -0.0423583984375, -0.036376953125, -0.0303955078125, -0.0244140625, -0.0184326171875, -0.012451171875, -0.0064697265625, -0.00048828125, 0.0054931640625, 0.011474609375, 0.0174560546875, 0.0234375, 0.0294189453125, 0.035400390625, 0.0413818359375, 0.04736328125, 0.0533447265625, 0.059326171875, 0.0653076171875, 0.0712890625, 0.0772705078125, 0.083251953125, 0.0892333984375, 0.09521484375, 0.1011962890625, 0.107177734375, 0.1131591796875, 0.119140625, 0.1251220703125, 0.131103515625, 0.1370849609375, 0.14306640625, 0.1490478515625, 0.155029296875, 0.1610107421875, 0.1669921875, 0.1729736328125, 0.178955078125, 0.1849365234375, 0.19091796875, 0.1968994140625, 0.202880859375, 0.2088623046875, 0.21484375, 0.2208251953125, 0.226806640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 14.0, 19.0, 62.0, 146.0, 217.0, 230.0, 159.0, 91.0, 34.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.352656841278076, -6.17669153213501, -6.000726222991943, -5.824760913848877, -5.6487956047058105, -5.472830295562744, -5.2968645095825195, -5.120899200439453, -4.944933891296387, -4.76896858215332, -4.593003273010254, -4.4170379638671875, -4.241072654724121, -4.065107345581055, -3.889141798019409, -3.7131764888763428, -3.5372114181518555, -3.361246109008789, -3.1852807998657227, -3.0093154907226562, -2.83335018157959, -2.6573848724365234, -2.481419324874878, -2.3054540157318115, -2.129488706588745, -1.9535233974456787, -1.7775580883026123, -1.6015926599502563, -1.42562735080719, -1.2496620416641235, -1.0736966133117676, -0.8977313041687012, -0.7217655181884766, -0.5458002090454102, -0.369834840297699, -0.1938694715499878, -0.017904162406921387, 0.15806114673614502, 0.334026575088501, 0.5099918842315674, 0.6859571933746338, 0.8619225025177002, 1.0378878116607666, 1.2138532400131226, 1.389818549156189, 1.5657838582992554, 1.7417492866516113, 1.9177145957946777, 2.093679904937744, 2.2696452140808105, 2.445610523223877, 2.6215758323669434, 2.7975411415100098, 2.973506450653076, 3.1494719982147217, 3.325437307357788, 3.5014026165008545, 3.677367925643921, 3.8533332347869873, 4.029298782348633, 4.205264091491699, 4.381229400634766, 4.557194709777832, 4.733160018920898, 4.909125328063965]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 0.0, 4.0, 5.0, 5.0, 13.0, 10.0, 10.0, 13.0, 17.0, 9.0, 25.0, 19.0, 22.0, 34.0, 14.0, 37.0, 25.0, 25.0, 42.0, 39.0, 49.0, 35.0, 31.0, 32.0, 51.0, 34.0, 42.0, 37.0, 36.0, 40.0, 25.0, 29.0, 19.0, 27.0, 19.0, 27.0, 20.0, 16.0, 16.0, 12.0, 11.0, 9.0, 1.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7826440334320068, -1.7286403179168701, -1.674636721611023, -1.6206330060958862, -1.5666292905807495, -1.5126256942749023, -1.4586219787597656, -1.404618263244629, -1.3506145477294922, -1.2966108322143555, -1.2426072359085083, -1.1886035203933716, -1.1345998048782349, -1.0805962085723877, -1.026592493057251, -0.9725887775421143, -0.9185851812362671, -0.8645815253257751, -0.8105778098106384, -0.7565741539001465, -0.7025704383850098, -0.6485667824745178, -0.5945631265640259, -0.5405594110488892, -0.4865557551383972, -0.4325520694255829, -0.37854838371276855, -0.3245447278022766, -0.2705410420894623, -0.21653735637664795, -0.162533700466156, -0.10853001475334167, -0.054526329040527344, -0.0005226507782936096, 0.053481027483940125, 0.10748469829559326, 0.1614883840084076, 0.21549206972122192, 0.26949572563171387, 0.3234994113445282, 0.37750309705734253, 0.43150678277015686, 0.4855104684829712, 0.5395141243934631, 0.5935177803039551, 0.6475214958190918, 0.7015251517295837, 0.7555288076400757, 0.8095325231552124, 0.8635361790657043, 0.9175398945808411, 0.971543550491333, 1.0255472660064697, 1.0795509815216064, 1.1335545778274536, 1.1875582933425903, 1.2415618896484375, 1.2955656051635742, 1.3495692014694214, 1.403572916984558, 1.4575766324996948, 1.511580228805542, 1.5655839443206787, 1.6195876598358154, 1.6735913753509521]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 6.0, 8.0, 13.0, 20.0, 27.0, 29.0, 52.0, 88.0, 138.0, 202.0, 311.0, 493.0, 850.0, 1440.0, 2452.0, 4335.0, 8095.0, 15054.0, 29420.0, 59536.0, 131706.0, 329281.0, 942850.0, 1533463.0, 684014.0, 246965.0, 103852.0, 48384.0, 23998.0, 12197.0, 6481.0, 3484.0, 2015.0, 1200.0, 724.0, 377.0, 259.0, 161.0, 114.0, 65.0, 45.0, 31.0, 25.0, 8.0, 5.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2435302734375, -0.2355060577392578, -0.22748184204101562, -0.21945762634277344, -0.21143341064453125, -0.20340919494628906, -0.19538497924804688, -0.1873607635498047, -0.1793365478515625, -0.1713123321533203, -0.16328811645507812, -0.15526390075683594, -0.14723968505859375, -0.13921546936035156, -0.13119125366210938, -0.12316703796386719, -0.115142822265625, -0.10711860656738281, -0.09909439086914062, -0.09107017517089844, -0.08304595947265625, -0.07502174377441406, -0.06699752807617188, -0.05897331237792969, -0.0509490966796875, -0.04292488098144531, -0.034900665283203125, -0.026876449584960938, -0.01885223388671875, -0.010828018188476562, -0.002803802490234375, 0.0052204132080078125, 0.01324462890625, 0.021268844604492188, 0.029293060302734375, 0.03731727600097656, 0.04534149169921875, 0.05336570739746094, 0.061389923095703125, 0.06941413879394531, 0.0774383544921875, 0.08546257019042969, 0.09348678588867188, 0.10151100158691406, 0.10953521728515625, 0.11755943298339844, 0.12558364868164062, 0.1336078643798828, 0.141632080078125, 0.1496562957763672, 0.15768051147460938, 0.16570472717285156, 0.17372894287109375, 0.18175315856933594, 0.18977737426757812, 0.1978015899658203, 0.2058258056640625, 0.2138500213623047, 0.22187423706054688, 0.22989845275878906, 0.23792266845703125, 0.24594688415527344, 0.2539710998535156, 0.2619953155517578, 0.27001953125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 1.0, 5.0, 2.0, 6.0, 3.0, 8.0, 6.0, 9.0, 6.0, 12.0, 12.0, 11.0, 17.0, 16.0, 20.0, 27.0, 33.0, 26.0, 37.0, 32.0, 27.0, 28.0, 32.0, 31.0, 43.0, 49.0, 51.0, 47.0, 42.0, 30.0, 45.0, 28.0, 31.0, 25.0, 30.0, 21.0, 23.0, 17.0, 20.0, 16.0, 18.0, 12.0, 10.0, 6.0, 6.0, 5.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1776123046875, -0.17143630981445312, -0.16526031494140625, -0.15908432006835938, -0.1529083251953125, -0.14673233032226562, -0.14055633544921875, -0.13438034057617188, -0.128204345703125, -0.12202835083007812, -0.11585235595703125, -0.10967636108398438, -0.1035003662109375, -0.09732437133789062, -0.09114837646484375, -0.08497238159179688, -0.07879638671875, -0.07262039184570312, -0.06644439697265625, -0.060268402099609375, -0.0540924072265625, -0.047916412353515625, -0.04174041748046875, -0.035564422607421875, -0.029388427734375, -0.023212432861328125, -0.01703643798828125, -0.010860443115234375, -0.0046844482421875, 0.001491546630859375, 0.00766754150390625, 0.013843536376953125, 0.02001953125, 0.026195526123046875, 0.03237152099609375, 0.038547515869140625, 0.0447235107421875, 0.050899505615234375, 0.05707550048828125, 0.06325149536132812, 0.069427490234375, 0.07560348510742188, 0.08177947998046875, 0.08795547485351562, 0.0941314697265625, 0.10030746459960938, 0.10648345947265625, 0.11265945434570312, 0.11883544921875, 0.12501144409179688, 0.13118743896484375, 0.13736343383789062, 0.1435394287109375, 0.14971542358398438, 0.15589141845703125, 0.16206741333007812, 0.168243408203125, 0.17441940307617188, 0.18059539794921875, 0.18677139282226562, 0.1929473876953125, 0.19912338256835938, 0.20529937744140625, 0.21147537231445312, 0.2176513671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 8.0, 14.0, 31.0, 30.0, 46.0, 87.0, 127.0, 193.0, 250.0, 457.0, 791.0, 1408.0, 2954.0, 6689.0, 16404.0, 46557.0, 141669.0, 493585.0, 2103897.0, 1012044.0, 245004.0, 76432.0, 26308.0, 10120.0, 4304.0, 2005.0, 1121.0, 625.0, 352.0, 254.0, 169.0, 107.0, 56.0, 38.0, 32.0, 21.0, 15.0, 21.0, 12.0, 8.0, 6.0, 1.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.43994140625, -0.42462921142578125, -0.4093170166015625, -0.39400482177734375, -0.378692626953125, -0.36338043212890625, -0.3480682373046875, -0.33275604248046875, -0.31744384765625, -0.30213165283203125, -0.2868194580078125, -0.27150726318359375, -0.256195068359375, -0.24088287353515625, -0.2255706787109375, -0.21025848388671875, -0.1949462890625, -0.17963409423828125, -0.1643218994140625, -0.14900970458984375, -0.133697509765625, -0.11838531494140625, -0.1030731201171875, -0.08776092529296875, -0.07244873046875, -0.05713653564453125, -0.0418243408203125, -0.02651214599609375, -0.011199951171875, 0.00411224365234375, 0.0194244384765625, 0.03473663330078125, 0.050048828125, 0.06536102294921875, 0.0806732177734375, 0.09598541259765625, 0.111297607421875, 0.12660980224609375, 0.1419219970703125, 0.15723419189453125, 0.17254638671875, 0.18785858154296875, 0.2031707763671875, 0.21848297119140625, 0.233795166015625, 0.24910736083984375, 0.2644195556640625, 0.27973175048828125, 0.2950439453125, 0.31035614013671875, 0.3256683349609375, 0.34098052978515625, 0.356292724609375, 0.37160491943359375, 0.3869171142578125, 0.40222930908203125, 0.41754150390625, 0.43285369873046875, 0.4481658935546875, 0.46347808837890625, 0.478790283203125, 0.49410247802734375, 0.5094146728515625, 0.5247268676757812, 0.5400390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 13.0, 19.0, 28.0, 46.0, 66.0, 90.0, 122.0, 156.0, 237.0, 348.0, 527.0, 693.0, 588.0, 341.0, 225.0, 147.0, 102.0, 81.0, 60.0, 54.0, 35.0, 23.0, 18.0, 9.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5140228271484375, -0.493865966796875, -0.4737091064453125, -0.45355224609375, -0.4333953857421875, -0.413238525390625, -0.3930816650390625, -0.3729248046875, -0.3527679443359375, -0.332611083984375, -0.3124542236328125, -0.29229736328125, -0.2721405029296875, -0.251983642578125, -0.2318267822265625, -0.211669921875, -0.1915130615234375, -0.171356201171875, -0.1511993408203125, -0.13104248046875, -0.1108856201171875, -0.090728759765625, -0.0705718994140625, -0.0504150390625, -0.0302581787109375, -0.010101318359375, 0.0100555419921875, 0.03021240234375, 0.0503692626953125, 0.070526123046875, 0.0906829833984375, 0.11083984375, 0.1309967041015625, 0.151153564453125, 0.1713104248046875, 0.19146728515625, 0.2116241455078125, 0.231781005859375, 0.2519378662109375, 0.2720947265625, 0.2922515869140625, 0.312408447265625, 0.3325653076171875, 0.35272216796875, 0.3728790283203125, 0.393035888671875, 0.4131927490234375, 0.433349609375, 0.4535064697265625, 0.473663330078125, 0.4938201904296875, 0.51397705078125, 0.5341339111328125, 0.554290771484375, 0.5744476318359375, 0.5946044921875, 0.6147613525390625, 0.634918212890625, 0.6550750732421875, 0.67523193359375, 0.6953887939453125, 0.715545654296875, 0.7357025146484375, 0.755859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 13.0, 23.0, 63.0, 74.0, 121.0, 129.0, 145.0, 138.0, 104.0, 83.0, 39.0, 25.0, 15.0, 5.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9223976135253906, -3.7934978008270264, -3.664597988128662, -3.535698413848877, -3.4067986011505127, -3.2778987884521484, -3.1489992141723633, -3.020099401473999, -2.8911995887756348, -2.7622997760772705, -2.6333999633789062, -2.504500389099121, -2.375600576400757, -2.2467007637023926, -2.1178011894226074, -1.9889013767242432, -1.860001564025879, -1.7311017513275146, -1.60220205783844, -1.4733023643493652, -1.344402551651001, -1.2155027389526367, -1.086603045463562, -0.9577032923698425, -0.828803539276123, -0.6999037861824036, -0.5710040330886841, -0.4421042799949646, -0.3132045269012451, -0.18430477380752563, -0.05540502071380615, 0.07349473237991333, 0.2023940086364746, 0.3312937617301941, 0.4601935148239136, 0.5890932679176331, 0.7179930210113525, 0.846892774105072, 0.9757925271987915, 1.1046922206878662, 1.2335920333862305, 1.3624918460845947, 1.4913915395736694, 1.6202912330627441, 1.7491910457611084, 1.8780908584594727, 2.006990432739258, 2.135890245437622, 2.2647900581359863, 2.3936898708343506, 2.522589683532715, 2.6514892578125, 2.7803890705108643, 2.9092888832092285, 3.0381884574890137, 3.167088270187378, 3.295988082885742, 3.4248878955841064, 3.5537877082824707, 3.682687282562256, 3.81158709526062, 3.9404869079589844, 4.0693864822387695, 4.198286533355713, 4.327186107635498]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 9.0, 8.0, 14.0, 12.0, 14.0, 13.0, 19.0, 19.0, 20.0, 35.0, 38.0, 23.0, 32.0, 35.0, 45.0, 40.0, 45.0, 47.0, 46.0, 39.0, 46.0, 51.0, 32.0, 39.0, 30.0, 29.0, 29.0, 25.0, 35.0, 19.0, 17.0, 17.0, 11.0, 13.0, 8.0, 9.0, 13.0, 8.0, 1.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.1739280223846436, -2.1132686138153076, -2.0526092052459717, -1.9919497966766357, -1.9312903881072998, -1.8706309795379639, -1.809971570968628, -1.7493120431900024, -1.6886526346206665, -1.6279932260513306, -1.5673338174819946, -1.5066744089126587, -1.4460150003433228, -1.3853554725646973, -1.3246960639953613, -1.2640366554260254, -1.2033772468566895, -1.1427178382873535, -1.0820584297180176, -1.0213990211486816, -0.9607395529747009, -0.900080144405365, -0.839420735836029, -0.7787612676620483, -0.718101978302002, -0.657442569732666, -0.5967831611633301, -0.5361237525939941, -0.4754642844200134, -0.4148048758506775, -0.35414546728134155, -0.2934860289096832, -0.2328265905380249, -0.17216716706752777, -0.11150775104761124, -0.0508483350276947, 0.00981108844280243, 0.07047051191329956, 0.1311299204826355, 0.19178935885429382, 0.25244876742362976, 0.3131081759929657, 0.373767614364624, 0.43442702293395996, 0.4950864315032959, 0.5557458400726318, 0.6164052486419678, 0.6770647168159485, 0.7377241253852844, 0.7983835339546204, 0.8590429425239563, 0.919702410697937, 0.980361819267273, 1.0410212278366089, 1.1016806364059448, 1.1623400449752808, 1.2229994535446167, 1.2836588621139526, 1.3443182706832886, 1.4049776792526245, 1.4656370878219604, 1.526296615600586, 1.5869560241699219, 1.6476154327392578, 1.7082748413085938]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 8.0, 3.0, 7.0, 14.0, 12.0, 13.0, 18.0, 40.0, 57.0, 72.0, 107.0, 172.0, 254.0, 384.0, 501.0, 826.0, 1262.0, 1891.0, 2827.0, 4252.0, 6505.0, 10039.0, 15177.0, 23480.0, 37822.0, 65282.0, 119097.0, 198675.0, 216936.0, 142443.0, 77853.0, 44726.0, 27253.0, 17297.0, 11388.0, 7449.0, 4933.0, 3221.0, 2087.0, 1447.0, 912.0, 626.0, 392.0, 267.0, 187.0, 108.0, 90.0, 50.0, 38.0, 26.0, 13.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.287841796875, -0.27860260009765625, -0.2693634033203125, -0.26012420654296875, -0.250885009765625, -0.24164581298828125, -0.2324066162109375, -0.22316741943359375, -0.21392822265625, -0.20468902587890625, -0.1954498291015625, -0.18621063232421875, -0.176971435546875, -0.16773223876953125, -0.1584930419921875, -0.14925384521484375, -0.1400146484375, -0.13077545166015625, -0.1215362548828125, -0.11229705810546875, -0.103057861328125, -0.09381866455078125, -0.0845794677734375, -0.07534027099609375, -0.06610107421875, -0.05686187744140625, -0.0476226806640625, -0.03838348388671875, -0.029144287109375, -0.01990509033203125, -0.0106658935546875, -0.00142669677734375, 0.0078125, 0.01705169677734375, 0.0262908935546875, 0.03553009033203125, 0.044769287109375, 0.05400848388671875, 0.0632476806640625, 0.07248687744140625, 0.08172607421875, 0.09096527099609375, 0.1002044677734375, 0.10944366455078125, 0.118682861328125, 0.12792205810546875, 0.1371612548828125, 0.14640045166015625, 0.1556396484375, 0.16487884521484375, 0.1741180419921875, 0.18335723876953125, 0.192596435546875, 0.20183563232421875, 0.2110748291015625, 0.22031402587890625, 0.22955322265625, 0.23879241943359375, 0.2480316162109375, 0.25727081298828125, 0.266510009765625, 0.27574920654296875, 0.2849884033203125, 0.29422760009765625, 0.303466796875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 4.0, 10.0, 15.0, 18.0, 17.0, 20.0, 20.0, 32.0, 25.0, 38.0, 47.0, 34.0, 34.0, 43.0, 45.0, 42.0, 46.0, 43.0, 40.0, 43.0, 44.0, 45.0, 25.0, 31.0, 22.0, 30.0, 27.0, 13.0, 19.0, 23.0, 18.0, 17.0, 18.0, 4.0, 7.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2196044921875, -0.21258544921875, -0.20556640625, -0.19854736328125, -0.1915283203125, -0.18450927734375, -0.177490234375, -0.17047119140625, -0.1634521484375, -0.15643310546875, -0.1494140625, -0.14239501953125, -0.1353759765625, -0.12835693359375, -0.121337890625, -0.11431884765625, -0.1072998046875, -0.10028076171875, -0.09326171875, -0.08624267578125, -0.0792236328125, -0.07220458984375, -0.065185546875, -0.05816650390625, -0.0511474609375, -0.04412841796875, -0.037109375, -0.03009033203125, -0.0230712890625, -0.01605224609375, -0.009033203125, -0.00201416015625, 0.0050048828125, 0.01202392578125, 0.01904296875, 0.02606201171875, 0.0330810546875, 0.04010009765625, 0.047119140625, 0.05413818359375, 0.0611572265625, 0.06817626953125, 0.0751953125, 0.08221435546875, 0.0892333984375, 0.09625244140625, 0.103271484375, 0.11029052734375, 0.1173095703125, 0.12432861328125, 0.13134765625, 0.13836669921875, 0.1453857421875, 0.15240478515625, 0.159423828125, 0.16644287109375, 0.1734619140625, 0.18048095703125, 0.1875, 0.19451904296875, 0.2015380859375, 0.20855712890625, 0.215576171875, 0.22259521484375, 0.2296142578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 16.0, 19.0, 28.0, 40.0, 77.0, 122.0, 250.0, 488.0, 1004.0, 2812.0, 9748.0, 39841.0, 212664.0, 603277.0, 138179.0, 28794.0, 7348.0, 2165.0, 809.0, 359.0, 213.0, 96.0, 73.0, 42.0, 24.0, 21.0, 11.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7314834594726562, -0.6988067626953125, -0.6661300659179688, -0.633453369140625, -0.6007766723632812, -0.5680999755859375, -0.5354232788085938, -0.50274658203125, -0.47006988525390625, -0.4373931884765625, -0.40471649169921875, -0.372039794921875, -0.33936309814453125, -0.3066864013671875, -0.27400970458984375, -0.2413330078125, -0.20865631103515625, -0.1759796142578125, -0.14330291748046875, -0.110626220703125, -0.07794952392578125, -0.0452728271484375, -0.01259613037109375, 0.02008056640625, 0.05275726318359375, 0.0854339599609375, 0.11811065673828125, 0.150787353515625, 0.18346405029296875, 0.2161407470703125, 0.24881744384765625, 0.281494140625, 0.31417083740234375, 0.3468475341796875, 0.37952423095703125, 0.412200927734375, 0.44487762451171875, 0.4775543212890625, 0.5102310180664062, 0.54290771484375, 0.5755844116210938, 0.6082611083984375, 0.6409378051757812, 0.673614501953125, 0.7062911987304688, 0.7389678955078125, 0.7716445922851562, 0.8043212890625, 0.8369979858398438, 0.8696746826171875, 0.9023513793945312, 0.935028076171875, 0.9677047729492188, 1.0003814697265625, 1.0330581665039062, 1.06573486328125, 1.0984115600585938, 1.1310882568359375, 1.1637649536132812, 1.196441650390625, 1.2291183471679688, 1.2617950439453125, 1.2944717407226562, 1.3271484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 4.0, 1.0, 2.0, 8.0, 4.0, 8.0, 10.0, 7.0, 15.0, 18.0, 22.0, 26.0, 35.0, 26.0, 33.0, 43.0, 29.0, 45.0, 42.0, 59.0, 53.0, 39.0, 47.0, 58.0, 47.0, 34.0, 43.0, 29.0, 19.0, 29.0, 39.0, 15.0, 20.0, 18.0, 10.0, 17.0, 11.0, 11.0, 5.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6632537841796875, -0.640472412109375, -0.6176910400390625, -0.59490966796875, -0.5721282958984375, -0.549346923828125, -0.5265655517578125, -0.5037841796875, -0.4810028076171875, -0.458221435546875, -0.4354400634765625, -0.41265869140625, -0.3898773193359375, -0.367095947265625, -0.3443145751953125, -0.321533203125, -0.2987518310546875, -0.275970458984375, -0.2531890869140625, -0.23040771484375, -0.2076263427734375, -0.184844970703125, -0.1620635986328125, -0.1392822265625, -0.1165008544921875, -0.093719482421875, -0.0709381103515625, -0.04815673828125, -0.0253753662109375, -0.002593994140625, 0.0201873779296875, 0.04296875, 0.0657501220703125, 0.088531494140625, 0.1113128662109375, 0.13409423828125, 0.1568756103515625, 0.179656982421875, 0.2024383544921875, 0.2252197265625, 0.2480010986328125, 0.270782470703125, 0.2935638427734375, 0.31634521484375, 0.3391265869140625, 0.361907958984375, 0.3846893310546875, 0.407470703125, 0.4302520751953125, 0.453033447265625, 0.4758148193359375, 0.49859619140625, 0.5213775634765625, 0.544158935546875, 0.5669403076171875, 0.5897216796875, 0.6125030517578125, 0.635284423828125, 0.6580657958984375, 0.68084716796875, 0.7036285400390625, 0.726409912109375, 0.7491912841796875, 0.77197265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 14.0, 27.0, 36.0, 75.0, 151.0, 279.0, 553.0, 1208.0, 3169.0, 8109.0, 22953.0, 79410.0, 340087.0, 436739.0, 109034.0, 29835.0, 10205.0, 3822.0, 1438.0, 679.0, 327.0, 157.0, 92.0, 50.0, 39.0, 23.0, 12.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2936267852783203, -0.2854957580566406, -0.27736473083496094, -0.26923370361328125, -0.26110267639160156, -0.2529716491699219, -0.2448406219482422, -0.2367095947265625, -0.2285785675048828, -0.22044754028320312, -0.21231651306152344, -0.20418548583984375, -0.19605445861816406, -0.18792343139648438, -0.1797924041748047, -0.171661376953125, -0.1635303497314453, -0.15539932250976562, -0.14726829528808594, -0.13913726806640625, -0.13100624084472656, -0.12287521362304688, -0.11474418640136719, -0.1066131591796875, -0.09848213195800781, -0.09035110473632812, -0.08222007751464844, -0.07408905029296875, -0.06595802307128906, -0.057826995849609375, -0.04969596862792969, -0.04156494140625, -0.03343391418457031, -0.025302886962890625, -0.017171859741210938, -0.00904083251953125, -0.0009098052978515625, 0.007221221923828125, 0.015352249145507812, 0.0234832763671875, 0.03161430358886719, 0.039745330810546875, 0.04787635803222656, 0.05600738525390625, 0.06413841247558594, 0.07226943969726562, 0.08040046691894531, 0.088531494140625, 0.09666252136230469, 0.10479354858398438, 0.11292457580566406, 0.12105560302734375, 0.12918663024902344, 0.13731765747070312, 0.1454486846923828, 0.1535797119140625, 0.1617107391357422, 0.16984176635742188, 0.17797279357910156, 0.18610382080078125, 0.19423484802246094, 0.20236587524414062, 0.2104969024658203, 0.2186279296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 4.0, 14.0, 11.0, 18.0, 32.0, 34.0, 70.0, 99.0, 134.0, 170.0, 124.0, 85.0, 53.0, 34.0, 22.0, 15.0, 17.0, 9.0, 4.0, 5.0, 7.0, 4.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.07046890258789e-05, -7.820315659046173e-05, -7.570162415504456e-05, -7.320009171962738e-05, -7.06985592842102e-05, -6.819702684879303e-05, -6.569549441337585e-05, -6.319396197795868e-05, -6.0692429542541504e-05, -5.819089710712433e-05, -5.568936467170715e-05, -5.318783223628998e-05, -5.06862998008728e-05, -4.818476736545563e-05, -4.568323493003845e-05, -4.318170249462128e-05, -4.06801700592041e-05, -3.8178637623786926e-05, -3.567710518836975e-05, -3.3175572752952576e-05, -3.06740403175354e-05, -2.8172507882118225e-05, -2.567097544670105e-05, -2.3169443011283875e-05, -2.06679105758667e-05, -1.8166378140449524e-05, -1.566484570503235e-05, -1.3163313269615173e-05, -1.0661780834197998e-05, -8.160248398780823e-06, -5.6587159633636475e-06, -3.157183527946472e-06, -6.556510925292969e-07, 1.8458813428878784e-06, 4.347413778305054e-06, 6.848946213722229e-06, 9.350478649139404e-06, 1.185201108455658e-05, 1.4353543519973755e-05, 1.685507595539093e-05, 1.9356608390808105e-05, 2.185814082622528e-05, 2.4359673261642456e-05, 2.686120569705963e-05, 2.9362738132476807e-05, 3.186427056789398e-05, 3.436580300331116e-05, 3.686733543872833e-05, 3.936886787414551e-05, 4.187040030956268e-05, 4.437193274497986e-05, 4.6873465180397034e-05, 4.937499761581421e-05, 5.1876530051231384e-05, 5.437806248664856e-05, 5.6879594922065735e-05, 5.938112735748291e-05, 6.188265979290009e-05, 6.438419222831726e-05, 6.688572466373444e-05, 6.938725709915161e-05, 7.188878953456879e-05, 7.439032196998596e-05, 7.689185440540314e-05, 7.939338684082031e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 7.0, 6.0, 7.0, 5.0, 12.0, 21.0, 28.0, 35.0, 63.0, 76.0, 150.0, 182.0, 299.0, 511.0, 806.0, 1686.0, 3543.0, 8016.0, 19666.0, 53594.0, 146844.0, 343560.0, 289629.0, 111796.0, 40333.0, 15307.0, 6198.0, 2857.0, 1378.0, 728.0, 438.0, 253.0, 160.0, 105.0, 62.0, 59.0, 38.0, 29.0, 18.0, 12.0, 14.0, 5.0, 6.0, 7.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.170654296875, -0.1652984619140625, -0.159942626953125, -0.1545867919921875, -0.14923095703125, -0.1438751220703125, -0.138519287109375, -0.1331634521484375, -0.1278076171875, -0.1224517822265625, -0.117095947265625, -0.1117401123046875, -0.10638427734375, -0.1010284423828125, -0.095672607421875, -0.0903167724609375, -0.0849609375, -0.0796051025390625, -0.074249267578125, -0.0688934326171875, -0.06353759765625, -0.0581817626953125, -0.052825927734375, -0.0474700927734375, -0.0421142578125, -0.0367584228515625, -0.031402587890625, -0.0260467529296875, -0.02069091796875, -0.0153350830078125, -0.009979248046875, -0.0046234130859375, 0.000732421875, 0.0060882568359375, 0.011444091796875, 0.0167999267578125, 0.02215576171875, 0.0275115966796875, 0.032867431640625, 0.0382232666015625, 0.0435791015625, 0.0489349365234375, 0.054290771484375, 0.0596466064453125, 0.06500244140625, 0.0703582763671875, 0.075714111328125, 0.0810699462890625, 0.08642578125, 0.0917816162109375, 0.097137451171875, 0.1024932861328125, 0.10784912109375, 0.1132049560546875, 0.118560791015625, 0.1239166259765625, 0.1292724609375, 0.1346282958984375, 0.139984130859375, 0.1453399658203125, 0.15069580078125, 0.1560516357421875, 0.161407470703125, 0.1667633056640625, 0.172119140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 6.0, 13.0, 15.0, 19.0, 31.0, 38.0, 55.0, 61.0, 85.0, 72.0, 110.0, 94.0, 91.0, 66.0, 36.0, 42.0, 34.0, 35.0, 14.0, 18.0, 12.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.21875, -0.21225357055664062, -0.20575714111328125, -0.19926071166992188, -0.1927642822265625, -0.18626785278320312, -0.17977142333984375, -0.17327499389648438, -0.166778564453125, -0.16028213500976562, -0.15378570556640625, -0.14728927612304688, -0.1407928466796875, -0.13429641723632812, -0.12779998779296875, -0.12130355834960938, -0.11480712890625, -0.10831069946289062, -0.10181427001953125, -0.09531784057617188, -0.0888214111328125, -0.08232498168945312, -0.07582855224609375, -0.06933212280273438, -0.062835693359375, -0.056339263916015625, -0.04984283447265625, -0.043346405029296875, -0.0368499755859375, -0.030353546142578125, -0.02385711669921875, -0.017360687255859375, -0.0108642578125, -0.004367828369140625, 0.00212860107421875, 0.008625030517578125, 0.0151214599609375, 0.021617889404296875, 0.02811431884765625, 0.034610748291015625, 0.041107177734375, 0.047603607177734375, 0.05410003662109375, 0.060596466064453125, 0.0670928955078125, 0.07358932495117188, 0.08008575439453125, 0.08658218383789062, 0.09307861328125, 0.09957504272460938, 0.10607147216796875, 0.11256790161132812, 0.1190643310546875, 0.12556076049804688, 0.13205718994140625, 0.13855361938476562, 0.145050048828125, 0.15154647827148438, 0.15804290771484375, 0.16453933715820312, 0.1710357666015625, 0.17753219604492188, 0.18402862548828125, 0.19052505493164062, 0.197021484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 10.0, 25.0, 35.0, 49.0, 71.0, 138.0, 137.0, 156.0, 123.0, 79.0, 69.0, 40.0, 17.0, 12.0, 10.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.483091354370117, -3.380591630935669, -3.2780919075012207, -3.1755921840667725, -3.073092460632324, -2.970592975616455, -2.868093252182007, -2.7655935287475586, -2.6630938053131104, -2.560594081878662, -2.458094358444214, -2.3555946350097656, -2.2530951499938965, -2.150595188140869, -2.048095703125, -1.9455959796905518, -1.8430962562561035, -1.7405965328216553, -1.638096809387207, -1.5355972051620483, -1.4330974817276, -1.3305977582931519, -1.2280981540679932, -1.125598430633545, -1.0230987071990967, -0.9205989837646484, -0.818099319934845, -0.7155996561050415, -0.6130999326705933, -0.510600209236145, -0.40810054540634155, -0.3056008815765381, -0.20310115814208984, -0.10060146450996399, 0.0018982291221618652, 0.10439792275428772, 0.20689761638641357, 0.3093973398208618, 0.4118970036506653, 0.5143966674804688, 0.616896390914917, 0.7193961143493652, 0.8218957781791687, 0.9243954420089722, 1.0268951654434204, 1.1293948888778687, 1.2318944931030273, 1.3343942165374756, 1.4368939399719238, 1.539393663406372, 1.6418933868408203, 1.744392991065979, 1.8468927145004272, 1.9493924379348755, 2.051892042160034, 2.1543917655944824, 2.2568914890289307, 2.359391212463379, 2.461890935897827, 2.5643906593322754, 2.6668901443481445, 2.769390106201172, 2.871889591217041, 2.9743893146514893, 3.0768890380859375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 8.0, 5.0, 6.0, 6.0, 10.0, 10.0, 14.0, 23.0, 17.0, 15.0, 30.0, 14.0, 21.0, 32.0, 41.0, 28.0, 34.0, 46.0, 31.0, 38.0, 42.0, 43.0, 35.0, 34.0, 44.0, 36.0, 33.0, 34.0, 32.0, 32.0, 28.0, 20.0, 34.0, 20.0, 22.0, 19.0, 15.0, 8.0, 7.0, 11.0, 4.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5926952362060547, -1.5439839363098145, -1.4952726364135742, -1.446561336517334, -1.3978500366210938, -1.3491387367248535, -1.3004274368286133, -1.251716136932373, -1.2030048370361328, -1.1542935371398926, -1.1055822372436523, -1.056870937347412, -1.0081596374511719, -0.9594483375549316, -0.9107370972633362, -0.862025797367096, -0.8133145570755005, -0.7646032571792603, -0.71589195728302, -0.6671806573867798, -0.6184693574905396, -0.5697580575942993, -0.5210468173027039, -0.4723355174064636, -0.4236242175102234, -0.37491291761398315, -0.3262016177177429, -0.2774903476238251, -0.22877904772758484, -0.1800677478313446, -0.13135647773742676, -0.08264517784118652, -0.03393387794494629, 0.014777414500713348, 0.06348870694637299, 0.11219999194145203, 0.16091129183769226, 0.2096225917339325, 0.25833386182785034, 0.3070451617240906, 0.3557564616203308, 0.40446776151657104, 0.4531790614128113, 0.5018903017044067, 0.550601601600647, 0.5993129014968872, 0.6480242013931274, 0.6967355012893677, 0.7454468011856079, 0.7941581010818481, 0.8428694009780884, 0.8915807008743286, 0.9402920007705688, 0.9890033006668091, 1.0377144813537598, 1.08642578125, 1.1351370811462402, 1.1838483810424805, 1.2325596809387207, 1.281270980834961, 1.3299822807312012, 1.3786935806274414, 1.4274048805236816, 1.4761161804199219, 1.524827480316162]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 16.0, 16.0, 35.0, 49.0, 55.0, 97.0, 149.0, 262.0, 363.0, 628.0, 1054.0, 1788.0, 3155.0, 5302.0, 9695.0, 17341.0, 33286.0, 64913.0, 138774.0, 329430.0, 812590.0, 1324185.0, 834153.0, 339431.0, 139769.0, 65273.0, 32890.0, 17243.0, 9412.0, 5251.0, 3051.0, 1781.0, 1110.0, 638.0, 401.0, 239.0, 140.0, 99.0, 69.0, 43.0, 31.0, 26.0, 12.0, 8.0, 6.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.2005615234375, -0.1939868927001953, -0.18741226196289062, -0.18083763122558594, -0.17426300048828125, -0.16768836975097656, -0.16111373901367188, -0.1545391082763672, -0.1479644775390625, -0.1413898468017578, -0.13481521606445312, -0.12824058532714844, -0.12166595458984375, -0.11509132385253906, -0.10851669311523438, -0.10194206237792969, -0.095367431640625, -0.08879280090332031, -0.08221817016601562, -0.07564353942871094, -0.06906890869140625, -0.06249427795410156, -0.055919647216796875, -0.04934501647949219, -0.0427703857421875, -0.03619575500488281, -0.029621124267578125, -0.023046493530273438, -0.01647186279296875, -0.009897232055664062, -0.003322601318359375, 0.0032520294189453125, 0.00982666015625, 0.016401290893554688, 0.022975921630859375, 0.029550552368164062, 0.03612518310546875, 0.04269981384277344, 0.049274444580078125, 0.05584907531738281, 0.0624237060546875, 0.06899833679199219, 0.07557296752929688, 0.08214759826660156, 0.08872222900390625, 0.09529685974121094, 0.10187149047851562, 0.10844612121582031, 0.115020751953125, 0.12159538269042969, 0.12817001342773438, 0.13474464416503906, 0.14131927490234375, 0.14789390563964844, 0.15446853637695312, 0.1610431671142578, 0.1676177978515625, 0.1741924285888672, 0.18076705932617188, 0.18734169006347656, 0.19391632080078125, 0.20049095153808594, 0.20706558227539062, 0.2136402130126953, 0.22021484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 7.0, 5.0, 7.0, 4.0, 12.0, 12.0, 18.0, 24.0, 28.0, 25.0, 25.0, 37.0, 29.0, 22.0, 34.0, 38.0, 27.0, 40.0, 42.0, 37.0, 44.0, 38.0, 40.0, 34.0, 42.0, 44.0, 37.0, 26.0, 26.0, 30.0, 25.0, 25.0, 28.0, 17.0, 8.0, 15.0, 12.0, 7.0, 6.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.170166015625, -0.16399765014648438, -0.15782928466796875, -0.15166091918945312, -0.1454925537109375, -0.13932418823242188, -0.13315582275390625, -0.12698745727539062, -0.120819091796875, -0.11465072631835938, -0.10848236083984375, -0.10231399536132812, -0.0961456298828125, -0.08997726440429688, -0.08380889892578125, -0.07764053344726562, -0.07147216796875, -0.06530380249023438, -0.05913543701171875, -0.052967071533203125, -0.0467987060546875, -0.040630340576171875, -0.03446197509765625, -0.028293609619140625, -0.022125244140625, -0.015956878662109375, -0.00978851318359375, -0.003620147705078125, 0.0025482177734375, 0.008716583251953125, 0.01488494873046875, 0.021053314208984375, 0.0272216796875, 0.033390045166015625, 0.03955841064453125, 0.045726776123046875, 0.0518951416015625, 0.058063507080078125, 0.06423187255859375, 0.07040023803710938, 0.076568603515625, 0.08273696899414062, 0.08890533447265625, 0.09507369995117188, 0.1012420654296875, 0.10741043090820312, 0.11357879638671875, 0.11974716186523438, 0.12591552734375, 0.13208389282226562, 0.13825225830078125, 0.14442062377929688, 0.1505889892578125, 0.15675735473632812, 0.16292572021484375, 0.16909408569335938, 0.175262451171875, 0.18143081665039062, 0.18759918212890625, 0.19376754760742188, 0.1999359130859375, 0.20610427856445312, 0.21227264404296875, 0.21844100952148438, 0.224609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 11.0, 15.0, 27.0, 26.0, 44.0, 58.0, 98.0, 120.0, 163.0, 284.0, 409.0, 703.0, 1188.0, 2456.0, 5112.0, 12398.0, 34283.0, 104178.0, 350703.0, 1561199.0, 1597131.0, 358796.0, 106474.0, 34875.0, 12679.0, 5304.0, 2449.0, 1178.0, 676.0, 414.0, 265.0, 178.0, 129.0, 67.0, 47.0, 41.0, 31.0, 22.0, 14.0, 15.0, 6.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.431884765625, -0.4183921813964844, -0.40489959716796875, -0.3914070129394531, -0.3779144287109375, -0.3644218444824219, -0.35092926025390625, -0.3374366760253906, -0.323944091796875, -0.3104515075683594, -0.29695892333984375, -0.2834663391113281, -0.2699737548828125, -0.2564811706542969, -0.24298858642578125, -0.22949600219726562, -0.21600341796875, -0.20251083374023438, -0.18901824951171875, -0.17552566528320312, -0.1620330810546875, -0.14854049682617188, -0.13504791259765625, -0.12155532836914062, -0.108062744140625, -0.09457015991210938, -0.08107757568359375, -0.06758499145507812, -0.0540924072265625, -0.040599822998046875, -0.02710723876953125, -0.013614654541015625, -0.0001220703125, 0.013370513916015625, 0.02686309814453125, 0.040355682373046875, 0.0538482666015625, 0.06734085083007812, 0.08083343505859375, 0.09432601928710938, 0.107818603515625, 0.12131118774414062, 0.13480377197265625, 0.14829635620117188, 0.1617889404296875, 0.17528152465820312, 0.18877410888671875, 0.20226669311523438, 0.21575927734375, 0.22925186157226562, 0.24274444580078125, 0.2562370300292969, 0.2697296142578125, 0.2832221984863281, 0.29671478271484375, 0.3102073669433594, 0.323699951171875, 0.3371925354003906, 0.35068511962890625, 0.3641777038574219, 0.3776702880859375, 0.3911628723144531, 0.40465545654296875, 0.4181480407714844, 0.431640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 1.0, 3.0, 8.0, 8.0, 8.0, 11.0, 14.0, 11.0, 8.0, 22.0, 35.0, 32.0, 29.0, 33.0, 52.0, 71.0, 79.0, 107.0, 106.0, 141.0, 168.0, 226.0, 283.0, 365.0, 389.0, 325.0, 290.0, 237.0, 179.0, 157.0, 127.0, 97.0, 87.0, 71.0, 50.0, 44.0, 41.0, 31.0, 20.0, 16.0, 22.0, 8.0, 9.0, 12.0, 12.0, 10.0, 5.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.3193359375, -0.30954742431640625, -0.2997589111328125, -0.28997039794921875, -0.280181884765625, -0.27039337158203125, -0.2606048583984375, -0.25081634521484375, -0.24102783203125, -0.23123931884765625, -0.2214508056640625, -0.21166229248046875, -0.201873779296875, -0.19208526611328125, -0.1822967529296875, -0.17250823974609375, -0.1627197265625, -0.15293121337890625, -0.1431427001953125, -0.13335418701171875, -0.123565673828125, -0.11377716064453125, -0.1039886474609375, -0.09420013427734375, -0.08441162109375, -0.07462310791015625, -0.0648345947265625, -0.05504608154296875, -0.045257568359375, -0.03546905517578125, -0.0256805419921875, -0.01589202880859375, -0.006103515625, 0.00368499755859375, 0.0134735107421875, 0.02326202392578125, 0.033050537109375, 0.04283905029296875, 0.0526275634765625, 0.06241607666015625, 0.07220458984375, 0.08199310302734375, 0.0917816162109375, 0.10157012939453125, 0.111358642578125, 0.12114715576171875, 0.1309356689453125, 0.14072418212890625, 0.1505126953125, 0.16030120849609375, 0.1700897216796875, 0.17987823486328125, 0.189666748046875, 0.19945526123046875, 0.2092437744140625, 0.21903228759765625, 0.22882080078125, 0.23860931396484375, 0.2483978271484375, 0.25818634033203125, 0.267974853515625, 0.27776336669921875, 0.2875518798828125, 0.29734039306640625, 0.30712890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 8.0, 28.0, 37.0, 78.0, 117.0, 136.0, 192.0, 138.0, 116.0, 75.0, 28.0, 22.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.516013145446777, -4.381528854370117, -4.247044086456299, -4.112559795379639, -3.9780752658843994, -3.84359073638916, -3.7091064453125, -3.5746219158172607, -3.4401373863220215, -3.3056528568267822, -3.171168565750122, -3.036684036254883, -2.9021995067596436, -2.7677149772644043, -2.633230686187744, -2.498746156692505, -2.3642618656158447, -2.2297773361206055, -2.0952930450439453, -1.960808515548706, -1.8263239860534668, -1.691839575767517, -1.5573551654815674, -1.4228706359863281, -1.2883862257003784, -1.1539018154144287, -1.0194172859191895, -0.8849328756332397, -0.7504484057426453, -0.6159639358520508, -0.4814795255661011, -0.3469950556755066, -0.2125105857849121, -0.07802613079547882, 0.05645832419395447, 0.19094276428222656, 0.32542723417282104, 0.4599117040634155, 0.5943961143493652, 0.7288805842399597, 0.8633650541305542, 0.9978495240211487, 1.1323339939117432, 1.2668184041976929, 1.4013028144836426, 1.5357873439788818, 1.6702717542648315, 1.8047561645507812, 1.9392406940460205, 2.0737252235412598, 2.20820951461792, 2.342694044113159, 2.4771785736083984, 2.6116628646850586, 2.746147394180298, 2.880631923675537, 3.0151162147521973, 3.1496007442474365, 3.2840850353240967, 3.418569564819336, 3.553054094314575, 3.6875386238098145, 3.8220229148864746, 3.956507444381714, 4.090991973876953]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 9.0, 4.0, 7.0, 8.0, 11.0, 16.0, 15.0, 15.0, 20.0, 20.0, 24.0, 25.0, 22.0, 36.0, 31.0, 32.0, 30.0, 30.0, 38.0, 35.0, 44.0, 57.0, 33.0, 43.0, 37.0, 31.0, 29.0, 38.0, 22.0, 40.0, 20.0, 35.0, 22.0, 19.0, 10.0, 22.0, 12.0, 12.0, 7.0, 6.0, 3.0, 6.0, 6.0, 5.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.4504894018173218, -1.4076894521713257, -1.36488938331604, -1.322089433670044, -1.2792894840240479, -1.2364894151687622, -1.1936894655227661, -1.1508893966674805, -1.1080894470214844, -1.0652894973754883, -1.0224894285202026, -0.9796894788742065, -0.9368894696235657, -0.8940894603729248, -0.8512895107269287, -0.8084895014762878, -0.7656895518302917, -0.7228895425796509, -0.6800895929336548, -0.6372895836830139, -0.594489574432373, -0.551689624786377, -0.5088896155357361, -0.4660896062850952, -0.42328962683677673, -0.38048964738845825, -0.3376896381378174, -0.2948896586894989, -0.2520896792411804, -0.20928966999053955, -0.16648969054222107, -0.1236896812915802, -0.08088970184326172, -0.03808971121907234, 0.004710279405117035, 0.04751026630401611, 0.09031026065349579, 0.13311025500297546, 0.17591023445129395, 0.21871024370193481, 0.2615102231502533, 0.3043102025985718, 0.34711021184921265, 0.38991019129753113, 0.4327101707458496, 0.4755101799964905, 0.5183101892471313, 0.5611101388931274, 0.6039101481437683, 0.6467101573944092, 0.6895101070404053, 0.7323101162910461, 0.775110125541687, 0.8179100751876831, 0.860710084438324, 0.9035100936889648, 0.9463100433349609, 0.9891100525856018, 1.0319100618362427, 1.0747100114822388, 1.1175099611282349, 1.1603100299835205, 1.2031099796295166, 1.2459099292755127, 1.2887099981307983]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 14.0, 22.0, 35.0, 63.0, 82.0, 138.0, 194.0, 327.0, 518.0, 925.0, 1622.0, 2916.0, 5078.0, 9421.0, 17713.0, 33509.0, 61700.0, 107216.0, 161197.0, 193751.0, 173283.0, 121252.0, 71924.0, 39145.0, 21061.0, 11280.0, 6134.0, 3361.0, 1919.0, 1072.0, 642.0, 379.0, 228.0, 162.0, 78.0, 62.0, 43.0, 19.0, 12.0, 6.0, 3.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22093772888183594, -0.21348190307617188, -0.2060260772705078, -0.19857025146484375, -0.1911144256591797, -0.18365859985351562, -0.17620277404785156, -0.1687469482421875, -0.16129112243652344, -0.15383529663085938, -0.1463794708251953, -0.13892364501953125, -0.1314678192138672, -0.12401199340820312, -0.11655616760253906, -0.109100341796875, -0.10164451599121094, -0.09418869018554688, -0.08673286437988281, -0.07927703857421875, -0.07182121276855469, -0.06436538696289062, -0.05690956115722656, -0.0494537353515625, -0.04199790954589844, -0.034542083740234375, -0.027086257934570312, -0.01963043212890625, -0.012174606323242188, -0.004718780517578125, 0.0027370452880859375, 0.01019287109375, 0.017648696899414062, 0.025104522705078125, 0.03256034851074219, 0.04001617431640625, 0.04747200012207031, 0.054927825927734375, 0.06238365173339844, 0.0698394775390625, 0.07729530334472656, 0.08475112915039062, 0.09220695495605469, 0.09966278076171875, 0.10711860656738281, 0.11457443237304688, 0.12203025817871094, 0.129486083984375, 0.13694190979003906, 0.14439773559570312, 0.1518535614013672, 0.15930938720703125, 0.1667652130126953, 0.17422103881835938, 0.18167686462402344, 0.1891326904296875, 0.19658851623535156, 0.20404434204101562, 0.2115001678466797, 0.21895599365234375, 0.2264118194580078, 0.23386764526367188, 0.24132347106933594, 0.248779296875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 13.0, 13.0, 17.0, 12.0, 12.0, 25.0, 25.0, 29.0, 37.0, 22.0, 36.0, 34.0, 46.0, 42.0, 33.0, 46.0, 45.0, 46.0, 46.0, 43.0, 33.0, 36.0, 34.0, 37.0, 28.0, 33.0, 30.0, 19.0, 14.0, 15.0, 24.0, 12.0, 17.0, 9.0, 6.0, 2.0, 6.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1800537109375, -0.1735706329345703, -0.16708755493164062, -0.16060447692871094, -0.15412139892578125, -0.14763832092285156, -0.14115524291992188, -0.1346721649169922, -0.1281890869140625, -0.12170600891113281, -0.11522293090820312, -0.10873985290527344, -0.10225677490234375, -0.09577369689941406, -0.08929061889648438, -0.08280754089355469, -0.076324462890625, -0.06984138488769531, -0.06335830688476562, -0.05687522888183594, -0.05039215087890625, -0.04390907287597656, -0.037425994873046875, -0.030942916870117188, -0.0244598388671875, -0.017976760864257812, -0.011493682861328125, -0.0050106048583984375, 0.00147247314453125, 0.007955551147460938, 0.014438629150390625, 0.020921707153320312, 0.02740478515625, 0.03388786315917969, 0.040370941162109375, 0.04685401916503906, 0.05333709716796875, 0.05982017517089844, 0.06630325317382812, 0.07278633117675781, 0.0792694091796875, 0.08575248718261719, 0.09223556518554688, 0.09871864318847656, 0.10520172119140625, 0.11168479919433594, 0.11816787719726562, 0.12465095520019531, 0.131134033203125, 0.1376171112060547, 0.14410018920898438, 0.15058326721191406, 0.15706634521484375, 0.16354942321777344, 0.17003250122070312, 0.1765155792236328, 0.1829986572265625, 0.1894817352294922, 0.19596481323242188, 0.20244789123535156, 0.20893096923828125, 0.21541404724121094, 0.22189712524414062, 0.2283802032470703, 0.23486328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 6.0, 15.0, 20.0, 24.0, 38.0, 65.0, 105.0, 222.0, 504.0, 1119.0, 3552.0, 12621.0, 53089.0, 231107.0, 469576.0, 211662.0, 48124.0, 11421.0, 3288.0, 1111.0, 370.0, 226.0, 102.0, 56.0, 38.0, 32.0, 19.0, 8.0, 6.0, 5.0, 5.0, 4.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.572265625, -0.5534820556640625, -0.534698486328125, -0.5159149169921875, -0.49713134765625, -0.4783477783203125, -0.459564208984375, -0.4407806396484375, -0.4219970703125, -0.4032135009765625, -0.384429931640625, -0.3656463623046875, -0.34686279296875, -0.3280792236328125, -0.309295654296875, -0.2905120849609375, -0.271728515625, -0.2529449462890625, -0.234161376953125, -0.2153778076171875, -0.19659423828125, -0.1778106689453125, -0.159027099609375, -0.1402435302734375, -0.1214599609375, -0.1026763916015625, -0.083892822265625, -0.0651092529296875, -0.04632568359375, -0.0275421142578125, -0.008758544921875, 0.0100250244140625, 0.02880859375, 0.0475921630859375, 0.066375732421875, 0.0851593017578125, 0.10394287109375, 0.1227264404296875, 0.141510009765625, 0.1602935791015625, 0.1790771484375, 0.1978607177734375, 0.216644287109375, 0.2354278564453125, 0.25421142578125, 0.2729949951171875, 0.291778564453125, 0.3105621337890625, 0.329345703125, 0.3481292724609375, 0.366912841796875, 0.3856964111328125, 0.40447998046875, 0.4232635498046875, 0.442047119140625, 0.4608306884765625, 0.4796142578125, 0.4983978271484375, 0.517181396484375, 0.5359649658203125, 0.55474853515625, 0.5735321044921875, 0.592315673828125, 0.6110992431640625, 0.6298828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 4.0, 7.0, 9.0, 9.0, 15.0, 16.0, 21.0, 16.0, 27.0, 32.0, 26.0, 41.0, 32.0, 43.0, 43.0, 40.0, 43.0, 50.0, 49.0, 32.0, 51.0, 41.0, 48.0, 47.0, 25.0, 24.0, 31.0, 31.0, 21.0, 15.0, 29.0, 18.0, 6.0, 7.0, 13.0, 6.0, 4.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.65673828125, -0.6382064819335938, -0.6196746826171875, -0.6011428833007812, -0.582611083984375, -0.5640792846679688, -0.5455474853515625, -0.5270156860351562, -0.50848388671875, -0.48995208740234375, -0.4714202880859375, -0.45288848876953125, -0.434356689453125, -0.41582489013671875, -0.3972930908203125, -0.37876129150390625, -0.3602294921875, -0.34169769287109375, -0.3231658935546875, -0.30463409423828125, -0.286102294921875, -0.26757049560546875, -0.2490386962890625, -0.23050689697265625, -0.21197509765625, -0.19344329833984375, -0.1749114990234375, -0.15637969970703125, -0.137847900390625, -0.11931610107421875, -0.1007843017578125, -0.08225250244140625, -0.063720703125, -0.04518890380859375, -0.0266571044921875, -0.00812530517578125, 0.010406494140625, 0.02893829345703125, 0.0474700927734375, 0.06600189208984375, 0.08453369140625, 0.10306549072265625, 0.1215972900390625, 0.14012908935546875, 0.158660888671875, 0.17719268798828125, 0.1957244873046875, 0.21425628662109375, 0.2327880859375, 0.25131988525390625, 0.2698516845703125, 0.28838348388671875, 0.306915283203125, 0.32544708251953125, 0.3439788818359375, 0.36251068115234375, 0.38104248046875, 0.39957427978515625, 0.4181060791015625, 0.43663787841796875, 0.455169677734375, 0.47370147705078125, 0.4922332763671875, 0.5107650756835938, 0.529296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 18.0, 27.0, 36.0, 35.0, 49.0, 113.0, 142.0, 247.0, 330.0, 604.0, 1057.0, 1818.0, 3542.0, 7103.0, 15579.0, 36163.0, 85685.0, 183725.0, 274149.0, 227294.0, 118487.0, 50960.0, 21529.0, 9552.0, 4707.0, 2306.0, 1259.0, 784.0, 439.0, 282.0, 173.0, 120.0, 89.0, 45.0, 28.0, 26.0, 18.0, 8.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.12944984436035156, -0.12523269653320312, -0.12101554870605469, -0.11679840087890625, -0.11258125305175781, -0.10836410522460938, -0.10414695739746094, -0.0999298095703125, -0.09571266174316406, -0.09149551391601562, -0.08727836608886719, -0.08306121826171875, -0.07884407043457031, -0.07462692260742188, -0.07040977478027344, -0.066192626953125, -0.06197547912597656, -0.057758331298828125, -0.05354118347167969, -0.04932403564453125, -0.04510688781738281, -0.040889739990234375, -0.03667259216308594, -0.0324554443359375, -0.028238296508789062, -0.024021148681640625, -0.019804000854492188, -0.01558685302734375, -0.011369705200195312, -0.007152557373046875, -0.0029354095458984375, 0.00128173828125, 0.0054988861083984375, 0.009716033935546875, 0.013933181762695312, 0.01815032958984375, 0.022367477416992188, 0.026584625244140625, 0.030801773071289062, 0.0350189208984375, 0.03923606872558594, 0.043453216552734375, 0.04767036437988281, 0.05188751220703125, 0.05610466003417969, 0.060321807861328125, 0.06453895568847656, 0.068756103515625, 0.07297325134277344, 0.07719039916992188, 0.08140754699707031, 0.08562469482421875, 0.08984184265136719, 0.09405899047851562, 0.09827613830566406, 0.1024932861328125, 0.10671043395996094, 0.11092758178710938, 0.11514472961425781, 0.11936187744140625, 0.12357902526855469, 0.12779617309570312, 0.13201332092285156, 0.13623046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 13.0, 11.0, 12.0, 25.0, 26.0, 38.0, 42.0, 43.0, 53.0, 66.0, 75.0, 70.0, 77.0, 72.0, 68.0, 60.0, 47.0, 47.0, 36.0, 23.0, 21.0, 16.0, 16.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3511390686035156e-05, -4.224199801683426e-05, -4.097260534763336e-05, -3.9703212678432465e-05, -3.843382000923157e-05, -3.716442734003067e-05, -3.589503467082977e-05, -3.4625642001628876e-05, -3.335624933242798e-05, -3.208685666322708e-05, -3.0817463994026184e-05, -2.9548071324825287e-05, -2.827867865562439e-05, -2.7009285986423492e-05, -2.5739893317222595e-05, -2.4470500648021698e-05, -2.32011079788208e-05, -2.1931715309619904e-05, -2.0662322640419006e-05, -1.939292997121811e-05, -1.8123537302017212e-05, -1.6854144632816315e-05, -1.5584751963615417e-05, -1.431535929441452e-05, -1.3045966625213623e-05, -1.1776573956012726e-05, -1.0507181286811829e-05, -9.237788617610931e-06, -7.968395948410034e-06, -6.699003279209137e-06, -5.42961061000824e-06, -4.1602179408073425e-06, -2.8908252716064453e-06, -1.621432602405548e-06, -3.520399332046509e-07, 9.173527359962463e-07, 2.1867454051971436e-06, 3.4561380743980408e-06, 4.725530743598938e-06, 5.994923412799835e-06, 7.264316082000732e-06, 8.53370875120163e-06, 9.803101420402527e-06, 1.1072494089603424e-05, 1.2341886758804321e-05, 1.3611279428005219e-05, 1.4880672097206116e-05, 1.6150064766407013e-05, 1.741945743560791e-05, 1.8688850104808807e-05, 1.9958242774009705e-05, 2.1227635443210602e-05, 2.24970281124115e-05, 2.3766420781612396e-05, 2.5035813450813293e-05, 2.630520612001419e-05, 2.7574598789215088e-05, 2.8843991458415985e-05, 3.0113384127616882e-05, 3.138277679681778e-05, 3.265216946601868e-05, 3.3921562135219574e-05, 3.519095480442047e-05, 3.646034747362137e-05, 3.7729740142822266e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 17.0, 24.0, 30.0, 38.0, 63.0, 98.0, 162.0, 308.0, 675.0, 1413.0, 3324.0, 9105.0, 26822.0, 86008.0, 238657.0, 358824.0, 213041.0, 73382.0, 23179.0, 7844.0, 2860.0, 1323.0, 594.0, 293.0, 167.0, 102.0, 55.0, 44.0, 33.0, 13.0, 13.0, 6.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1790771484375, -0.17337989807128906, -0.16768264770507812, -0.1619853973388672, -0.15628814697265625, -0.1505908966064453, -0.14489364624023438, -0.13919639587402344, -0.1334991455078125, -0.12780189514160156, -0.12210464477539062, -0.11640739440917969, -0.11071014404296875, -0.10501289367675781, -0.09931564331054688, -0.09361839294433594, -0.087921142578125, -0.08222389221191406, -0.07652664184570312, -0.07082939147949219, -0.06513214111328125, -0.05943489074707031, -0.053737640380859375, -0.04804039001464844, -0.0423431396484375, -0.03664588928222656, -0.030948638916015625, -0.025251388549804688, -0.01955413818359375, -0.013856887817382812, -0.008159637451171875, -0.0024623870849609375, 0.00323486328125, 0.008932113647460938, 0.014629364013671875, 0.020326614379882812, 0.02602386474609375, 0.03172111511230469, 0.037418365478515625, 0.04311561584472656, 0.0488128662109375, 0.05451011657714844, 0.060207366943359375, 0.06590461730957031, 0.07160186767578125, 0.07729911804199219, 0.08299636840820312, 0.08869361877441406, 0.094390869140625, 0.10008811950683594, 0.10578536987304688, 0.11148262023925781, 0.11717987060546875, 0.12287712097167969, 0.12857437133789062, 0.13427162170410156, 0.1399688720703125, 0.14566612243652344, 0.15136337280273438, 0.1570606231689453, 0.16275787353515625, 0.1684551239013672, 0.17415237426757812, 0.17984962463378906, 0.185546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 4.0, 7.0, 11.0, 14.0, 20.0, 30.0, 43.0, 65.0, 65.0, 94.0, 95.0, 116.0, 102.0, 72.0, 73.0, 49.0, 39.0, 35.0, 28.0, 17.0, 7.0, 4.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.147125244140625, -0.13995361328125, -0.132781982421875, -0.1256103515625, -0.118438720703125, -0.11126708984375, -0.104095458984375, -0.096923828125, -0.089752197265625, -0.08258056640625, -0.075408935546875, -0.0682373046875, -0.061065673828125, -0.05389404296875, -0.046722412109375, -0.03955078125, -0.032379150390625, -0.02520751953125, -0.018035888671875, -0.0108642578125, -0.003692626953125, 0.00347900390625, 0.010650634765625, 0.017822265625, 0.024993896484375, 0.03216552734375, 0.039337158203125, 0.0465087890625, 0.053680419921875, 0.06085205078125, 0.068023681640625, 0.0751953125, 0.082366943359375, 0.08953857421875, 0.096710205078125, 0.1038818359375, 0.111053466796875, 0.11822509765625, 0.125396728515625, 0.132568359375, 0.139739990234375, 0.14691162109375, 0.154083251953125, 0.1612548828125, 0.168426513671875, 0.17559814453125, 0.182769775390625, 0.18994140625, 0.197113037109375, 0.20428466796875, 0.211456298828125, 0.2186279296875, 0.225799560546875, 0.23297119140625, 0.240142822265625, 0.247314453125, 0.254486083984375, 0.26165771484375, 0.268829345703125, 0.2760009765625, 0.283172607421875, 0.29034423828125, 0.297515869140625, 0.3046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 9.0, 24.0, 41.0, 81.0, 132.0, 162.0, 201.0, 149.0, 99.0, 41.0, 22.0, 13.0, 8.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5538761615753174, -2.4527816772460938, -2.35168719291687, -2.2505927085876465, -2.1494979858398438, -2.048403739929199, -1.9473090171813965, -1.8462145328521729, -1.7451200485229492, -1.6440255641937256, -1.542931079864502, -1.4418364763259888, -1.3407419919967651, -1.2396475076675415, -1.1385529041290283, -1.0374584197998047, -0.936363935470581, -0.8352694511413574, -0.734174907207489, -0.6330803632736206, -0.531985878944397, -0.43089139461517334, -0.32979685068130493, -0.22870230674743652, -0.1276078224182129, -0.02651330828666687, 0.07458120584487915, 0.17567571997642517, 0.2767702341079712, 0.3778647184371948, 0.47895926237106323, 0.5800538063049316, 0.6811485290527344, 0.782243013381958, 0.8833375573158264, 0.9844321012496948, 1.0855265855789185, 1.186621069908142, 1.2877156734466553, 1.388810157775879, 1.4899046421051025, 1.5909991264343262, 1.6920936107635498, 1.793188214302063, 1.8942826986312866, 1.9953771829605103, 2.0964717864990234, 2.197566270828247, 2.2986607551574707, 2.3997552394866943, 2.500849723815918, 2.6019442081451416, 2.7030386924743652, 2.804133415222168, 2.9052278995513916, 3.0063223838806152, 3.107416868209839, 3.2085113525390625, 3.309605836868286, 3.4107003211975098, 3.5117950439453125, 3.612889289855957, 3.7139840126037598, 3.8150784969329834, 3.916172981262207]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 8.0, 8.0, 5.0, 8.0, 20.0, 11.0, 17.0, 13.0, 21.0, 23.0, 32.0, 34.0, 36.0, 41.0, 25.0, 40.0, 37.0, 50.0, 41.0, 30.0, 45.0, 27.0, 40.0, 42.0, 44.0, 29.0, 31.0, 23.0, 27.0, 24.0, 27.0, 23.0, 24.0, 11.0, 16.0, 14.0, 11.0, 8.0, 7.0, 8.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.451817274093628, -1.4054875373840332, -1.359157681465149, -1.3128279447555542, -1.26649808883667, -1.2201683521270752, -1.1738386154174805, -1.1275087594985962, -1.081178903579712, -1.0348491668701172, -0.9885193109512329, -0.9421895742416382, -0.8958597183227539, -0.8495299816131592, -0.8032001852989197, -0.7568703889846802, -0.7105406522750854, -0.664210855960846, -0.6178810596466064, -0.5715513229370117, -0.5252214670181274, -0.4788917005062103, -0.4325619339942932, -0.3862321376800537, -0.3399023413658142, -0.2935725450515747, -0.2472427636384964, -0.2009129822254181, -0.1545831859111786, -0.10825338959693909, -0.06192362308502197, -0.01559382677078247, 0.03073596954345703, 0.07706575840711594, 0.12339554727077484, 0.16972532868385315, 0.21605512499809265, 0.26238492131233215, 0.30871468782424927, 0.35504448413848877, 0.40137428045272827, 0.4477040767669678, 0.4940338730812073, 0.5403636693954468, 0.5866934061050415, 0.6330232620239258, 0.6793529987335205, 0.72568279504776, 0.7720125913619995, 0.818342387676239, 0.8646721839904785, 0.9110019207000732, 0.9573317766189575, 1.0036615133285522, 1.0499913692474365, 1.0963211059570312, 1.142650842666626, 1.1889805793762207, 1.235310435295105, 1.2816401720046997, 1.327970027923584, 1.3742997646331787, 1.4206295013427734, 1.4669593572616577, 1.513289213180542]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 12.0, 9.0, 25.0, 36.0, 58.0, 84.0, 178.0, 266.0, 424.0, 680.0, 1236.0, 2322.0, 4716.0, 9583.0, 21164.0, 50126.0, 129925.0, 399204.0, 1253434.0, 1515429.0, 531111.0, 166073.0, 60398.0, 24973.0, 11049.0, 5450.0, 2716.0, 1460.0, 841.0, 465.0, 297.0, 198.0, 116.0, 71.0, 52.0, 37.0, 17.0, 14.0, 12.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2119140625, -0.20380020141601562, -0.19568634033203125, -0.18757247924804688, -0.1794586181640625, -0.17134475708007812, -0.16323089599609375, -0.15511703491210938, -0.147003173828125, -0.13888931274414062, -0.13077545166015625, -0.12266159057617188, -0.1145477294921875, -0.10643386840820312, -0.09832000732421875, -0.09020614624023438, -0.08209228515625, -0.07397842407226562, -0.06586456298828125, -0.057750701904296875, -0.0496368408203125, -0.041522979736328125, -0.03340911865234375, -0.025295257568359375, -0.017181396484375, -0.009067535400390625, -0.00095367431640625, 0.007160186767578125, 0.0152740478515625, 0.023387908935546875, 0.03150177001953125, 0.039615631103515625, 0.0477294921875, 0.055843353271484375, 0.06395721435546875, 0.07207107543945312, 0.0801849365234375, 0.08829879760742188, 0.09641265869140625, 0.10452651977539062, 0.112640380859375, 0.12075424194335938, 0.12886810302734375, 0.13698196411132812, 0.1450958251953125, 0.15320968627929688, 0.16132354736328125, 0.16943740844726562, 0.17755126953125, 0.18566513061523438, 0.19377899169921875, 0.20189285278320312, 0.2100067138671875, 0.21812057495117188, 0.22623443603515625, 0.23434829711914062, 0.242462158203125, 0.2505760192871094, 0.25868988037109375, 0.2668037414550781, 0.2749176025390625, 0.2830314636230469, 0.29114532470703125, 0.2992591857910156, 0.307373046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 10.0, 7.0, 10.0, 10.0, 19.0, 17.0, 21.0, 17.0, 27.0, 30.0, 30.0, 33.0, 37.0, 35.0, 42.0, 43.0, 35.0, 68.0, 45.0, 39.0, 43.0, 42.0, 39.0, 34.0, 31.0, 27.0, 27.0, 33.0, 29.0, 20.0, 20.0, 20.0, 10.0, 9.0, 6.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.1710681915283203, -0.16452407836914062, -0.15797996520996094, -0.15143585205078125, -0.14489173889160156, -0.13834762573242188, -0.1318035125732422, -0.1252593994140625, -0.11871528625488281, -0.11217117309570312, -0.10562705993652344, -0.09908294677734375, -0.09253883361816406, -0.08599472045898438, -0.07945060729980469, -0.072906494140625, -0.06636238098144531, -0.059818267822265625, -0.05327415466308594, -0.04673004150390625, -0.04018592834472656, -0.033641815185546875, -0.027097702026367188, -0.0205535888671875, -0.014009475708007812, -0.007465362548828125, -0.0009212493896484375, 0.00562286376953125, 0.012166976928710938, 0.018711090087890625, 0.025255203247070312, 0.03179931640625, 0.03834342956542969, 0.044887542724609375, 0.05143165588378906, 0.05797576904296875, 0.06451988220214844, 0.07106399536132812, 0.07760810852050781, 0.0841522216796875, 0.09069633483886719, 0.09724044799804688, 0.10378456115722656, 0.11032867431640625, 0.11687278747558594, 0.12341690063476562, 0.1299610137939453, 0.136505126953125, 0.1430492401123047, 0.14959335327148438, 0.15613746643066406, 0.16268157958984375, 0.16922569274902344, 0.17576980590820312, 0.1823139190673828, 0.1888580322265625, 0.1954021453857422, 0.20194625854492188, 0.20849037170410156, 0.21503448486328125, 0.22157859802246094, 0.22812271118164062, 0.2346668243408203, 0.2412109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 10.0, 10.0, 21.0, 31.0, 47.0, 75.0, 117.0, 234.0, 377.0, 733.0, 1586.0, 3614.0, 9974.0, 32123.0, 131044.0, 739088.0, 2640858.0, 499043.0, 97150.0, 24550.0, 7932.0, 2865.0, 1249.0, 669.0, 336.0, 175.0, 128.0, 80.0, 56.0, 34.0, 21.0, 15.0, 9.0, 9.0, 6.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5248146057128906, -0.5091018676757812, -0.4933891296386719, -0.4776763916015625, -0.4619636535644531, -0.44625091552734375, -0.4305381774902344, -0.414825439453125, -0.3991127014160156, -0.38339996337890625, -0.3676872253417969, -0.3519744873046875, -0.3362617492675781, -0.32054901123046875, -0.3048362731933594, -0.28912353515625, -0.2734107971191406, -0.25769805908203125, -0.24198532104492188, -0.2262725830078125, -0.21055984497070312, -0.19484710693359375, -0.17913436889648438, -0.163421630859375, -0.14770889282226562, -0.13199615478515625, -0.11628341674804688, -0.1005706787109375, -0.08485794067382812, -0.06914520263671875, -0.053432464599609375, -0.0377197265625, -0.022006988525390625, -0.00629425048828125, 0.009418487548828125, 0.0251312255859375, 0.040843963623046875, 0.05655670166015625, 0.07226943969726562, 0.087982177734375, 0.10369491577148438, 0.11940765380859375, 0.13512039184570312, 0.1508331298828125, 0.16654586791992188, 0.18225860595703125, 0.19797134399414062, 0.21368408203125, 0.22939682006835938, 0.24510955810546875, 0.2608222961425781, 0.2765350341796875, 0.2922477722167969, 0.30796051025390625, 0.3236732482910156, 0.339385986328125, 0.3550987243652344, 0.37081146240234375, 0.3865242004394531, 0.4022369384765625, 0.4179496765136719, 0.43366241455078125, 0.4493751525878906, 0.465087890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 6.0, 1.0, 7.0, 15.0, 8.0, 13.0, 24.0, 31.0, 39.0, 52.0, 70.0, 107.0, 146.0, 191.0, 277.0, 406.0, 599.0, 619.0, 438.0, 320.0, 208.0, 140.0, 98.0, 65.0, 58.0, 41.0, 19.0, 14.0, 15.0, 14.0, 8.0, 4.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3681640625, -0.3545684814453125, -0.340972900390625, -0.3273773193359375, -0.31378173828125, -0.3001861572265625, -0.286590576171875, -0.2729949951171875, -0.2593994140625, -0.2458038330078125, -0.232208251953125, -0.2186126708984375, -0.20501708984375, -0.1914215087890625, -0.177825927734375, -0.1642303466796875, -0.150634765625, -0.1370391845703125, -0.123443603515625, -0.1098480224609375, -0.09625244140625, -0.0826568603515625, -0.069061279296875, -0.0554656982421875, -0.0418701171875, -0.0282745361328125, -0.014678955078125, -0.0010833740234375, 0.01251220703125, 0.0261077880859375, 0.039703369140625, 0.0532989501953125, 0.06689453125, 0.0804901123046875, 0.094085693359375, 0.1076812744140625, 0.12127685546875, 0.1348724365234375, 0.148468017578125, 0.1620635986328125, 0.1756591796875, 0.1892547607421875, 0.202850341796875, 0.2164459228515625, 0.23004150390625, 0.2436370849609375, 0.257232666015625, 0.2708282470703125, 0.284423828125, 0.2980194091796875, 0.311614990234375, 0.3252105712890625, 0.33880615234375, 0.3524017333984375, 0.365997314453125, 0.3795928955078125, 0.3931884765625, 0.4067840576171875, 0.420379638671875, 0.4339752197265625, 0.44757080078125, 0.4611663818359375, 0.474761962890625, 0.4883575439453125, 0.501953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 12.0, 29.0, 40.0, 76.0, 123.0, 129.0, 143.0, 153.0, 119.0, 77.0, 45.0, 20.0, 14.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.283090114593506, -4.17725944519043, -4.0714287757873535, -3.9655983448028564, -3.8597679138183594, -3.753937244415283, -3.648106575012207, -3.54227614402771, -3.436445474624634, -3.3306148052215576, -3.2247843742370605, -3.1189537048339844, -3.0131232738494873, -2.907292604446411, -2.801462173461914, -2.695631504058838, -2.5898008346557617, -2.4839701652526855, -2.3781397342681885, -2.2723090648651123, -2.1664786338806152, -2.060647964477539, -1.9548174142837524, -1.8489868640899658, -1.7431564331054688, -1.6373258829116821, -1.5314953327178955, -1.4256646633148193, -1.3198341131210327, -1.214003562927246, -1.1081730127334595, -1.0023424625396729, -0.8965117931365967, -0.7906812429428101, -0.6848506331443787, -0.579020082950592, -0.47318950295448303, -0.367358922958374, -0.2615283727645874, -0.155697762966156, -0.049867212772369385, 0.05596335977315903, 0.16179393231868744, 0.26762449741363525, 0.37345507740974426, 0.47928565740585327, 0.5851162075996399, 0.6909468173980713, 0.7967773675918579, 0.9026079177856445, 1.0084384679794312, 1.1142690181732178, 1.220099687576294, 1.3259302377700806, 1.4317607879638672, 1.5375914573669434, 1.6434218883514404, 1.749252438545227, 1.8550829887390137, 1.9609136581420898, 2.066744089126587, 2.172574758529663, 2.27840518951416, 2.3842358589172363, 2.4900665283203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 5.0, 8.0, 7.0, 11.0, 14.0, 13.0, 30.0, 18.0, 28.0, 30.0, 21.0, 35.0, 26.0, 34.0, 34.0, 41.0, 28.0, 45.0, 45.0, 50.0, 38.0, 39.0, 39.0, 29.0, 35.0, 29.0, 30.0, 36.0, 25.0, 22.0, 30.0, 19.0, 16.0, 13.0, 13.0, 8.0, 6.0, 9.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.3442909717559814, -1.3058111667633057, -1.2673313617706299, -1.228851556777954, -1.1903717517852783, -1.1518919467926025, -1.1134121417999268, -1.074932336807251, -1.0364525318145752, -0.9979727268218994, -0.9594929218292236, -0.9210131168365479, -0.8825333118438721, -0.8440535068511963, -0.8055737018585205, -0.7670938968658447, -0.728614091873169, -0.6901342868804932, -0.6516544818878174, -0.6131746768951416, -0.5746948719024658, -0.53621506690979, -0.49773526191711426, -0.4592554569244385, -0.4207756519317627, -0.3822958469390869, -0.34381604194641113, -0.30533623695373535, -0.26685643196105957, -0.2283766269683838, -0.189896821975708, -0.15141701698303223, -0.11293721199035645, -0.07445740699768066, -0.03597760200500488, 0.0025022029876708984, 0.04098200798034668, 0.07946181297302246, 0.11794161796569824, 0.15642142295837402, 0.1949012279510498, 0.23338103294372559, 0.27186083793640137, 0.31034064292907715, 0.34882044792175293, 0.3873002529144287, 0.4257800579071045, 0.4642598628997803, 0.502739667892456, 0.5412194728851318, 0.5796992778778076, 0.6181790828704834, 0.6566588878631592, 0.695138692855835, 0.7336184978485107, 0.7720983028411865, 0.8105781078338623, 0.8490579128265381, 0.8875377178192139, 0.9260175228118896, 0.9644973278045654, 1.0029771327972412, 1.041456937789917, 1.0799367427825928, 1.1184165477752686]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 21.0, 30.0, 35.0, 56.0, 62.0, 107.0, 228.0, 350.0, 630.0, 1149.0, 2064.0, 3920.0, 7853.0, 17351.0, 42224.0, 111220.0, 253911.0, 313132.0, 175752.0, 68604.0, 26506.0, 11563.0, 5512.0, 2782.0, 1501.0, 777.0, 473.0, 266.0, 163.0, 90.0, 66.0, 43.0, 36.0, 19.0, 14.0, 13.0, 6.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.484130859375, -0.4711341857910156, -0.45813751220703125, -0.4451408386230469, -0.4321441650390625, -0.4191474914550781, -0.40615081787109375, -0.3931541442871094, -0.380157470703125, -0.3671607971191406, -0.35416412353515625, -0.3411674499511719, -0.3281707763671875, -0.3151741027832031, -0.30217742919921875, -0.2891807556152344, -0.27618408203125, -0.2631874084472656, -0.25019073486328125, -0.23719406127929688, -0.2241973876953125, -0.21120071411132812, -0.19820404052734375, -0.18520736694335938, -0.172210693359375, -0.15921401977539062, -0.14621734619140625, -0.13322067260742188, -0.1202239990234375, -0.10722732543945312, -0.09423065185546875, -0.08123397827148438, -0.0682373046875, -0.055240631103515625, -0.04224395751953125, -0.029247283935546875, -0.0162506103515625, -0.003253936767578125, 0.00974273681640625, 0.022739410400390625, 0.035736083984375, 0.048732757568359375, 0.06172943115234375, 0.07472610473632812, 0.0877227783203125, 0.10071945190429688, 0.11371612548828125, 0.12671279907226562, 0.13970947265625, 0.15270614624023438, 0.16570281982421875, 0.17869949340820312, 0.1916961669921875, 0.20469284057617188, 0.21768951416015625, 0.23068618774414062, 0.243682861328125, 0.2566795349121094, 0.26967620849609375, 0.2826728820800781, 0.2956695556640625, 0.3086662292480469, 0.32166290283203125, 0.3346595764160156, 0.34765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 11.0, 15.0, 16.0, 16.0, 15.0, 20.0, 23.0, 28.0, 28.0, 38.0, 36.0, 35.0, 40.0, 36.0, 50.0, 39.0, 41.0, 51.0, 45.0, 47.0, 49.0, 39.0, 36.0, 32.0, 30.0, 32.0, 29.0, 20.0, 23.0, 11.0, 11.0, 19.0, 10.0, 8.0, 4.0, 8.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2005615234375, -0.19386672973632812, -0.18717193603515625, -0.18047714233398438, -0.1737823486328125, -0.16708755493164062, -0.16039276123046875, -0.15369796752929688, -0.147003173828125, -0.14030838012695312, -0.13361358642578125, -0.12691879272460938, -0.1202239990234375, -0.11352920532226562, -0.10683441162109375, -0.10013961791992188, -0.09344482421875, -0.08675003051757812, -0.08005523681640625, -0.07336044311523438, -0.0666656494140625, -0.059970855712890625, -0.05327606201171875, -0.046581268310546875, -0.039886474609375, -0.033191680908203125, -0.02649688720703125, -0.019802093505859375, -0.0131072998046875, -0.006412506103515625, 0.00028228759765625, 0.006977081298828125, 0.013671875, 0.020366668701171875, 0.02706146240234375, 0.033756256103515625, 0.0404510498046875, 0.047145843505859375, 0.05384063720703125, 0.060535430908203125, 0.067230224609375, 0.07392501831054688, 0.08061981201171875, 0.08731460571289062, 0.0940093994140625, 0.10070419311523438, 0.10739898681640625, 0.11409378051757812, 0.12078857421875, 0.12748336791992188, 0.13417816162109375, 0.14087295532226562, 0.1475677490234375, 0.15426254272460938, 0.16095733642578125, 0.16765213012695312, 0.174346923828125, 0.18104171752929688, 0.18773651123046875, 0.19443130493164062, 0.2011260986328125, 0.20782089233398438, 0.21451568603515625, 0.22121047973632812, 0.2279052734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 8.0, 8.0, 8.0, 15.0, 24.0, 42.0, 58.0, 78.0, 139.0, 237.0, 425.0, 834.0, 1514.0, 3121.0, 6021.0, 12834.0, 29181.0, 72781.0, 182088.0, 322079.0, 241483.0, 102290.0, 40069.0, 16912.0, 8112.0, 3911.0, 1931.0, 1009.0, 571.0, 306.0, 173.0, 94.0, 64.0, 37.0, 26.0, 18.0, 13.0, 5.0, 11.0, 7.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3798828125, -0.3670845031738281, -0.35428619384765625, -0.3414878845214844, -0.3286895751953125, -0.3158912658691406, -0.30309295654296875, -0.2902946472167969, -0.277496337890625, -0.2646980285644531, -0.25189971923828125, -0.23910140991210938, -0.2263031005859375, -0.21350479125976562, -0.20070648193359375, -0.18790817260742188, -0.17510986328125, -0.16231155395507812, -0.14951324462890625, -0.13671493530273438, -0.1239166259765625, -0.11111831665039062, -0.09832000732421875, -0.08552169799804688, -0.072723388671875, -0.059925079345703125, -0.04712677001953125, -0.034328460693359375, -0.0215301513671875, -0.008731842041015625, 0.00406646728515625, 0.016864776611328125, 0.0296630859375, 0.042461395263671875, 0.05525970458984375, 0.06805801391601562, 0.0808563232421875, 0.09365463256835938, 0.10645294189453125, 0.11925125122070312, 0.132049560546875, 0.14484786987304688, 0.15764617919921875, 0.17044448852539062, 0.1832427978515625, 0.19604110717773438, 0.20883941650390625, 0.22163772583007812, 0.23443603515625, 0.24723434448242188, 0.26003265380859375, 0.2728309631347656, 0.2856292724609375, 0.2984275817871094, 0.31122589111328125, 0.3240242004394531, 0.336822509765625, 0.3496208190917969, 0.36241912841796875, 0.3752174377441406, 0.3880157470703125, 0.4008140563964844, 0.41361236572265625, 0.4264106750488281, 0.439208984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 2.0, 7.0, 11.0, 6.0, 13.0, 13.0, 13.0, 17.0, 17.0, 28.0, 30.0, 27.0, 41.0, 41.0, 45.0, 35.0, 53.0, 48.0, 55.0, 49.0, 44.0, 52.0, 40.0, 44.0, 36.0, 33.0, 29.0, 27.0, 21.0, 31.0, 19.0, 20.0, 11.0, 12.0, 8.0, 9.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.677734375, -0.6579818725585938, -0.6382293701171875, -0.6184768676757812, -0.598724365234375, -0.5789718627929688, -0.5592193603515625, -0.5394668579101562, -0.51971435546875, -0.49996185302734375, -0.4802093505859375, -0.46045684814453125, -0.440704345703125, -0.42095184326171875, -0.4011993408203125, -0.38144683837890625, -0.3616943359375, -0.34194183349609375, -0.3221893310546875, -0.30243682861328125, -0.282684326171875, -0.26293182373046875, -0.2431793212890625, -0.22342681884765625, -0.20367431640625, -0.18392181396484375, -0.1641693115234375, -0.14441680908203125, -0.124664306640625, -0.10491180419921875, -0.0851593017578125, -0.06540679931640625, -0.045654296875, -0.02590179443359375, -0.0061492919921875, 0.01360321044921875, 0.033355712890625, 0.05310821533203125, 0.0728607177734375, 0.09261322021484375, 0.11236572265625, 0.13211822509765625, 0.1518707275390625, 0.17162322998046875, 0.191375732421875, 0.21112823486328125, 0.2308807373046875, 0.25063323974609375, 0.2703857421875, 0.29013824462890625, 0.3098907470703125, 0.32964324951171875, 0.349395751953125, 0.36914825439453125, 0.3889007568359375, 0.40865325927734375, 0.42840576171875, 0.44815826416015625, 0.4679107666015625, 0.48766326904296875, 0.507415771484375, 0.5271682739257812, 0.5469207763671875, 0.5666732788085938, 0.58642578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 5.0, 6.0, 12.0, 25.0, 28.0, 49.0, 59.0, 113.0, 186.0, 294.0, 515.0, 929.0, 1774.0, 3399.0, 6590.0, 13699.0, 29905.0, 70039.0, 164068.0, 290699.0, 250128.0, 121722.0, 50820.0, 22160.0, 10473.0, 5167.0, 2568.0, 1349.0, 730.0, 402.0, 255.0, 151.0, 73.0, 59.0, 37.0, 18.0, 11.0, 9.0, 7.0, 5.0, 7.0, 3.0, 7.0, 2.0], "bins": [-0.1646728515625, -0.1605367660522461, -0.1564006805419922, -0.15226459503173828, -0.14812850952148438, -0.14399242401123047, -0.13985633850097656, -0.13572025299072266, -0.13158416748046875, -0.12744808197021484, -0.12331199645996094, -0.11917591094970703, -0.11503982543945312, -0.11090373992919922, -0.10676765441894531, -0.1026315689086914, -0.0984954833984375, -0.0943593978881836, -0.09022331237792969, -0.08608722686767578, -0.08195114135742188, -0.07781505584716797, -0.07367897033691406, -0.06954288482666016, -0.06540679931640625, -0.061270713806152344, -0.05713462829589844, -0.05299854278564453, -0.048862457275390625, -0.04472637176513672, -0.04059028625488281, -0.036454200744628906, -0.032318115234375, -0.028182029724121094, -0.024045944213867188, -0.01990985870361328, -0.015773773193359375, -0.011637687683105469, -0.0075016021728515625, -0.0033655166625976562, 0.00077056884765625, 0.004906654357910156, 0.009042739868164062, 0.013178825378417969, 0.017314910888671875, 0.02145099639892578, 0.025587081909179688, 0.029723167419433594, 0.0338592529296875, 0.037995338439941406, 0.04213142395019531, 0.04626750946044922, 0.050403594970703125, 0.05453968048095703, 0.05867576599121094, 0.06281185150146484, 0.06694793701171875, 0.07108402252197266, 0.07522010803222656, 0.07935619354248047, 0.08349227905273438, 0.08762836456298828, 0.09176445007324219, 0.0959005355834961, 0.10003662109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 9.0, 11.0, 13.0, 23.0, 27.0, 42.0, 61.0, 107.0, 120.0, 138.0, 137.0, 90.0, 62.0, 34.0, 33.0, 23.0, 15.0, 17.0, 12.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.751848220825195e-05, -5.5339187383651733e-05, -5.3159892559051514e-05, -5.0980597734451294e-05, -4.8801302909851074e-05, -4.6622008085250854e-05, -4.4442713260650635e-05, -4.2263418436050415e-05, -4.0084123611450195e-05, -3.7904828786849976e-05, -3.5725533962249756e-05, -3.3546239137649536e-05, -3.1366944313049316e-05, -2.9187649488449097e-05, -2.7008354663848877e-05, -2.4829059839248657e-05, -2.2649765014648438e-05, -2.0470470190048218e-05, -1.8291175365447998e-05, -1.611188054084778e-05, -1.3932585716247559e-05, -1.1753290891647339e-05, -9.573996067047119e-06, -7.394701242446899e-06, -5.21540641784668e-06, -3.03611159324646e-06, -8.568167686462402e-07, 1.3224780559539795e-06, 3.5017728805541992e-06, 5.681067705154419e-06, 7.860362529754639e-06, 1.0039657354354858e-05, 1.2218952178955078e-05, 1.4398247003555298e-05, 1.6577541828155518e-05, 1.8756836652755737e-05, 2.0936131477355957e-05, 2.3115426301956177e-05, 2.5294721126556396e-05, 2.7474015951156616e-05, 2.9653310775756836e-05, 3.1832605600357056e-05, 3.4011900424957275e-05, 3.6191195249557495e-05, 3.8370490074157715e-05, 4.0549784898757935e-05, 4.2729079723358154e-05, 4.4908374547958374e-05, 4.7087669372558594e-05, 4.9266964197158813e-05, 5.144625902175903e-05, 5.362555384635925e-05, 5.580484867095947e-05, 5.798414349555969e-05, 6.016343832015991e-05, 6.234273314476013e-05, 6.452202796936035e-05, 6.670132279396057e-05, 6.888061761856079e-05, 7.105991244316101e-05, 7.323920726776123e-05, 7.541850209236145e-05, 7.759779691696167e-05, 7.977709174156189e-05, 8.195638656616211e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 5.0, 17.0, 22.0, 29.0, 39.0, 52.0, 69.0, 127.0, 171.0, 263.0, 410.0, 740.0, 1429.0, 2812.0, 5442.0, 11232.0, 24141.0, 54925.0, 118129.0, 214855.0, 258346.0, 183274.0, 93112.0, 41746.0, 19084.0, 8754.0, 4257.0, 2136.0, 1147.0, 654.0, 416.0, 222.0, 155.0, 100.0, 55.0, 49.0, 39.0, 21.0, 20.0, 11.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1158447265625, -0.11202621459960938, -0.10820770263671875, -0.10438919067382812, -0.1005706787109375, -0.09675216674804688, -0.09293365478515625, -0.08911514282226562, -0.085296630859375, -0.08147811889648438, -0.07765960693359375, -0.07384109497070312, -0.0700225830078125, -0.06620407104492188, -0.06238555908203125, -0.058567047119140625, -0.05474853515625, -0.050930023193359375, -0.04711151123046875, -0.043292999267578125, -0.0394744873046875, -0.035655975341796875, -0.03183746337890625, -0.028018951416015625, -0.024200439453125, -0.020381927490234375, -0.01656341552734375, -0.012744903564453125, -0.0089263916015625, -0.005107879638671875, -0.00128936767578125, 0.002529144287109375, 0.00634765625, 0.010166168212890625, 0.01398468017578125, 0.017803192138671875, 0.0216217041015625, 0.025440216064453125, 0.02925872802734375, 0.033077239990234375, 0.036895751953125, 0.040714263916015625, 0.04453277587890625, 0.048351287841796875, 0.0521697998046875, 0.055988311767578125, 0.05980682373046875, 0.06362533569335938, 0.06744384765625, 0.07126235961914062, 0.07508087158203125, 0.07889938354492188, 0.0827178955078125, 0.08653640747070312, 0.09035491943359375, 0.09417343139648438, 0.097991943359375, 0.10181045532226562, 0.10562896728515625, 0.10944747924804688, 0.1132659912109375, 0.11708450317382812, 0.12090301513671875, 0.12472152709960938, 0.1285400390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 8.0, 4.0, 7.0, 15.0, 10.0, 16.0, 27.0, 35.0, 34.0, 52.0, 55.0, 75.0, 66.0, 76.0, 87.0, 62.0, 63.0, 61.0, 52.0, 41.0, 36.0, 26.0, 20.0, 14.0, 16.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.185791015625, -0.1803741455078125, -0.174957275390625, -0.1695404052734375, -0.16412353515625, -0.1587066650390625, -0.153289794921875, -0.1478729248046875, -0.1424560546875, -0.1370391845703125, -0.131622314453125, -0.1262054443359375, -0.12078857421875, -0.1153717041015625, -0.109954833984375, -0.1045379638671875, -0.09912109375, -0.0937042236328125, -0.088287353515625, -0.0828704833984375, -0.07745361328125, -0.0720367431640625, -0.066619873046875, -0.0612030029296875, -0.0557861328125, -0.0503692626953125, -0.044952392578125, -0.0395355224609375, -0.03411865234375, -0.0287017822265625, -0.023284912109375, -0.0178680419921875, -0.012451171875, -0.0070343017578125, -0.001617431640625, 0.0037994384765625, 0.00921630859375, 0.0146331787109375, 0.020050048828125, 0.0254669189453125, 0.0308837890625, 0.0363006591796875, 0.041717529296875, 0.0471343994140625, 0.05255126953125, 0.0579681396484375, 0.063385009765625, 0.0688018798828125, 0.07421875, 0.0796356201171875, 0.085052490234375, 0.0904693603515625, 0.09588623046875, 0.1013031005859375, 0.106719970703125, 0.1121368408203125, 0.1175537109375, 0.1229705810546875, 0.128387451171875, 0.1338043212890625, 0.13922119140625, 0.1446380615234375, 0.150054931640625, 0.1554718017578125, 0.160888671875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 11.0, 15.0, 55.0, 139.0, 252.0, 274.0, 150.0, 66.0, 22.0, 11.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9352967739105225, -2.771942615509033, -2.608588695526123, -2.445234537124634, -2.2818803787231445, -2.1185264587402344, -1.9551723003387451, -1.7918182611465454, -1.6284642219543457, -1.465110182762146, -1.3017561435699463, -1.138401985168457, -0.9750479459762573, -0.8116939067840576, -0.6483398079872131, -0.48498570919036865, -0.32163166999816895, -0.15827760100364685, 0.005076467990875244, 0.16843053698539734, 0.33178460597991943, 0.49513864517211914, 0.6584927439689636, 0.8218468427658081, 0.9852008819580078, 1.1485549211502075, 1.3119089603424072, 1.4752631187438965, 1.6386171579360962, 1.801971197128296, 1.9653253555297852, 2.1286792755126953, 2.2920331954956055, 2.4553873538970947, 2.618741273880005, 2.782095432281494, 2.9454493522644043, 3.1088035106658936, 3.272157669067383, 3.435511589050293, 3.5988657474517822, 3.7622199058532715, 3.9255738258361816, 4.088927745819092, 4.25228214263916, 4.41563606262207, 4.5789899826049805, 4.742344379425049, 4.905698299407959, 5.069052219390869, 5.2324066162109375, 5.395760536193848, 5.559114456176758, 5.722468376159668, 5.885822772979736, 6.0491766929626465, 6.212531089782715, 6.375885009765625, 6.539239406585693, 6.7025933265686035, 6.865947246551514, 7.029301643371582, 7.192655563354492, 7.356009483337402, 7.5193634033203125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 4.0, 6.0, 4.0, 7.0, 11.0, 18.0, 14.0, 15.0, 20.0, 21.0, 24.0, 24.0, 22.0, 40.0, 26.0, 32.0, 26.0, 40.0, 27.0, 24.0, 30.0, 46.0, 42.0, 43.0, 38.0, 36.0, 36.0, 34.0, 30.0, 25.0, 31.0, 29.0, 13.0, 30.0, 19.0, 16.0, 10.0, 12.0, 7.0, 10.0, 15.0, 9.0, 8.0, 11.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4249085187911987, -1.3807636499404907, -1.3366187810897827, -1.2924739122390747, -1.2483291625976562, -1.2041842937469482, -1.1600394248962402, -1.1158945560455322, -1.0717496871948242, -1.0276048183441162, -0.9834599494934082, -0.939315140247345, -0.895170271396637, -0.851025402545929, -0.8068805932998657, -0.7627357244491577, -0.7185908555984497, -0.6744459867477417, -0.6303011178970337, -0.5861563086509705, -0.5420114398002625, -0.49786657094955444, -0.4537217319011688, -0.4095768928527832, -0.3654320240020752, -0.3212871551513672, -0.27714231610298157, -0.23299746215343475, -0.18885260820388794, -0.14470775425434113, -0.10056290030479431, -0.05641806125640869, -0.012273311614990234, 0.03187154233455658, 0.0760163962841034, 0.12016125023365021, 0.16430610418319702, 0.20845095813274384, 0.25259581208229065, 0.29674065113067627, 0.3408855199813843, 0.3850303888320923, 0.4291752278804779, 0.4733200669288635, 0.5174649357795715, 0.5616098046302795, 0.6057546138763428, 0.6498994827270508, 0.6940443515777588, 0.7381892204284668, 0.7823340892791748, 0.826478898525238, 0.870623767375946, 0.914768636226654, 0.9589134454727173, 1.0030583143234253, 1.0472031831741333, 1.0913480520248413, 1.1354929208755493, 1.1796377897262573, 1.2237825393676758, 1.2679274082183838, 1.3120722770690918, 1.3562171459197998, 1.4003620147705078]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 16.0, 21.0, 35.0, 45.0, 83.0, 124.0, 192.0, 244.0, 421.0, 704.0, 1084.0, 1935.0, 3224.0, 5390.0, 9608.0, 17428.0, 33312.0, 66206.0, 136676.0, 302434.0, 662435.0, 1139512.0, 942053.0, 466947.0, 208195.0, 95385.0, 46223.0, 23999.0, 12694.0, 7178.0, 4034.0, 2420.0, 1551.0, 933.0, 544.0, 312.0, 216.0, 129.0, 92.0, 79.0, 44.0, 35.0, 27.0, 22.0, 7.0, 4.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.17626953125, -0.17053985595703125, -0.1648101806640625, -0.15908050537109375, -0.153350830078125, -0.14762115478515625, -0.1418914794921875, -0.13616180419921875, -0.13043212890625, -0.12470245361328125, -0.1189727783203125, -0.11324310302734375, -0.107513427734375, -0.10178375244140625, -0.0960540771484375, -0.09032440185546875, -0.0845947265625, -0.07886505126953125, -0.0731353759765625, -0.06740570068359375, -0.061676025390625, -0.05594635009765625, -0.0502166748046875, -0.04448699951171875, -0.03875732421875, -0.03302764892578125, -0.0272979736328125, -0.02156829833984375, -0.015838623046875, -0.01010894775390625, -0.0043792724609375, 0.00135040283203125, 0.007080078125, 0.01280975341796875, 0.0185394287109375, 0.02426910400390625, 0.029998779296875, 0.03572845458984375, 0.0414581298828125, 0.04718780517578125, 0.05291748046875, 0.05864715576171875, 0.0643768310546875, 0.07010650634765625, 0.075836181640625, 0.08156585693359375, 0.0872955322265625, 0.09302520751953125, 0.0987548828125, 0.10448455810546875, 0.1102142333984375, 0.11594390869140625, 0.121673583984375, 0.12740325927734375, 0.1331329345703125, 0.13886260986328125, 0.14459228515625, 0.15032196044921875, 0.1560516357421875, 0.16178131103515625, 0.167510986328125, 0.17324066162109375, 0.1789703369140625, 0.18470001220703125, 0.1904296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 10.0, 12.0, 7.0, 15.0, 18.0, 15.0, 15.0, 22.0, 22.0, 36.0, 31.0, 33.0, 41.0, 41.0, 50.0, 42.0, 53.0, 53.0, 60.0, 35.0, 55.0, 40.0, 46.0, 44.0, 31.0, 28.0, 29.0, 26.0, 20.0, 20.0, 21.0, 10.0, 4.0, 4.0, 1.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23779296875, -0.2305450439453125, -0.223297119140625, -0.2160491943359375, -0.20880126953125, -0.2015533447265625, -0.194305419921875, -0.1870574951171875, -0.1798095703125, -0.1725616455078125, -0.165313720703125, -0.1580657958984375, -0.15081787109375, -0.1435699462890625, -0.136322021484375, -0.1290740966796875, -0.121826171875, -0.1145782470703125, -0.107330322265625, -0.1000823974609375, -0.09283447265625, -0.0855865478515625, -0.078338623046875, -0.0710906982421875, -0.0638427734375, -0.0565948486328125, -0.049346923828125, -0.0420989990234375, -0.03485107421875, -0.0276031494140625, -0.020355224609375, -0.0131072998046875, -0.005859375, 0.0013885498046875, 0.008636474609375, 0.0158843994140625, 0.02313232421875, 0.0303802490234375, 0.037628173828125, 0.0448760986328125, 0.0521240234375, 0.0593719482421875, 0.066619873046875, 0.0738677978515625, 0.08111572265625, 0.0883636474609375, 0.095611572265625, 0.1028594970703125, 0.110107421875, 0.1173553466796875, 0.124603271484375, 0.1318511962890625, 0.13909912109375, 0.1463470458984375, 0.153594970703125, 0.1608428955078125, 0.1680908203125, 0.1753387451171875, 0.182586669921875, 0.1898345947265625, 0.19708251953125, 0.2043304443359375, 0.211578369140625, 0.2188262939453125, 0.22607421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 7.0, 15.0, 11.0, 34.0, 35.0, 54.0, 123.0, 165.0, 304.0, 605.0, 1310.0, 3393.0, 10106.0, 37172.0, 174952.0, 1193251.0, 2330249.0, 351298.0, 66125.0, 16380.0, 5031.0, 1942.0, 808.0, 395.0, 187.0, 121.0, 83.0, 33.0, 28.0, 19.0, 12.0, 12.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3784599304199219, -0.36214447021484375, -0.3458290100097656, -0.3295135498046875, -0.3131980895996094, -0.29688262939453125, -0.2805671691894531, -0.264251708984375, -0.24793624877929688, -0.23162078857421875, -0.21530532836914062, -0.1989898681640625, -0.18267440795898438, -0.16635894775390625, -0.15004348754882812, -0.13372802734375, -0.11741256713867188, -0.10109710693359375, -0.08478164672851562, -0.0684661865234375, -0.052150726318359375, -0.03583526611328125, -0.019519805908203125, -0.003204345703125, 0.013111114501953125, 0.02942657470703125, 0.045742034912109375, 0.0620574951171875, 0.07837295532226562, 0.09468841552734375, 0.11100387573242188, 0.1273193359375, 0.14363479614257812, 0.15995025634765625, 0.17626571655273438, 0.1925811767578125, 0.20889663696289062, 0.22521209716796875, 0.24152755737304688, 0.257843017578125, 0.2741584777832031, 0.29047393798828125, 0.3067893981933594, 0.3231048583984375, 0.3394203186035156, 0.35573577880859375, 0.3720512390136719, 0.38836669921875, 0.4046821594238281, 0.42099761962890625, 0.4373130798339844, 0.4536285400390625, 0.4699440002441406, 0.48625946044921875, 0.5025749206542969, 0.518890380859375, 0.5352058410644531, 0.5515213012695312, 0.5678367614746094, 0.5841522216796875, 0.6004676818847656, 0.6167831420898438, 0.6330986022949219, 0.6494140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 5.0, 6.0, 10.0, 13.0, 15.0, 16.0, 26.0, 36.0, 55.0, 68.0, 99.0, 143.0, 174.0, 228.0, 363.0, 431.0, 548.0, 424.0, 391.0, 262.0, 189.0, 146.0, 104.0, 75.0, 64.0, 48.0, 30.0, 18.0, 13.0, 15.0, 14.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3437004089355469, -0.33119964599609375, -0.3186988830566406, -0.3061981201171875, -0.2936973571777344, -0.28119659423828125, -0.2686958312988281, -0.256195068359375, -0.24369430541992188, -0.23119354248046875, -0.21869277954101562, -0.2061920166015625, -0.19369125366210938, -0.18119049072265625, -0.16868972778320312, -0.15618896484375, -0.14368820190429688, -0.13118743896484375, -0.11868667602539062, -0.1061859130859375, -0.09368515014648438, -0.08118438720703125, -0.06868362426757812, -0.056182861328125, -0.043682098388671875, -0.03118133544921875, -0.018680572509765625, -0.0061798095703125, 0.006320953369140625, 0.01882171630859375, 0.031322479248046875, 0.0438232421875, 0.056324005126953125, 0.06882476806640625, 0.08132553100585938, 0.0938262939453125, 0.10632705688476562, 0.11882781982421875, 0.13132858276367188, 0.143829345703125, 0.15633010864257812, 0.16883087158203125, 0.18133163452148438, 0.1938323974609375, 0.20633316040039062, 0.21883392333984375, 0.23133468627929688, 0.24383544921875, 0.2563362121582031, 0.26883697509765625, 0.2813377380371094, 0.2938385009765625, 0.3063392639160156, 0.31884002685546875, 0.3313407897949219, 0.343841552734375, 0.3563423156738281, 0.36884307861328125, 0.3813438415527344, 0.3938446044921875, 0.4063453674316406, 0.41884613037109375, 0.4313468933105469, 0.44384765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 9.0, 15.0, 25.0, 53.0, 68.0, 86.0, 115.0, 143.0, 139.0, 109.0, 89.0, 50.0, 32.0, 21.0, 17.0, 6.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.999173164367676, -2.9131922721862793, -2.827211380004883, -2.7412302494049072, -2.6552493572235107, -2.5692684650421143, -2.4832873344421387, -2.397306442260742, -2.3113255500793457, -2.225344657897949, -2.1393637657165527, -2.053382635116577, -1.9674017429351807, -1.8814208507537842, -1.7954398393630981, -1.709458827972412, -1.6234779357910156, -1.5374970436096191, -1.451516032218933, -1.365535020828247, -1.2795541286468506, -1.193573236465454, -1.107592225074768, -1.021611213684082, -0.9356303215026855, -0.8496493697166443, -0.763668417930603, -0.6776874661445618, -0.5917065143585205, -0.5057255625724792, -0.419744610786438, -0.33376365900039673, -0.24778270721435547, -0.1618017554283142, -0.07582080364227295, 0.01016014814376831, 0.09614109992980957, 0.18212205171585083, 0.2681030035018921, 0.35408395528793335, 0.4400649070739746, 0.5260458588600159, 0.6120268106460571, 0.6980077624320984, 0.7839887142181396, 0.8699696660041809, 0.9559506177902222, 1.0419316291809082, 1.1279125213623047, 1.2138934135437012, 1.2998744249343872, 1.3858554363250732, 1.4718363285064697, 1.5578172206878662, 1.6437982320785522, 1.7297792434692383, 1.8157601356506348, 1.9017410278320312, 1.9877220392227173, 2.0737030506134033, 2.1596839427948, 2.2456648349761963, 2.331645965576172, 2.4176268577575684, 2.503607749938965]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 7.0, 6.0, 6.0, 11.0, 9.0, 15.0, 18.0, 9.0, 12.0, 20.0, 20.0, 26.0, 35.0, 21.0, 28.0, 31.0, 47.0, 46.0, 38.0, 41.0, 44.0, 45.0, 46.0, 60.0, 43.0, 49.0, 29.0, 25.0, 39.0, 30.0, 26.0, 26.0, 14.0, 18.0, 18.0, 9.0, 9.0, 5.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7047348022460938, -1.6578364372253418, -1.6109380722045898, -1.564039707183838, -1.5171414613723755, -1.4702430963516235, -1.4233447313308716, -1.3764463663101196, -1.3295480012893677, -1.2826496362686157, -1.2357512712478638, -1.1888530254364014, -1.1419546604156494, -1.0950562953948975, -1.0481579303741455, -1.0012595653533936, -0.9543612599372864, -0.9074628949165344, -0.8605645895004272, -0.8136662244796753, -0.7667678594589233, -0.7198694944381714, -0.6729711890220642, -0.6260728240013123, -0.5791745185852051, -0.5322761535644531, -0.48537781834602356, -0.438479483127594, -0.39158111810684204, -0.3446827828884125, -0.2977844476699829, -0.25088608264923096, -0.203987717628479, -0.15708936750888824, -0.11019102483987808, -0.06329268217086792, -0.01639433205127716, 0.0305040180683136, 0.07740235328674316, 0.12430071830749512, 0.17119905352592468, 0.21809740364551544, 0.2649957537651062, 0.31189408898353577, 0.35879242420196533, 0.4056907892227173, 0.45258912444114685, 0.4994874894618988, 0.5463858246803284, 0.5932841897010803, 0.6401824951171875, 0.6870808601379395, 0.7339792251586914, 0.7808775901794434, 0.8277758955955505, 0.8746742606163025, 0.9215725660324097, 0.9684709310531616, 1.0153692960739136, 1.062267541885376, 1.109165906906128, 1.1560642719268799, 1.2029626369476318, 1.2498610019683838, 1.2967593669891357]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 9.0, 14.0, 33.0, 45.0, 84.0, 139.0, 241.0, 447.0, 893.0, 1679.0, 3324.0, 6948.0, 14865.0, 35873.0, 96663.0, 235101.0, 321310.0, 199470.0, 77992.0, 29021.0, 12513.0, 5767.0, 2949.0, 1504.0, 777.0, 374.0, 227.0, 100.0, 70.0, 45.0, 18.0, 15.0, 16.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444091796875, -0.4289817810058594, -0.41387176513671875, -0.3987617492675781, -0.3836517333984375, -0.3685417175292969, -0.35343170166015625, -0.3383216857910156, -0.323211669921875, -0.3081016540527344, -0.29299163818359375, -0.2778816223144531, -0.2627716064453125, -0.24766159057617188, -0.23255157470703125, -0.21744155883789062, -0.20233154296875, -0.18722152709960938, -0.17211151123046875, -0.15700149536132812, -0.1418914794921875, -0.12678146362304688, -0.11167144775390625, -0.09656143188476562, -0.081451416015625, -0.06634140014648438, -0.05123138427734375, -0.036121368408203125, -0.0210113525390625, -0.005901336669921875, 0.00920867919921875, 0.024318695068359375, 0.0394287109375, 0.054538726806640625, 0.06964874267578125, 0.08475875854492188, 0.0998687744140625, 0.11497879028320312, 0.13008880615234375, 0.14519882202148438, 0.160308837890625, 0.17541885375976562, 0.19052886962890625, 0.20563888549804688, 0.2207489013671875, 0.23585891723632812, 0.25096893310546875, 0.2660789489746094, 0.28118896484375, 0.2962989807128906, 0.31140899658203125, 0.3265190124511719, 0.3416290283203125, 0.3567390441894531, 0.37184906005859375, 0.3869590759277344, 0.402069091796875, 0.4171791076660156, 0.43228912353515625, 0.4473991394042969, 0.4625091552734375, 0.4776191711425781, 0.49272918701171875, 0.5078392028808594, 0.52294921875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 3.0, 3.0, 8.0, 13.0, 12.0, 10.0, 10.0, 17.0, 14.0, 12.0, 24.0, 31.0, 30.0, 29.0, 31.0, 37.0, 33.0, 41.0, 36.0, 45.0, 43.0, 48.0, 41.0, 37.0, 54.0, 33.0, 37.0, 34.0, 28.0, 22.0, 24.0, 27.0, 18.0, 20.0, 16.0, 14.0, 8.0, 10.0, 11.0, 10.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.1758136749267578, -0.16937637329101562, -0.16293907165527344, -0.15650177001953125, -0.15006446838378906, -0.14362716674804688, -0.1371898651123047, -0.1307525634765625, -0.12431526184082031, -0.11787796020507812, -0.11144065856933594, -0.10500335693359375, -0.09856605529785156, -0.09212875366210938, -0.08569145202636719, -0.079254150390625, -0.07281684875488281, -0.06637954711914062, -0.05994224548339844, -0.05350494384765625, -0.04706764221191406, -0.040630340576171875, -0.03419303894042969, -0.0277557373046875, -0.021318435668945312, -0.014881134033203125, -0.008443832397460938, -0.00200653076171875, 0.0044307708740234375, 0.010868072509765625, 0.017305374145507812, 0.02374267578125, 0.030179977416992188, 0.036617279052734375, 0.04305458068847656, 0.04949188232421875, 0.05592918395996094, 0.062366485595703125, 0.06880378723144531, 0.0752410888671875, 0.08167839050292969, 0.08811569213867188, 0.09455299377441406, 0.10099029541015625, 0.10742759704589844, 0.11386489868164062, 0.12030220031738281, 0.126739501953125, 0.1331768035888672, 0.13961410522460938, 0.14605140686035156, 0.15248870849609375, 0.15892601013183594, 0.16536331176757812, 0.1718006134033203, 0.1782379150390625, 0.1846752166748047, 0.19111251831054688, 0.19754981994628906, 0.20398712158203125, 0.21042442321777344, 0.21686172485351562, 0.2232990264892578, 0.229736328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 8.0, 15.0, 8.0, 19.0, 31.0, 35.0, 75.0, 117.0, 227.0, 438.0, 1135.0, 3037.0, 9037.0, 29719.0, 124726.0, 434887.0, 334296.0, 79950.0, 20261.0, 6487.0, 2277.0, 863.0, 385.0, 191.0, 124.0, 71.0, 38.0, 35.0, 19.0, 9.0, 7.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80908203125, -0.784454345703125, -0.75982666015625, -0.735198974609375, -0.7105712890625, -0.685943603515625, -0.66131591796875, -0.636688232421875, -0.612060546875, -0.587432861328125, -0.56280517578125, -0.538177490234375, -0.5135498046875, -0.488922119140625, -0.46429443359375, -0.439666748046875, -0.4150390625, -0.390411376953125, -0.36578369140625, -0.341156005859375, -0.3165283203125, -0.291900634765625, -0.26727294921875, -0.242645263671875, -0.218017578125, -0.193389892578125, -0.16876220703125, -0.144134521484375, -0.1195068359375, -0.094879150390625, -0.07025146484375, -0.045623779296875, -0.02099609375, 0.003631591796875, 0.02825927734375, 0.052886962890625, 0.0775146484375, 0.102142333984375, 0.12677001953125, 0.151397705078125, 0.176025390625, 0.200653076171875, 0.22528076171875, 0.249908447265625, 0.2745361328125, 0.299163818359375, 0.32379150390625, 0.348419189453125, 0.373046875, 0.397674560546875, 0.42230224609375, 0.446929931640625, 0.4715576171875, 0.496185302734375, 0.52081298828125, 0.545440673828125, 0.570068359375, 0.594696044921875, 0.61932373046875, 0.643951416015625, 0.6685791015625, 0.693206787109375, 0.71783447265625, 0.742462158203125, 0.76708984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 10.0, 13.0, 7.0, 21.0, 18.0, 27.0, 24.0, 16.0, 33.0, 31.0, 24.0, 51.0, 48.0, 41.0, 46.0, 36.0, 49.0, 49.0, 43.0, 45.0, 45.0, 38.0, 37.0, 30.0, 36.0, 23.0, 16.0, 23.0, 20.0, 19.0, 16.0, 12.0, 10.0, 9.0, 3.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6669921875, -0.6449661254882812, -0.6229400634765625, -0.6009140014648438, -0.578887939453125, -0.5568618774414062, -0.5348358154296875, -0.5128097534179688, -0.49078369140625, -0.46875762939453125, -0.4467315673828125, -0.42470550537109375, -0.402679443359375, -0.38065338134765625, -0.3586273193359375, -0.33660125732421875, -0.3145751953125, -0.29254913330078125, -0.2705230712890625, -0.24849700927734375, -0.226470947265625, -0.20444488525390625, -0.1824188232421875, -0.16039276123046875, -0.13836669921875, -0.11634063720703125, -0.0943145751953125, -0.07228851318359375, -0.050262451171875, -0.02823638916015625, -0.0062103271484375, 0.01581573486328125, 0.037841796875, 0.05986785888671875, 0.0818939208984375, 0.10391998291015625, 0.125946044921875, 0.14797210693359375, 0.1699981689453125, 0.19202423095703125, 0.21405029296875, 0.23607635498046875, 0.2581024169921875, 0.28012847900390625, 0.302154541015625, 0.32418060302734375, 0.3462066650390625, 0.36823272705078125, 0.3902587890625, 0.41228485107421875, 0.4343109130859375, 0.45633697509765625, 0.478363037109375, 0.5003890991210938, 0.5224151611328125, 0.5444412231445312, 0.56646728515625, 0.5884933471679688, 0.6105194091796875, 0.6325454711914062, 0.654571533203125, 0.6765975952148438, 0.6986236572265625, 0.7206497192382812, 0.74267578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 14.0, 12.0, 25.0, 49.0, 71.0, 111.0, 167.0, 270.0, 492.0, 837.0, 1399.0, 2460.0, 4692.0, 9055.0, 18211.0, 43110.0, 111206.0, 253851.0, 309037.0, 172691.0, 67226.0, 26795.0, 12434.0, 6409.0, 3443.0, 1964.0, 988.0, 578.0, 338.0, 218.0, 122.0, 93.0, 52.0, 31.0, 33.0, 24.0, 8.0, 7.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1573486328125, -0.15261459350585938, -0.14788055419921875, -0.14314651489257812, -0.1384124755859375, -0.13367843627929688, -0.12894439697265625, -0.12421035766601562, -0.119476318359375, -0.11474227905273438, -0.11000823974609375, -0.10527420043945312, -0.1005401611328125, -0.09580612182617188, -0.09107208251953125, -0.08633804321289062, -0.08160400390625, -0.07686996459960938, -0.07213592529296875, -0.06740188598632812, -0.0626678466796875, -0.057933807373046875, -0.05319976806640625, -0.048465728759765625, -0.043731689453125, -0.038997650146484375, -0.03426361083984375, -0.029529571533203125, -0.0247955322265625, -0.020061492919921875, -0.01532745361328125, -0.010593414306640625, -0.005859375, -0.001125335693359375, 0.00360870361328125, 0.008342742919921875, 0.0130767822265625, 0.017810821533203125, 0.02254486083984375, 0.027278900146484375, 0.032012939453125, 0.036746978759765625, 0.04148101806640625, 0.046215057373046875, 0.0509490966796875, 0.055683135986328125, 0.06041717529296875, 0.06515121459960938, 0.06988525390625, 0.07461929321289062, 0.07935333251953125, 0.08408737182617188, 0.0888214111328125, 0.09355545043945312, 0.09828948974609375, 0.10302352905273438, 0.107757568359375, 0.11249160766601562, 0.11722564697265625, 0.12195968627929688, 0.1266937255859375, 0.13142776489257812, 0.13616180419921875, 0.14089584350585938, 0.1456298828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 6.0, 8.0, 9.0, 12.0, 19.0, 28.0, 34.0, 50.0, 67.0, 83.0, 104.0, 118.0, 97.0, 87.0, 70.0, 69.0, 34.0, 27.0, 21.0, 16.0, 5.0, 8.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.312131881713867e-05, -6.10649585723877e-05, -5.900859832763672e-05, -5.695223808288574e-05, -5.4895877838134766e-05, -5.283951759338379e-05, -5.078315734863281e-05, -4.8726797103881836e-05, -4.667043685913086e-05, -4.461407661437988e-05, -4.2557716369628906e-05, -4.050135612487793e-05, -3.844499588012695e-05, -3.6388635635375977e-05, -3.4332275390625e-05, -3.2275915145874023e-05, -3.0219554901123047e-05, -2.816319465637207e-05, -2.6106834411621094e-05, -2.4050474166870117e-05, -2.199411392211914e-05, -1.9937753677368164e-05, -1.7881393432617188e-05, -1.582503318786621e-05, -1.3768672943115234e-05, -1.1712312698364258e-05, -9.655952453613281e-06, -7.599592208862305e-06, -5.543231964111328e-06, -3.4868717193603516e-06, -1.430511474609375e-06, 6.258487701416016e-07, 2.682209014892578e-06, 4.738569259643555e-06, 6.794929504394531e-06, 8.851289749145508e-06, 1.0907649993896484e-05, 1.2964010238647461e-05, 1.5020370483398438e-05, 1.7076730728149414e-05, 1.913309097290039e-05, 2.1189451217651367e-05, 2.3245811462402344e-05, 2.530217170715332e-05, 2.7358531951904297e-05, 2.9414892196655273e-05, 3.147125244140625e-05, 3.3527612686157227e-05, 3.55839729309082e-05, 3.764033317565918e-05, 3.9696693420410156e-05, 4.175305366516113e-05, 4.380941390991211e-05, 4.5865774154663086e-05, 4.792213439941406e-05, 4.997849464416504e-05, 5.2034854888916016e-05, 5.409121513366699e-05, 5.614757537841797e-05, 5.8203935623168945e-05, 6.026029586791992e-05, 6.23166561126709e-05, 6.437301635742188e-05, 6.642937660217285e-05, 6.848573684692383e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 6.0, 8.0, 15.0, 16.0, 27.0, 41.0, 99.0, 132.0, 256.0, 442.0, 989.0, 2198.0, 5811.0, 16260.0, 49573.0, 149797.0, 327879.0, 303718.0, 127480.0, 41128.0, 13827.0, 4995.0, 1913.0, 880.0, 444.0, 247.0, 155.0, 67.0, 57.0, 32.0, 16.0, 12.0, 8.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.187255859375, -0.18156814575195312, -0.17588043212890625, -0.17019271850585938, -0.1645050048828125, -0.15881729125976562, -0.15312957763671875, -0.14744186401367188, -0.141754150390625, -0.13606643676757812, -0.13037872314453125, -0.12469100952148438, -0.1190032958984375, -0.11331558227539062, -0.10762786865234375, -0.10194015502929688, -0.09625244140625, -0.09056472778320312, -0.08487701416015625, -0.07918930053710938, -0.0735015869140625, -0.06781387329101562, -0.06212615966796875, -0.056438446044921875, -0.050750732421875, -0.045063018798828125, -0.03937530517578125, -0.033687591552734375, -0.0279998779296875, -0.022312164306640625, -0.01662445068359375, -0.010936737060546875, -0.0052490234375, 0.000438690185546875, 0.00612640380859375, 0.011814117431640625, 0.0175018310546875, 0.023189544677734375, 0.02887725830078125, 0.034564971923828125, 0.040252685546875, 0.045940399169921875, 0.05162811279296875, 0.057315826416015625, 0.0630035400390625, 0.06869125366210938, 0.07437896728515625, 0.08006668090820312, 0.08575439453125, 0.09144210815429688, 0.09712982177734375, 0.10281753540039062, 0.1085052490234375, 0.11419296264648438, 0.11988067626953125, 0.12556838989257812, 0.131256103515625, 0.13694381713867188, 0.14263153076171875, 0.14831924438476562, 0.1540069580078125, 0.15969467163085938, 0.16538238525390625, 0.17107009887695312, 0.1767578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 12.0, 14.0, 11.0, 16.0, 17.0, 36.0, 33.0, 33.0, 31.0, 46.0, 46.0, 43.0, 44.0, 68.0, 61.0, 65.0, 74.0, 64.0, 39.0, 35.0, 38.0, 32.0, 22.0, 21.0, 18.0, 13.0, 12.0, 13.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12562179565429688, -0.12062835693359375, -0.11563491821289062, -0.1106414794921875, -0.10564804077148438, -0.10065460205078125, -0.09566116333007812, -0.090667724609375, -0.08567428588867188, -0.08068084716796875, -0.07568740844726562, -0.0706939697265625, -0.06570053100585938, -0.06070709228515625, -0.055713653564453125, -0.05072021484375, -0.045726776123046875, -0.04073333740234375, -0.035739898681640625, -0.0307464599609375, -0.025753021240234375, -0.02075958251953125, -0.015766143798828125, -0.010772705078125, -0.005779266357421875, -0.00078582763671875, 0.004207611083984375, 0.0092010498046875, 0.014194488525390625, 0.01918792724609375, 0.024181365966796875, 0.0291748046875, 0.034168243408203125, 0.03916168212890625, 0.044155120849609375, 0.0491485595703125, 0.054141998291015625, 0.05913543701171875, 0.06412887573242188, 0.069122314453125, 0.07411575317382812, 0.07910919189453125, 0.08410263061523438, 0.0890960693359375, 0.09408950805664062, 0.09908294677734375, 0.10407638549804688, 0.10906982421875, 0.11406326293945312, 0.11905670166015625, 0.12405014038085938, 0.1290435791015625, 0.13403701782226562, 0.13903045654296875, 0.14402389526367188, 0.149017333984375, 0.15401077270507812, 0.15900421142578125, 0.16399765014648438, 0.1689910888671875, 0.17398452758789062, 0.17897796630859375, 0.18397140502929688, 0.18896484375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 0.0, 6.0, 9.0, 19.0, 31.0, 55.0, 75.0, 120.0, 153.0, 170.0, 140.0, 81.0, 63.0, 37.0, 17.0, 13.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9310479164123535, -2.8197879791259766, -2.7085282802581787, -2.5972683429718018, -2.486008644104004, -2.374748706817627, -2.26348876953125, -2.152229070663452, -2.0409693717956543, -1.929709553718567, -1.8184497356414795, -1.7071897983551025, -1.5959300994873047, -1.4846701622009277, -1.3734103441238403, -1.262150526046753, -1.150890588760376, -1.0396307706832886, -0.9283709526062012, -0.817111074924469, -0.7058512568473816, -0.5945914387702942, -0.483331561088562, -0.3720717430114746, -0.2608119249343872, -0.1495520919561386, -0.038292258977890015, 0.07296758890151978, 0.18422740697860718, 0.2954872250556946, 0.40674710273742676, 0.5180069208145142, 0.6292667388916016, 0.740526556968689, 0.8517863750457764, 0.9630462527275085, 1.0743060111999512, 1.1855659484863281, 1.2968257665634155, 1.408085584640503, 1.5193454027175903, 1.6306052207946777, 1.7418650388717651, 1.8531248569488525, 1.9643847942352295, 2.0756444931030273, 2.1869044303894043, 2.2981643676757812, 2.409424066543579, 2.520684003829956, 2.631943702697754, 2.743203639984131, 2.8544633388519287, 2.9657232761383057, 3.0769829750061035, 3.1882429122924805, 3.2995028495788574, 3.4107627868652344, 3.5220224857330322, 3.633282423019409, 3.744542121887207, 3.855802059173584, 3.967061996459961, 4.07832145690918, 4.189581394195557]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 11.0, 10.0, 17.0, 17.0, 13.0, 19.0, 21.0, 27.0, 24.0, 27.0, 32.0, 28.0, 32.0, 34.0, 34.0, 41.0, 44.0, 39.0, 44.0, 38.0, 35.0, 41.0, 46.0, 44.0, 24.0, 31.0, 37.0, 35.0, 16.0, 26.0, 15.0, 14.0, 16.0, 10.0, 13.0, 8.0, 10.0, 2.0, 9.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0], "bins": [-1.9154976606369019, -1.8640453815460205, -1.8125929832458496, -1.7611405849456787, -1.7096883058547974, -1.658236026763916, -1.6067836284637451, -1.5553312301635742, -1.5038789510726929, -1.4524266719818115, -1.4009742736816406, -1.3495218753814697, -1.2980695962905884, -1.246617317199707, -1.1951649188995361, -1.1437125205993652, -1.0922602415084839, -1.0408079624176025, -0.9893555641174316, -0.9379032254219055, -0.8864508867263794, -0.8349985480308533, -0.7835462093353271, -0.732093870639801, -0.6806415319442749, -0.6291891932487488, -0.5777368545532227, -0.5262845158576965, -0.4748321771621704, -0.4233798384666443, -0.37192749977111816, -0.32047516107559204, -0.26902270317077637, -0.21757036447525024, -0.16611802577972412, -0.114665687084198, -0.06321334838867188, -0.011761009693145752, 0.03969132900238037, 0.0911436676979065, 0.14259600639343262, 0.19404834508895874, 0.24550068378448486, 0.296953022480011, 0.3484053611755371, 0.39985769987106323, 0.45131003856658936, 0.5027623772621155, 0.5542147159576416, 0.6056670546531677, 0.6571193933486938, 0.70857173204422, 0.7600240707397461, 0.8114764094352722, 0.8629287481307983, 0.9143810868263245, 0.9658334255218506, 1.0172858238220215, 1.0687381029129028, 1.1201903820037842, 1.171642780303955, 1.223095178604126, 1.2745474576950073, 1.3259997367858887, 1.3774521350860596]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 10.0, 19.0, 16.0, 34.0, 42.0, 71.0, 126.0, 158.0, 231.0, 432.0, 711.0, 1213.0, 2031.0, 3451.0, 6076.0, 11007.0, 21756.0, 43937.0, 96380.0, 221005.0, 501852.0, 989783.0, 1135452.0, 645504.0, 285541.0, 119807.0, 53043.0, 25284.0, 13088.0, 6781.0, 3847.0, 2141.0, 1265.0, 825.0, 500.0, 286.0, 200.0, 136.0, 80.0, 56.0, 33.0, 21.0, 23.0, 9.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1776123046875, -0.17130088806152344, -0.16498947143554688, -0.1586780548095703, -0.15236663818359375, -0.1460552215576172, -0.13974380493164062, -0.13343238830566406, -0.1271209716796875, -0.12080955505371094, -0.11449813842773438, -0.10818672180175781, -0.10187530517578125, -0.09556388854980469, -0.08925247192382812, -0.08294105529785156, -0.076629638671875, -0.07031822204589844, -0.06400680541992188, -0.05769538879394531, -0.05138397216796875, -0.04507255554199219, -0.038761138916015625, -0.03244972229003906, -0.0261383056640625, -0.019826889038085938, -0.013515472412109375, -0.0072040557861328125, -0.00089263916015625, 0.0054187774658203125, 0.011730194091796875, 0.018041610717773438, 0.02435302734375, 0.030664443969726562, 0.036975860595703125, 0.04328727722167969, 0.04959869384765625, 0.05591011047363281, 0.062221527099609375, 0.06853294372558594, 0.0748443603515625, 0.08115577697753906, 0.08746719360351562, 0.09377861022949219, 0.10009002685546875, 0.10640144348144531, 0.11271286010742188, 0.11902427673339844, 0.125335693359375, 0.13164710998535156, 0.13795852661132812, 0.1442699432373047, 0.15058135986328125, 0.1568927764892578, 0.16320419311523438, 0.16951560974121094, 0.1758270263671875, 0.18213844299316406, 0.18844985961914062, 0.1947612762451172, 0.20107269287109375, 0.2073841094970703, 0.21369552612304688, 0.22000694274902344, 0.226318359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 14.0, 13.0, 5.0, 11.0, 24.0, 20.0, 21.0, 18.0, 24.0, 20.0, 32.0, 35.0, 40.0, 38.0, 50.0, 42.0, 48.0, 47.0, 43.0, 36.0, 38.0, 38.0, 37.0, 39.0, 23.0, 30.0, 26.0, 23.0, 22.0, 18.0, 18.0, 14.0, 7.0, 12.0, 11.0, 6.0, 6.0, 10.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1881103515625, -0.18162155151367188, -0.17513275146484375, -0.16864395141601562, -0.1621551513671875, -0.15566635131835938, -0.14917755126953125, -0.14268875122070312, -0.136199951171875, -0.12971115112304688, -0.12322235107421875, -0.11673355102539062, -0.1102447509765625, -0.10375595092773438, -0.09726715087890625, -0.09077835083007812, -0.08428955078125, -0.07780075073242188, -0.07131195068359375, -0.06482315063476562, -0.0583343505859375, -0.051845550537109375, -0.04535675048828125, -0.038867950439453125, -0.032379150390625, -0.025890350341796875, -0.01940155029296875, -0.012912750244140625, -0.0064239501953125, 6.4849853515625e-05, 0.00655364990234375, 0.013042449951171875, 0.01953125, 0.026020050048828125, 0.03250885009765625, 0.038997650146484375, 0.0454864501953125, 0.051975250244140625, 0.05846405029296875, 0.06495285034179688, 0.071441650390625, 0.07793045043945312, 0.08441925048828125, 0.09090805053710938, 0.0973968505859375, 0.10388565063476562, 0.11037445068359375, 0.11686325073242188, 0.12335205078125, 0.12984085083007812, 0.13632965087890625, 0.14281845092773438, 0.1493072509765625, 0.15579605102539062, 0.16228485107421875, 0.16877365112304688, 0.175262451171875, 0.18175125122070312, 0.18824005126953125, 0.19472885131835938, 0.2012176513671875, 0.20770645141601562, 0.21419525146484375, 0.22068405151367188, 0.2271728515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 2.0, 10.0, 10.0, 17.0, 33.0, 48.0, 69.0, 131.0, 249.0, 436.0, 968.0, 2332.0, 6455.0, 20357.0, 80436.0, 421312.0, 2449237.0, 1000042.0, 159054.0, 36237.0, 10414.0, 3677.0, 1414.0, 616.0, 293.0, 197.0, 87.0, 60.0, 34.0, 21.0, 13.0, 6.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3900489807128906, -0.37360382080078125, -0.3571586608886719, -0.3407135009765625, -0.3242683410644531, -0.30782318115234375, -0.2913780212402344, -0.274932861328125, -0.2584877014160156, -0.24204254150390625, -0.22559738159179688, -0.2091522216796875, -0.19270706176757812, -0.17626190185546875, -0.15981674194335938, -0.14337158203125, -0.12692642211914062, -0.11048126220703125, -0.09403610229492188, -0.0775909423828125, -0.061145782470703125, -0.04470062255859375, -0.028255462646484375, -0.011810302734375, 0.004634857177734375, 0.02108001708984375, 0.037525177001953125, 0.0539703369140625, 0.07041549682617188, 0.08686065673828125, 0.10330581665039062, 0.1197509765625, 0.13619613647460938, 0.15264129638671875, 0.16908645629882812, 0.1855316162109375, 0.20197677612304688, 0.21842193603515625, 0.23486709594726562, 0.251312255859375, 0.2677574157714844, 0.28420257568359375, 0.3006477355957031, 0.3170928955078125, 0.3335380554199219, 0.34998321533203125, 0.3664283752441406, 0.38287353515625, 0.3993186950683594, 0.41576385498046875, 0.4322090148925781, 0.4486541748046875, 0.4650993347167969, 0.48154449462890625, 0.4979896545410156, 0.514434814453125, 0.5308799743652344, 0.5473251342773438, 0.5637702941894531, 0.5802154541015625, 0.5966606140136719, 0.6131057739257812, 0.6295509338378906, 0.64599609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 7.0, 12.0, 15.0, 23.0, 34.0, 43.0, 74.0, 109.0, 133.0, 277.0, 408.0, 610.0, 696.0, 519.0, 388.0, 223.0, 168.0, 113.0, 74.0, 51.0, 28.0, 22.0, 17.0, 16.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3515625, -0.33330535888671875, -0.3150482177734375, -0.29679107666015625, -0.278533935546875, -0.26027679443359375, -0.2420196533203125, -0.22376251220703125, -0.20550537109375, -0.18724822998046875, -0.1689910888671875, -0.15073394775390625, -0.132476806640625, -0.11421966552734375, -0.0959625244140625, -0.07770538330078125, -0.0594482421875, -0.04119110107421875, -0.0229339599609375, -0.00467681884765625, 0.013580322265625, 0.03183746337890625, 0.0500946044921875, 0.06835174560546875, 0.08660888671875, 0.10486602783203125, 0.1231231689453125, 0.14138031005859375, 0.159637451171875, 0.17789459228515625, 0.1961517333984375, 0.21440887451171875, 0.232666015625, 0.25092315673828125, 0.2691802978515625, 0.28743743896484375, 0.305694580078125, 0.32395172119140625, 0.3422088623046875, 0.36046600341796875, 0.37872314453125, 0.39698028564453125, 0.4152374267578125, 0.43349456787109375, 0.451751708984375, 0.47000885009765625, 0.4882659912109375, 0.5065231323242188, 0.5247802734375, 0.5430374145507812, 0.5612945556640625, 0.5795516967773438, 0.597808837890625, 0.6160659790039062, 0.6343231201171875, 0.6525802612304688, 0.67083740234375, 0.6890945434570312, 0.7073516845703125, 0.7256088256835938, 0.743865966796875, 0.7621231079101562, 0.7803802490234375, 0.7986373901367188, 0.81689453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 7.0, 33.0, 83.0, 179.0, 297.0, 211.0, 121.0, 43.0, 15.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.668066024780273, -6.467572212219238, -6.267077922821045, -6.06658411026001, -5.866089820861816, -5.665596008300781, -5.465102195739746, -5.264607906341553, -5.064113616943359, -4.863619804382324, -4.663125514984131, -4.462631702423096, -4.262137413024902, -4.061643600463867, -3.861149549484253, -3.6606554985046387, -3.4601616859436035, -3.2596676349639893, -3.059173583984375, -2.85867977142334, -2.6581854820251465, -2.4576916694641113, -2.257197618484497, -2.056703567504883, -1.8562095165252686, -1.6557154655456543, -1.45522141456604, -1.2547274827957153, -1.054233431816101, -0.8537393808364868, -0.6532454490661621, -0.45275139808654785, -0.2522573471069336, -0.051763325929641724, 0.14873069524765015, 0.34922468662261963, 0.5497187376022339, 0.7502127885818481, 0.9507067203521729, 1.151200771331787, 1.3516948223114014, 1.5521888732910156, 1.7526829242706299, 1.9531768560409546, 2.1536707878112793, 2.3541650772094727, 2.554658889770508, 2.755152940750122, 2.9556469917297363, 3.1561410427093506, 3.356635093688965, 3.55712890625, 3.7576231956481934, 3.9581170082092285, 4.158611297607422, 4.359105110168457, 4.559598922729492, 4.760092735290527, 4.960587024688721, 5.161080837249756, 5.361575126647949, 5.562068939208984, 5.7625627517700195, 5.963057041168213, 6.163551330566406]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 4.0, 3.0, 8.0, 7.0, 6.0, 10.0, 10.0, 13.0, 16.0, 18.0, 18.0, 28.0, 22.0, 34.0, 33.0, 22.0, 28.0, 35.0, 43.0, 41.0, 40.0, 33.0, 45.0, 40.0, 41.0, 43.0, 36.0, 39.0, 32.0, 24.0, 24.0, 21.0, 29.0, 26.0, 19.0, 17.0, 11.0, 17.0, 11.0, 13.0, 9.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0], "bins": [-1.6624239683151245, -1.6147022247314453, -1.5669806003570557, -1.5192588567733765, -1.4715372323989868, -1.4238154888153076, -1.376093864440918, -1.3283721208572388, -1.2806503772735596, -1.2329286336898804, -1.1852070093154907, -1.1374852657318115, -1.0897636413574219, -1.0420418977737427, -0.9943202137947083, -0.9465985298156738, -0.8988768458366394, -0.851155161857605, -0.8034334778785706, -0.7557117938995361, -0.7079900503158569, -0.6602683663368225, -0.6125466823577881, -0.5648249387741089, -0.5171033143997192, -0.4693816304206848, -0.421659916639328, -0.3739382326602936, -0.32621651887893677, -0.27849483489990234, -0.23077315092086792, -0.1830514371395111, -0.1353297233581543, -0.08760802447795868, -0.03988633304834366, 0.007835358381271362, 0.05555705726146698, 0.1032787561416626, 0.15100044012069702, 0.19872215390205383, 0.24644383788108826, 0.2941655218601227, 0.3418872356414795, 0.3896089196205139, 0.43733060359954834, 0.48505231738090515, 0.5327739715576172, 0.5804957151412964, 0.6282173991203308, 0.6759390830993652, 0.7236607670783997, 0.7713824510574341, 0.8191041946411133, 0.8668258786201477, 0.9145475625991821, 0.9622693061828613, 1.009990930557251, 1.0577126741409302, 1.1054342985153198, 1.153156042098999, 1.2008776664733887, 1.2485994100570679, 1.296321153640747, 1.3440427780151367, 1.391764521598816]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 5.0, 10.0, 26.0, 16.0, 26.0, 40.0, 73.0, 80.0, 122.0, 234.0, 377.0, 584.0, 1002.0, 1875.0, 3620.0, 7460.0, 16431.0, 39754.0, 95109.0, 194353.0, 268755.0, 217967.0, 113809.0, 48890.0, 19918.0, 8714.0, 4076.0, 2186.0, 1171.0, 731.0, 415.0, 250.0, 153.0, 111.0, 73.0, 37.0, 23.0, 21.0, 19.0, 14.0, 11.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.397216796875, -0.38465118408203125, -0.3720855712890625, -0.35951995849609375, -0.346954345703125, -0.33438873291015625, -0.3218231201171875, -0.30925750732421875, -0.29669189453125, -0.28412628173828125, -0.2715606689453125, -0.25899505615234375, -0.246429443359375, -0.23386383056640625, -0.2212982177734375, -0.20873260498046875, -0.1961669921875, -0.18360137939453125, -0.1710357666015625, -0.15847015380859375, -0.145904541015625, -0.13333892822265625, -0.1207733154296875, -0.10820770263671875, -0.09564208984375, -0.08307647705078125, -0.0705108642578125, -0.05794525146484375, -0.045379638671875, -0.03281402587890625, -0.0202484130859375, -0.00768280029296875, 0.0048828125, 0.01744842529296875, 0.0300140380859375, 0.04257965087890625, 0.055145263671875, 0.06771087646484375, 0.0802764892578125, 0.09284210205078125, 0.10540771484375, 0.11797332763671875, 0.1305389404296875, 0.14310455322265625, 0.155670166015625, 0.16823577880859375, 0.1808013916015625, 0.19336700439453125, 0.2059326171875, 0.21849822998046875, 0.2310638427734375, 0.24362945556640625, 0.256195068359375, 0.26876068115234375, 0.2813262939453125, 0.29389190673828125, 0.30645751953125, 0.31902313232421875, 0.3315887451171875, 0.34415435791015625, 0.356719970703125, 0.36928558349609375, 0.3818511962890625, 0.39441680908203125, 0.406982421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 7.0, 13.0, 8.0, 17.0, 14.0, 19.0, 22.0, 23.0, 32.0, 25.0, 38.0, 37.0, 53.0, 30.0, 34.0, 33.0, 39.0, 39.0, 43.0, 41.0, 47.0, 47.0, 42.0, 33.0, 38.0, 34.0, 24.0, 27.0, 22.0, 20.0, 16.0, 11.0, 14.0, 9.0, 9.0, 7.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2294921875, -0.22152328491210938, -0.21355438232421875, -0.20558547973632812, -0.1976165771484375, -0.18964767456054688, -0.18167877197265625, -0.17370986938476562, -0.165740966796875, -0.15777206420898438, -0.14980316162109375, -0.14183425903320312, -0.1338653564453125, -0.12589645385742188, -0.11792755126953125, -0.10995864868164062, -0.10198974609375, -0.09402084350585938, -0.08605194091796875, -0.07808303833007812, -0.0701141357421875, -0.062145233154296875, -0.05417633056640625, -0.046207427978515625, -0.038238525390625, -0.030269622802734375, -0.02230072021484375, -0.014331817626953125, -0.0063629150390625, 0.001605987548828125, 0.00957489013671875, 0.017543792724609375, 0.0255126953125, 0.033481597900390625, 0.04145050048828125, 0.049419403076171875, 0.0573883056640625, 0.06535720825195312, 0.07332611083984375, 0.08129501342773438, 0.089263916015625, 0.09723281860351562, 0.10520172119140625, 0.11317062377929688, 0.1211395263671875, 0.12910842895507812, 0.13707733154296875, 0.14504623413085938, 0.15301513671875, 0.16098403930664062, 0.16895294189453125, 0.17692184448242188, 0.1848907470703125, 0.19285964965820312, 0.20082855224609375, 0.20879745483398438, 0.216766357421875, 0.22473526000976562, 0.23270416259765625, 0.24067306518554688, 0.2486419677734375, 0.2566108703613281, 0.26457977294921875, 0.2725486755371094, 0.280517578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 13.0, 22.0, 43.0, 52.0, 104.0, 164.0, 327.0, 666.0, 1192.0, 2603.0, 5693.0, 13766.0, 38079.0, 111645.0, 280261.0, 337954.0, 164645.0, 56356.0, 20058.0, 8064.0, 3580.0, 1578.0, 764.0, 377.0, 226.0, 137.0, 74.0, 26.0, 18.0, 16.0, 15.0, 10.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.5810546875, -0.5654296875, -0.5498046875, -0.5341796875, -0.5185546875, -0.5029296875, -0.4873046875, -0.4716796875, -0.4560546875, -0.4404296875, -0.4248046875, -0.4091796875, -0.3935546875, -0.3779296875, -0.3623046875, -0.3466796875, -0.3310546875, -0.3154296875, -0.2998046875, -0.2841796875, -0.2685546875, -0.2529296875, -0.2373046875, -0.2216796875, -0.2060546875, -0.1904296875, -0.1748046875, -0.1591796875, -0.1435546875, -0.1279296875, -0.1123046875, -0.0966796875, -0.0810546875, -0.0654296875, -0.0498046875, -0.0341796875, -0.0185546875, -0.0029296875, 0.0126953125, 0.0283203125, 0.0439453125, 0.0595703125, 0.0751953125, 0.0908203125, 0.1064453125, 0.1220703125, 0.1376953125, 0.1533203125, 0.1689453125, 0.1845703125, 0.2001953125, 0.2158203125, 0.2314453125, 0.2470703125, 0.2626953125, 0.2783203125, 0.2939453125, 0.3095703125, 0.3251953125, 0.3408203125, 0.3564453125, 0.3720703125, 0.3876953125, 0.4033203125, 0.4189453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 10.0, 11.0, 14.0, 13.0, 9.0, 17.0, 17.0, 22.0, 22.0, 23.0, 31.0, 48.0, 47.0, 56.0, 49.0, 46.0, 45.0, 41.0, 46.0, 61.0, 39.0, 43.0, 36.0, 34.0, 35.0, 41.0, 19.0, 21.0, 17.0, 16.0, 15.0, 8.0, 8.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69091796875, -0.6678314208984375, -0.644744873046875, -0.6216583251953125, -0.59857177734375, -0.5754852294921875, -0.552398681640625, -0.5293121337890625, -0.5062255859375, -0.4831390380859375, -0.460052490234375, -0.4369659423828125, -0.41387939453125, -0.3907928466796875, -0.367706298828125, -0.3446197509765625, -0.321533203125, -0.2984466552734375, -0.275360107421875, -0.2522735595703125, -0.22918701171875, -0.2061004638671875, -0.183013916015625, -0.1599273681640625, -0.1368408203125, -0.1137542724609375, -0.090667724609375, -0.0675811767578125, -0.04449462890625, -0.0214080810546875, 0.001678466796875, 0.0247650146484375, 0.0478515625, 0.0709381103515625, 0.094024658203125, 0.1171112060546875, 0.14019775390625, 0.1632843017578125, 0.186370849609375, 0.2094573974609375, 0.2325439453125, 0.2556304931640625, 0.278717041015625, 0.3018035888671875, 0.32489013671875, 0.3479766845703125, 0.371063232421875, 0.3941497802734375, 0.417236328125, 0.4403228759765625, 0.463409423828125, 0.4864959716796875, 0.50958251953125, 0.5326690673828125, 0.555755615234375, 0.5788421630859375, 0.6019287109375, 0.6250152587890625, 0.648101806640625, 0.6711883544921875, 0.69427490234375, 0.7173614501953125, 0.740447998046875, 0.7635345458984375, 0.78662109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 16.0, 28.0, 59.0, 107.0, 161.0, 363.0, 787.0, 1724.0, 4557.0, 11837.0, 32471.0, 88906.0, 213075.0, 320852.0, 222534.0, 95113.0, 34913.0, 12619.0, 4830.0, 1985.0, 862.0, 363.0, 155.0, 90.0, 53.0, 39.0, 14.0, 3.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10772705078125, -0.1036672592163086, -0.09960746765136719, -0.09554767608642578, -0.09148788452148438, -0.08742809295654297, -0.08336830139160156, -0.07930850982666016, -0.07524871826171875, -0.07118892669677734, -0.06712913513183594, -0.06306934356689453, -0.059009552001953125, -0.05494976043701172, -0.05088996887207031, -0.046830177307128906, -0.0427703857421875, -0.038710594177246094, -0.03465080261230469, -0.03059101104736328, -0.026531219482421875, -0.02247142791748047, -0.018411636352539062, -0.014351844787597656, -0.01029205322265625, -0.006232261657714844, -0.0021724700927734375, 0.0018873214721679688, 0.005947113037109375, 0.010006904602050781, 0.014066696166992188, 0.018126487731933594, 0.022186279296875, 0.026246070861816406, 0.030305862426757812, 0.03436565399169922, 0.038425445556640625, 0.04248523712158203, 0.04654502868652344, 0.050604820251464844, 0.05466461181640625, 0.058724403381347656, 0.06278419494628906, 0.06684398651123047, 0.07090377807617188, 0.07496356964111328, 0.07902336120605469, 0.0830831527709961, 0.0871429443359375, 0.0912027359008789, 0.09526252746582031, 0.09932231903076172, 0.10338211059570312, 0.10744190216064453, 0.11150169372558594, 0.11556148529052734, 0.11962127685546875, 0.12368106842041016, 0.12774085998535156, 0.13180065155029297, 0.13586044311523438, 0.13992023468017578, 0.1439800262451172, 0.1480398178100586, 0.152099609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 7.0, 4.0, 5.0, 14.0, 18.0, 26.0, 28.0, 41.0, 37.0, 49.0, 66.0, 69.0, 89.0, 75.0, 72.0, 71.0, 55.0, 47.0, 50.0, 35.0, 39.0, 24.0, 16.0, 12.0, 7.0, 4.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.2928924560546875e-05, -5.1480717957019806e-05, -5.003251135349274e-05, -4.858430474996567e-05, -4.71360981464386e-05, -4.568789154291153e-05, -4.423968493938446e-05, -4.279147833585739e-05, -4.134327173233032e-05, -3.989506512880325e-05, -3.8446858525276184e-05, -3.6998651921749115e-05, -3.5550445318222046e-05, -3.410223871469498e-05, -3.265403211116791e-05, -3.120582550764084e-05, -2.975761890411377e-05, -2.83094123005867e-05, -2.686120569705963e-05, -2.5412999093532562e-05, -2.3964792490005493e-05, -2.2516585886478424e-05, -2.1068379282951355e-05, -1.9620172679424286e-05, -1.8171966075897217e-05, -1.6723759472370148e-05, -1.527555286884308e-05, -1.382734626531601e-05, -1.237913966178894e-05, -1.0930933058261871e-05, -9.482726454734802e-06, -8.034519851207733e-06, -6.586313247680664e-06, -5.138106644153595e-06, -3.689900040626526e-06, -2.2416934370994568e-06, -7.934868335723877e-07, 6.547197699546814e-07, 2.1029263734817505e-06, 3.5511329770088196e-06, 4.999339580535889e-06, 6.447546184062958e-06, 7.895752787590027e-06, 9.343959391117096e-06, 1.0792165994644165e-05, 1.2240372598171234e-05, 1.3688579201698303e-05, 1.5136785805225372e-05, 1.658499240875244e-05, 1.803319901227951e-05, 1.948140561580658e-05, 2.092961221933365e-05, 2.2377818822860718e-05, 2.3826025426387787e-05, 2.5274232029914856e-05, 2.6722438633441925e-05, 2.8170645236968994e-05, 2.9618851840496063e-05, 3.106705844402313e-05, 3.25152650475502e-05, 3.396347165107727e-05, 3.541167825460434e-05, 3.685988485813141e-05, 3.830809146165848e-05, 3.975629806518555e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 3.0, 14.0, 11.0, 13.0, 43.0, 58.0, 75.0, 113.0, 181.0, 323.0, 604.0, 1028.0, 2024.0, 4187.0, 9307.0, 21142.0, 49221.0, 109415.0, 204692.0, 263349.0, 197124.0, 103052.0, 45832.0, 19797.0, 8690.0, 3989.0, 1918.0, 996.0, 531.0, 306.0, 206.0, 88.0, 71.0, 52.0, 32.0, 18.0, 9.0, 12.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.12481689453125, -0.12129688262939453, -0.11777687072753906, -0.1142568588256836, -0.11073684692382812, -0.10721683502197266, -0.10369682312011719, -0.10017681121826172, -0.09665679931640625, -0.09313678741455078, -0.08961677551269531, -0.08609676361083984, -0.08257675170898438, -0.0790567398071289, -0.07553672790527344, -0.07201671600341797, -0.0684967041015625, -0.06497669219970703, -0.06145668029785156, -0.057936668395996094, -0.054416656494140625, -0.050896644592285156, -0.04737663269042969, -0.04385662078857422, -0.04033660888671875, -0.03681659698486328, -0.03329658508300781, -0.029776573181152344, -0.026256561279296875, -0.022736549377441406, -0.019216537475585938, -0.01569652557373047, -0.012176513671875, -0.008656501770019531, -0.0051364898681640625, -0.0016164779663085938, 0.001903533935546875, 0.005423545837402344, 0.008943557739257812, 0.012463569641113281, 0.01598358154296875, 0.01950359344482422, 0.023023605346679688, 0.026543617248535156, 0.030063629150390625, 0.033583641052246094, 0.03710365295410156, 0.04062366485595703, 0.0441436767578125, 0.04766368865966797, 0.05118370056152344, 0.054703712463378906, 0.058223724365234375, 0.061743736267089844, 0.06526374816894531, 0.06878376007080078, 0.07230377197265625, 0.07582378387451172, 0.07934379577636719, 0.08286380767822266, 0.08638381958007812, 0.0899038314819336, 0.09342384338378906, 0.09694385528564453, 0.1004638671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 1.0, 10.0, 7.0, 13.0, 11.0, 12.0, 14.0, 17.0, 26.0, 32.0, 28.0, 46.0, 43.0, 46.0, 54.0, 65.0, 63.0, 47.0, 57.0, 51.0, 53.0, 40.0, 39.0, 41.0, 44.0, 30.0, 20.0, 20.0, 16.0, 15.0, 12.0, 8.0, 7.0, 9.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14590072631835938, -0.14153289794921875, -0.13716506958007812, -0.1327972412109375, -0.12842941284179688, -0.12406158447265625, -0.11969375610351562, -0.115325927734375, -0.11095809936523438, -0.10659027099609375, -0.10222244262695312, -0.0978546142578125, -0.09348678588867188, -0.08911895751953125, -0.08475112915039062, -0.08038330078125, -0.07601547241210938, -0.07164764404296875, -0.06727981567382812, -0.0629119873046875, -0.058544158935546875, -0.05417633056640625, -0.049808502197265625, -0.045440673828125, -0.041072845458984375, -0.03670501708984375, -0.032337188720703125, -0.0279693603515625, -0.023601531982421875, -0.01923370361328125, -0.014865875244140625, -0.010498046875, -0.006130218505859375, -0.00176239013671875, 0.002605438232421875, 0.0069732666015625, 0.011341094970703125, 0.01570892333984375, 0.020076751708984375, 0.024444580078125, 0.028812408447265625, 0.03318023681640625, 0.037548065185546875, 0.0419158935546875, 0.046283721923828125, 0.05065155029296875, 0.055019378662109375, 0.05938720703125, 0.06375503540039062, 0.06812286376953125, 0.07249069213867188, 0.0768585205078125, 0.08122634887695312, 0.08559417724609375, 0.08996200561523438, 0.094329833984375, 0.09869766235351562, 0.10306549072265625, 0.10743331909179688, 0.1118011474609375, 0.11616897583007812, 0.12053680419921875, 0.12490463256835938, 0.1292724609375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 8.0, 5.0, 5.0, 27.0, 35.0, 38.0, 74.0, 94.0, 146.0, 145.0, 156.0, 97.0, 65.0, 46.0, 28.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0944294929504395, -1.9904919862747192, -1.8865545988082886, -1.7826170921325684, -1.6786795854568481, -1.574742078781128, -1.4708046913146973, -1.366867184638977, -1.2629296779632568, -1.1589921712875366, -1.055054783821106, -0.9511172771453857, -0.8471797704696655, -0.7432423233985901, -0.6393048763275146, -0.5353673696517944, -0.43142998218536377, -0.32749250531196594, -0.2235550433397293, -0.11961758136749268, -0.01568010449409485, 0.08825737237930298, 0.19219481945037842, 0.29613232612609863, 0.4000697731971741, 0.5040072202682495, 0.6079447269439697, 0.7118821740150452, 0.8158196210861206, 0.9197571277618408, 1.0236945152282715, 1.1276321411132812, 1.231569528579712, 1.3355070352554321, 1.4394444227218628, 1.543381929397583, 1.6473194360733032, 1.7512569427490234, 1.855194330215454, 1.9591318368911743, 2.0630693435668945, 2.167006731033325, 2.270944356918335, 2.3748817443847656, 2.4788191318511963, 2.582756757736206, 2.6866941452026367, 2.7906317710876465, 2.894568920135498, 2.9985063076019287, 3.1024439334869385, 3.206381320953369, 3.3103187084198, 3.4142563343048096, 3.5181937217712402, 3.62213134765625, 3.7260687351226807, 3.8300061225891113, 3.933943748474121, 4.037880897521973, 4.141818523406982, 4.245756149291992, 4.349693298339844, 4.4536309242248535, 4.557568550109863]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 11.0, 13.0, 7.0, 4.0, 14.0, 11.0, 13.0, 17.0, 10.0, 19.0, 23.0, 24.0, 23.0, 22.0, 22.0, 30.0, 35.0, 29.0, 37.0, 46.0, 24.0, 44.0, 40.0, 46.0, 31.0, 37.0, 33.0, 40.0, 40.0, 27.0, 31.0, 28.0, 25.0, 21.0, 19.0, 12.0, 13.0, 15.0, 14.0, 10.0, 12.0, 7.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7009193897247314, -1.646073341369629, -1.5912272930145264, -1.5363812446594238, -1.4815351963043213, -1.4266891479492188, -1.3718432188034058, -1.3169971704483032, -1.2621511220932007, -1.2073050737380981, -1.1524590253829956, -1.097612977027893, -1.04276704788208, -0.9879209399223328, -0.933074951171875, -0.8782289028167725, -0.8233828544616699, -0.7685368061065674, -0.7136907577514648, -0.6588447690010071, -0.6039987206459045, -0.549152672290802, -0.49430665373802185, -0.4394606351852417, -0.38461458683013916, -0.3297685384750366, -0.27492251992225647, -0.22007648646831512, -0.16523045301437378, -0.11038440465927124, -0.05553838610649109, -0.0006923675537109375, 0.05415356159210205, 0.1089995950460434, 0.16384562849998474, 0.2186916619539261, 0.27353769540786743, 0.32838374376296997, 0.3832297623157501, 0.4380757808685303, 0.4929218292236328, 0.5477678775787354, 0.6026139259338379, 0.6574599146842957, 0.7123059630393982, 0.7671520113945007, 0.8219980001449585, 0.876844048500061, 0.9316900968551636, 0.9865361452102661, 1.0413821935653687, 1.0962282419204712, 1.1510741710662842, 1.2059202194213867, 1.2607662677764893, 1.3156123161315918, 1.3704583644866943, 1.4253044128417969, 1.4801504611968994, 1.534996509552002, 1.5898425579071045, 1.644688606262207, 1.69953453540802, 1.7543805837631226, 1.809226632118225]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 26.0, 23.0, 52.0, 79.0, 160.0, 275.0, 435.0, 782.0, 1383.0, 2545.0, 4511.0, 8838.0, 18549.0, 43714.0, 116084.0, 356995.0, 1063370.0, 1566267.0, 674976.0, 208242.0, 71182.0, 28629.0, 12887.0, 6535.0, 3357.0, 1892.0, 1041.0, 596.0, 338.0, 197.0, 131.0, 74.0, 42.0, 22.0, 20.0, 5.0, 7.0, 8.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22412109375, -0.21488571166992188, -0.20565032958984375, -0.19641494750976562, -0.1871795654296875, -0.17794418334960938, -0.16870880126953125, -0.15947341918945312, -0.150238037109375, -0.14100265502929688, -0.13176727294921875, -0.12253189086914062, -0.1132965087890625, -0.10406112670898438, -0.09482574462890625, -0.08559036254882812, -0.07635498046875, -0.06711959838867188, -0.05788421630859375, -0.048648834228515625, -0.0394134521484375, -0.030178070068359375, -0.02094268798828125, -0.011707305908203125, -0.002471923828125, 0.006763458251953125, 0.01599884033203125, 0.025234222412109375, 0.0344696044921875, 0.043704986572265625, 0.05294036865234375, 0.062175750732421875, 0.0714111328125, 0.08064651489257812, 0.08988189697265625, 0.09911727905273438, 0.1083526611328125, 0.11758804321289062, 0.12682342529296875, 0.13605880737304688, 0.145294189453125, 0.15452957153320312, 0.16376495361328125, 0.17300033569335938, 0.1822357177734375, 0.19147109985351562, 0.20070648193359375, 0.20994186401367188, 0.21917724609375, 0.22841262817382812, 0.23764801025390625, 0.24688339233398438, 0.2561187744140625, 0.2653541564941406, 0.27458953857421875, 0.2838249206542969, 0.293060302734375, 0.3022956848144531, 0.31153106689453125, 0.3207664489746094, 0.3300018310546875, 0.3392372131347656, 0.34847259521484375, 0.3577079772949219, 0.366943359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 6.0, 4.0, 13.0, 17.0, 11.0, 11.0, 17.0, 18.0, 25.0, 35.0, 28.0, 28.0, 34.0, 27.0, 38.0, 45.0, 37.0, 34.0, 41.0, 44.0, 43.0, 33.0, 25.0, 42.0, 34.0, 29.0, 26.0, 25.0, 26.0, 20.0, 27.0, 18.0, 18.0, 20.0, 12.0, 9.0, 9.0, 8.0, 6.0, 9.0, 4.0, 8.0, 5.0, 3.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1768798828125, -0.17090415954589844, -0.16492843627929688, -0.1589527130126953, -0.15297698974609375, -0.1470012664794922, -0.14102554321289062, -0.13504981994628906, -0.1290740966796875, -0.12309837341308594, -0.11712265014648438, -0.11114692687988281, -0.10517120361328125, -0.09919548034667969, -0.09321975708007812, -0.08724403381347656, -0.081268310546875, -0.07529258728027344, -0.06931686401367188, -0.06334114074707031, -0.05736541748046875, -0.05138969421386719, -0.045413970947265625, -0.03943824768066406, -0.0334625244140625, -0.027486801147460938, -0.021511077880859375, -0.015535354614257812, -0.00955963134765625, -0.0035839080810546875, 0.002391815185546875, 0.008367538452148438, 0.01434326171875, 0.020318984985351562, 0.026294708251953125, 0.03227043151855469, 0.03824615478515625, 0.04422187805175781, 0.050197601318359375, 0.05617332458496094, 0.0621490478515625, 0.06812477111816406, 0.07410049438476562, 0.08007621765136719, 0.08605194091796875, 0.09202766418457031, 0.09800338745117188, 0.10397911071777344, 0.109954833984375, 0.11593055725097656, 0.12190628051757812, 0.1278820037841797, 0.13385772705078125, 0.1398334503173828, 0.14580917358398438, 0.15178489685058594, 0.1577606201171875, 0.16373634338378906, 0.16971206665039062, 0.1756877899169922, 0.18166351318359375, 0.1876392364501953, 0.19361495971679688, 0.19959068298339844, 0.20556640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 8.0, 26.0, 20.0, 42.0, 53.0, 106.0, 186.0, 353.0, 558.0, 1013.0, 1871.0, 3682.0, 7552.0, 16981.0, 42101.0, 123714.0, 458745.0, 2061875.0, 1108216.0, 242554.0, 74064.0, 27408.0, 11802.0, 5392.0, 2694.0, 1412.0, 767.0, 432.0, 270.0, 145.0, 94.0, 61.0, 29.0, 13.0, 13.0, 10.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.46337890625, -0.45111083984375, -0.4388427734375, -0.42657470703125, -0.414306640625, -0.40203857421875, -0.3897705078125, -0.37750244140625, -0.365234375, -0.35296630859375, -0.3406982421875, -0.32843017578125, -0.316162109375, -0.30389404296875, -0.2916259765625, -0.27935791015625, -0.26708984375, -0.25482177734375, -0.2425537109375, -0.23028564453125, -0.218017578125, -0.20574951171875, -0.1934814453125, -0.18121337890625, -0.1689453125, -0.15667724609375, -0.1444091796875, -0.13214111328125, -0.119873046875, -0.10760498046875, -0.0953369140625, -0.08306884765625, -0.07080078125, -0.05853271484375, -0.0462646484375, -0.03399658203125, -0.021728515625, -0.00946044921875, 0.0028076171875, 0.01507568359375, 0.02734375, 0.03961181640625, 0.0518798828125, 0.06414794921875, 0.076416015625, 0.08868408203125, 0.1009521484375, 0.11322021484375, 0.12548828125, 0.13775634765625, 0.1500244140625, 0.16229248046875, 0.174560546875, 0.18682861328125, 0.1990966796875, 0.21136474609375, 0.2236328125, 0.23590087890625, 0.2481689453125, 0.26043701171875, 0.272705078125, 0.28497314453125, 0.2972412109375, 0.30950927734375, 0.32177734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 6.0, 6.0, 6.0, 13.0, 15.0, 22.0, 24.0, 36.0, 53.0, 67.0, 80.0, 94.0, 175.0, 198.0, 313.0, 430.0, 571.0, 504.0, 391.0, 288.0, 216.0, 146.0, 102.0, 74.0, 55.0, 41.0, 37.0, 27.0, 20.0, 14.0, 8.0, 4.0, 5.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.497802734375, -0.4835548400878906, -0.46930694580078125, -0.4550590515136719, -0.4408111572265625, -0.4265632629394531, -0.41231536865234375, -0.3980674743652344, -0.383819580078125, -0.3695716857910156, -0.35532379150390625, -0.3410758972167969, -0.3268280029296875, -0.3125801086425781, -0.29833221435546875, -0.2840843200683594, -0.26983642578125, -0.2555885314941406, -0.24134063720703125, -0.22709274291992188, -0.2128448486328125, -0.19859695434570312, -0.18434906005859375, -0.17010116577148438, -0.155853271484375, -0.14160537719726562, -0.12735748291015625, -0.11310958862304688, -0.0988616943359375, -0.08461380004882812, -0.07036590576171875, -0.056118011474609375, -0.0418701171875, -0.027622222900390625, -0.01337432861328125, 0.000873565673828125, 0.0151214599609375, 0.029369354248046875, 0.04361724853515625, 0.057865142822265625, 0.072113037109375, 0.08636093139648438, 0.10060882568359375, 0.11485671997070312, 0.1291046142578125, 0.14335250854492188, 0.15760040283203125, 0.17184829711914062, 0.18609619140625, 0.20034408569335938, 0.21459197998046875, 0.22883987426757812, 0.2430877685546875, 0.2573356628417969, 0.27158355712890625, 0.2858314514160156, 0.300079345703125, 0.3143272399902344, 0.32857513427734375, 0.3428230285644531, 0.3570709228515625, 0.3713188171386719, 0.38556671142578125, 0.3998146057128906, 0.4140625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 1.0, 8.0, 25.0, 57.0, 155.0, 292.0, 284.0, 115.0, 42.0, 12.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.028602600097656, -9.77835750579834, -9.528112411499023, -9.277868270874023, -9.027623176574707, -8.77737808227539, -8.527132987976074, -8.276887893676758, -8.026643753051758, -7.776398658752441, -7.526154041290283, -7.275908946990967, -7.025664329528809, -6.775419235229492, -6.525174140930176, -6.274929046630859, -6.024683952331543, -5.774438858032227, -5.524194240570068, -5.273949146270752, -5.023704528808594, -4.773459434509277, -4.523214340209961, -4.2729692459106445, -4.022724628448486, -3.772479772567749, -3.5222349166870117, -3.2719898223876953, -3.021744966506958, -2.7715001106262207, -2.5212550163269043, -2.271010160446167, -2.020766258239746, -1.7705214023590088, -1.520276427268982, -1.270031452178955, -1.0197865962982178, -0.7695417404174805, -0.5192967653274536, -0.26905179023742676, -0.018806934356689453, 0.23143798112869263, 0.4816828966140747, 0.7319278120994568, 0.9821727275848389, 1.2324175834655762, 1.482662558555603, 1.7329075336456299, 1.9831523895263672, 2.2333972454071045, 2.483642101287842, 2.733887195587158, 2.9841320514678955, 3.234376907348633, 3.484622001647949, 3.7348668575286865, 3.985111713409424, 4.23535680770874, 4.485601425170898, 4.735846519470215, 4.986091613769531, 5.2363362312316895, 5.486581325531006, 5.736825942993164, 5.9870710372924805]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 10.0, 7.0, 7.0, 8.0, 18.0, 20.0, 25.0, 20.0, 35.0, 33.0, 46.0, 44.0, 36.0, 39.0, 50.0, 45.0, 59.0, 53.0, 36.0, 34.0, 52.0, 45.0, 50.0, 38.0, 24.0, 23.0, 33.0, 24.0, 15.0, 15.0, 15.0, 7.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7441456317901611, -1.6884320974349976, -1.632718563079834, -1.5770050287246704, -1.5212914943695068, -1.4655779600143433, -1.4098644256591797, -1.3541508913040161, -1.2984373569488525, -1.242723822593689, -1.1870102882385254, -1.1312967538833618, -1.0755832195281982, -1.0198696851730347, -0.9641561508178711, -0.9084426164627075, -0.8527290225028992, -0.7970154881477356, -0.741301953792572, -0.6855884194374084, -0.6298748850822449, -0.5741612911224365, -0.518447756767273, -0.46273425221443176, -0.4070207178592682, -0.3513071835041046, -0.29559364914894104, -0.23988009989261627, -0.1841665655374527, -0.12845301628112793, -0.07273948192596436, -0.01702594757080078, 0.03868758678436279, 0.09440112113952637, 0.15011465549468994, 0.2058282047510147, 0.2615417242050171, 0.31725528836250305, 0.3729688227176666, 0.4286823570728302, 0.4843958914279938, 0.5401094555854797, 0.5958229899406433, 0.6515365242958069, 0.7072500586509705, 0.762963593006134, 0.8186771273612976, 0.8743906617164612, 0.9301041960716248, 0.9858177304267883, 1.0415313243865967, 1.0972448587417603, 1.1529583930969238, 1.2086719274520874, 1.264385461807251, 1.3200989961624146, 1.3758125305175781, 1.4315260648727417, 1.4872395992279053, 1.5429531335830688, 1.5986666679382324, 1.654380202293396, 1.7100937366485596, 1.7658072710037231, 1.8215208053588867]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 18.0, 19.0, 22.0, 33.0, 49.0, 75.0, 121.0, 187.0, 293.0, 478.0, 775.0, 1185.0, 2024.0, 3526.0, 5638.0, 9983.0, 17431.0, 30186.0, 50777.0, 81988.0, 121059.0, 155436.0, 163133.0, 141129.0, 101836.0, 66133.0, 39902.0, 23056.0, 13298.0, 7614.0, 4423.0, 2599.0, 1602.0, 875.0, 553.0, 374.0, 246.0, 162.0, 89.0, 63.0, 53.0, 30.0, 19.0, 17.0, 12.0, 6.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1995849609375, -0.19298934936523438, -0.18639373779296875, -0.17979812622070312, -0.1732025146484375, -0.16660690307617188, -0.16001129150390625, -0.15341567993164062, -0.146820068359375, -0.14022445678710938, -0.13362884521484375, -0.12703323364257812, -0.1204376220703125, -0.11384201049804688, -0.10724639892578125, -0.10065078735351562, -0.09405517578125, -0.08745956420898438, -0.08086395263671875, -0.07426834106445312, -0.0676727294921875, -0.061077117919921875, -0.05448150634765625, -0.047885894775390625, -0.041290283203125, -0.034694671630859375, -0.02809906005859375, -0.021503448486328125, -0.0149078369140625, -0.008312225341796875, -0.00171661376953125, 0.004878997802734375, 0.011474609375, 0.018070220947265625, 0.02466583251953125, 0.031261444091796875, 0.0378570556640625, 0.044452667236328125, 0.05104827880859375, 0.057643890380859375, 0.064239501953125, 0.07083511352539062, 0.07743072509765625, 0.08402633666992188, 0.0906219482421875, 0.09721755981445312, 0.10381317138671875, 0.11040878295898438, 0.11700439453125, 0.12360000610351562, 0.13019561767578125, 0.13679122924804688, 0.1433868408203125, 0.14998245239257812, 0.15657806396484375, 0.16317367553710938, 0.169769287109375, 0.17636489868164062, 0.18296051025390625, 0.18955612182617188, 0.1961517333984375, 0.20274734497070312, 0.20934295654296875, 0.21593856811523438, 0.2225341796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 2.0, 6.0, 6.0, 9.0, 7.0, 16.0, 16.0, 16.0, 24.0, 19.0, 25.0, 24.0, 24.0, 34.0, 38.0, 29.0, 26.0, 34.0, 41.0, 46.0, 40.0, 31.0, 37.0, 38.0, 39.0, 38.0, 40.0, 41.0, 20.0, 23.0, 29.0, 20.0, 25.0, 18.0, 20.0, 9.0, 8.0, 13.0, 15.0, 12.0, 10.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.21240234375, -0.20580101013183594, -0.19919967651367188, -0.1925983428955078, -0.18599700927734375, -0.1793956756591797, -0.17279434204101562, -0.16619300842285156, -0.1595916748046875, -0.15299034118652344, -0.14638900756835938, -0.1397876739501953, -0.13318634033203125, -0.1265850067138672, -0.11998367309570312, -0.11338233947753906, -0.106781005859375, -0.10017967224121094, -0.09357833862304688, -0.08697700500488281, -0.08037567138671875, -0.07377433776855469, -0.06717300415039062, -0.06057167053222656, -0.0539703369140625, -0.04736900329589844, -0.040767669677734375, -0.03416633605957031, -0.02756500244140625, -0.020963668823242188, -0.014362335205078125, -0.0077610015869140625, -0.00115966796875, 0.0054416656494140625, 0.012042999267578125, 0.018644332885742188, 0.02524566650390625, 0.03184700012207031, 0.038448333740234375, 0.04504966735839844, 0.0516510009765625, 0.05825233459472656, 0.06485366821289062, 0.07145500183105469, 0.07805633544921875, 0.08465766906738281, 0.09125900268554688, 0.09786033630371094, 0.104461669921875, 0.11106300354003906, 0.11766433715820312, 0.12426567077636719, 0.13086700439453125, 0.1374683380126953, 0.14406967163085938, 0.15067100524902344, 0.1572723388671875, 0.16387367248535156, 0.17047500610351562, 0.1770763397216797, 0.18367767333984375, 0.1902790069580078, 0.19688034057617188, 0.20348167419433594, 0.2100830078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 10.0, 13.0, 10.0, 13.0, 32.0, 43.0, 52.0, 78.0, 99.0, 153.0, 241.0, 379.0, 629.0, 1003.0, 1647.0, 2832.0, 4971.0, 9120.0, 17262.0, 32962.0, 61620.0, 111686.0, 181553.0, 246692.0, 163073.0, 97808.0, 53100.0, 28125.0, 14563.0, 8031.0, 4397.0, 2473.0, 1490.0, 832.0, 543.0, 327.0, 214.0, 133.0, 87.0, 78.0, 54.0, 38.0, 33.0, 11.0, 16.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.260498046875, -0.2524528503417969, -0.24440765380859375, -0.23636245727539062, -0.2283172607421875, -0.22027206420898438, -0.21222686767578125, -0.20418167114257812, -0.196136474609375, -0.18809127807617188, -0.18004608154296875, -0.17200088500976562, -0.1639556884765625, -0.15591049194335938, -0.14786529541015625, -0.13982009887695312, -0.13177490234375, -0.12372970581054688, -0.11568450927734375, -0.10763931274414062, -0.0995941162109375, -0.09154891967773438, -0.08350372314453125, -0.07545852661132812, -0.067413330078125, -0.059368133544921875, -0.05132293701171875, -0.043277740478515625, -0.0352325439453125, -0.027187347412109375, -0.01914215087890625, -0.011096954345703125, -0.0030517578125, 0.004993438720703125, 0.01303863525390625, 0.021083831787109375, 0.0291290283203125, 0.037174224853515625, 0.04521942138671875, 0.053264617919921875, 0.061309814453125, 0.06935501098632812, 0.07740020751953125, 0.08544540405273438, 0.0934906005859375, 0.10153579711914062, 0.10958099365234375, 0.11762619018554688, 0.12567138671875, 0.13371658325195312, 0.14176177978515625, 0.14980697631835938, 0.1578521728515625, 0.16589736938476562, 0.17394256591796875, 0.18198776245117188, 0.190032958984375, 0.19807815551757812, 0.20612335205078125, 0.21416854858398438, 0.2222137451171875, 0.23025894165039062, 0.23830413818359375, 0.24634933471679688, 0.25439453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 9.0, 6.0, 12.0, 13.0, 25.0, 33.0, 21.0, 31.0, 38.0, 57.0, 37.0, 66.0, 51.0, 75.0, 68.0, 59.0, 52.0, 54.0, 54.0, 37.0, 28.0, 37.0, 25.0, 27.0, 18.0, 16.0, 14.0, 14.0, 7.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8251953125, -0.7985000610351562, -0.7718048095703125, -0.7451095581054688, -0.718414306640625, -0.6917190551757812, -0.6650238037109375, -0.6383285522460938, -0.61163330078125, -0.5849380493164062, -0.5582427978515625, -0.5315475463867188, -0.504852294921875, -0.47815704345703125, -0.4514617919921875, -0.42476654052734375, -0.3980712890625, -0.37137603759765625, -0.3446807861328125, -0.31798553466796875, -0.291290283203125, -0.26459503173828125, -0.2378997802734375, -0.21120452880859375, -0.18450927734375, -0.15781402587890625, -0.1311187744140625, -0.10442352294921875, -0.077728271484375, -0.05103302001953125, -0.0243377685546875, 0.00235748291015625, 0.029052734375, 0.05574798583984375, 0.0824432373046875, 0.10913848876953125, 0.135833740234375, 0.16252899169921875, 0.1892242431640625, 0.21591949462890625, 0.24261474609375, 0.26930999755859375, 0.2960052490234375, 0.32270050048828125, 0.349395751953125, 0.37609100341796875, 0.4027862548828125, 0.42948150634765625, 0.4561767578125, 0.48287200927734375, 0.5095672607421875, 0.5362625122070312, 0.562957763671875, 0.5896530151367188, 0.6163482666015625, 0.6430435180664062, 0.66973876953125, 0.6964340209960938, 0.7231292724609375, 0.7498245239257812, 0.776519775390625, 0.8032150268554688, 0.8299102783203125, 0.8566055297851562, 0.88330078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 14.0, 26.0, 27.0, 43.0, 48.0, 73.0, 101.0, 153.0, 228.0, 310.0, 463.0, 684.0, 1026.0, 1556.0, 2425.0, 4007.0, 6370.0, 10949.0, 18780.0, 31772.0, 54155.0, 88833.0, 137680.0, 208709.0, 174886.0, 119361.0, 74959.0, 44869.0, 26616.0, 15351.0, 9147.0, 5384.0, 3283.0, 2087.0, 1385.0, 891.0, 576.0, 364.0, 282.0, 204.0, 135.0, 87.0, 61.0, 49.0, 50.0, 22.0, 23.0, 16.0, 6.0, 8.0, 1.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.05047607421875, -0.04893827438354492, -0.047400474548339844, -0.045862674713134766, -0.04432487487792969, -0.04278707504272461, -0.04124927520751953, -0.03971147537231445, -0.038173675537109375, -0.0366358757019043, -0.03509807586669922, -0.03356027603149414, -0.03202247619628906, -0.030484676361083984, -0.028946876525878906, -0.027409076690673828, -0.02587127685546875, -0.024333477020263672, -0.022795677185058594, -0.021257877349853516, -0.019720077514648438, -0.01818227767944336, -0.01664447784423828, -0.015106678009033203, -0.013568878173828125, -0.012031078338623047, -0.010493278503417969, -0.00895547866821289, -0.0074176788330078125, -0.005879878997802734, -0.004342079162597656, -0.002804279327392578, -0.0012664794921875, 0.0002713203430175781, 0.0018091201782226562, 0.0033469200134277344, 0.0048847198486328125, 0.006422519683837891, 0.007960319519042969, 0.009498119354248047, 0.011035919189453125, 0.012573719024658203, 0.014111518859863281, 0.01564931869506836, 0.017187118530273438, 0.018724918365478516, 0.020262718200683594, 0.021800518035888672, 0.02333831787109375, 0.024876117706298828, 0.026413917541503906, 0.027951717376708984, 0.029489517211914062, 0.03102731704711914, 0.03256511688232422, 0.0341029167175293, 0.035640716552734375, 0.03717851638793945, 0.03871631622314453, 0.04025411605834961, 0.04179191589355469, 0.043329715728759766, 0.044867515563964844, 0.04640531539916992, 0.047943115234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 12.0, 7.0, 12.0, 14.0, 15.0, 11.0, 23.0, 29.0, 20.0, 24.0, 42.0, 40.0, 37.0, 47.0, 40.0, 46.0, 60.0, 65.0, 42.0, 41.0, 39.0, 36.0, 34.0, 31.0, 32.0, 17.0, 20.0, 24.0, 17.0, 16.0, 15.0, 9.0, 10.0, 9.0, 4.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.580881118774414e-05, -2.5054439902305603e-05, -2.4300068616867065e-05, -2.3545697331428528e-05, -2.279132604598999e-05, -2.2036954760551453e-05, -2.1282583475112915e-05, -2.0528212189674377e-05, -1.977384090423584e-05, -1.9019469618797302e-05, -1.8265098333358765e-05, -1.7510727047920227e-05, -1.675635576248169e-05, -1.6001984477043152e-05, -1.5247613191604614e-05, -1.4493241906166077e-05, -1.3738870620727539e-05, -1.2984499335289001e-05, -1.2230128049850464e-05, -1.1475756764411926e-05, -1.0721385478973389e-05, -9.967014193534851e-06, -9.212642908096313e-06, -8.458271622657776e-06, -7.703900337219238e-06, -6.949529051780701e-06, -6.195157766342163e-06, -5.4407864809036255e-06, -4.686415195465088e-06, -3.93204391002655e-06, -3.1776726245880127e-06, -2.423301339149475e-06, -1.6689300537109375e-06, -9.145587682723999e-07, -1.601874828338623e-07, 5.941838026046753e-07, 1.3485550880432129e-06, 2.1029263734817505e-06, 2.857297658920288e-06, 3.6116689443588257e-06, 4.366040229797363e-06, 5.120411515235901e-06, 5.8747828006744385e-06, 6.629154086112976e-06, 7.383525371551514e-06, 8.137896656990051e-06, 8.892267942428589e-06, 9.646639227867126e-06, 1.0401010513305664e-05, 1.1155381798744202e-05, 1.190975308418274e-05, 1.2664124369621277e-05, 1.3418495655059814e-05, 1.4172866940498352e-05, 1.492723822593689e-05, 1.5681609511375427e-05, 1.6435980796813965e-05, 1.7190352082252502e-05, 1.794472336769104e-05, 1.8699094653129578e-05, 1.9453465938568115e-05, 2.0207837224006653e-05, 2.096220850944519e-05, 2.1716579794883728e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 9.0, 5.0, 12.0, 10.0, 20.0, 26.0, 34.0, 68.0, 139.0, 188.0, 306.0, 530.0, 965.0, 1757.0, 3351.0, 6230.0, 12728.0, 25073.0, 51516.0, 101355.0, 183061.0, 274419.0, 183409.0, 101122.0, 50680.0, 25435.0, 12405.0, 6360.0, 3209.0, 1708.0, 1014.0, 590.0, 313.0, 174.0, 122.0, 71.0, 59.0, 25.0, 19.0, 17.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.07958984375, -0.07740926742553711, -0.07522869110107422, -0.07304811477661133, -0.07086753845214844, -0.06868696212768555, -0.06650638580322266, -0.06432580947875977, -0.062145233154296875, -0.059964656829833984, -0.057784080505371094, -0.0556035041809082, -0.05342292785644531, -0.05124235153198242, -0.04906177520751953, -0.04688119888305664, -0.04470062255859375, -0.04252004623413086, -0.04033946990966797, -0.03815889358520508, -0.03597831726074219, -0.0337977409362793, -0.031617164611816406, -0.029436588287353516, -0.027256011962890625, -0.025075435638427734, -0.022894859313964844, -0.020714282989501953, -0.018533706665039062, -0.016353130340576172, -0.014172554016113281, -0.01199197769165039, -0.0098114013671875, -0.007630825042724609, -0.005450248718261719, -0.003269672393798828, -0.0010890960693359375, 0.0010914802551269531, 0.0032720565795898438, 0.005452632904052734, 0.007633209228515625, 0.009813785552978516, 0.011994361877441406, 0.014174938201904297, 0.016355514526367188, 0.018536090850830078, 0.02071666717529297, 0.02289724349975586, 0.02507781982421875, 0.02725839614868164, 0.02943897247314453, 0.03161954879760742, 0.03380012512207031, 0.0359807014465332, 0.038161277770996094, 0.040341854095458984, 0.042522430419921875, 0.044703006744384766, 0.046883583068847656, 0.04906415939331055, 0.05124473571777344, 0.05342531204223633, 0.05560588836669922, 0.05778646469116211, 0.059967041015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 5.0, 11.0, 7.0, 9.0, 19.0, 22.0, 13.0, 23.0, 27.0, 36.0, 31.0, 49.0, 52.0, 59.0, 64.0, 64.0, 70.0, 70.0, 56.0, 42.0, 49.0, 43.0, 41.0, 31.0, 30.0, 13.0, 10.0, 12.0, 7.0, 4.0, 9.0, 7.0, 6.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10845947265625, -0.10482215881347656, -0.10118484497070312, -0.09754753112792969, -0.09391021728515625, -0.09027290344238281, -0.08663558959960938, -0.08299827575683594, -0.0793609619140625, -0.07572364807128906, -0.07208633422851562, -0.06844902038574219, -0.06481170654296875, -0.06117439270019531, -0.057537078857421875, -0.05389976501464844, -0.050262451171875, -0.04662513732910156, -0.042987823486328125, -0.03935050964355469, -0.03571319580078125, -0.03207588195800781, -0.028438568115234375, -0.024801254272460938, -0.0211639404296875, -0.017526626586914062, -0.013889312744140625, -0.010251998901367188, -0.00661468505859375, -0.0029773712158203125, 0.000659942626953125, 0.0042972564697265625, 0.0079345703125, 0.011571884155273438, 0.015209197998046875, 0.018846511840820312, 0.02248382568359375, 0.026121139526367188, 0.029758453369140625, 0.03339576721191406, 0.0370330810546875, 0.04067039489746094, 0.044307708740234375, 0.04794502258300781, 0.05158233642578125, 0.05521965026855469, 0.058856964111328125, 0.06249427795410156, 0.066131591796875, 0.06976890563964844, 0.07340621948242188, 0.07704353332519531, 0.08068084716796875, 0.08431816101074219, 0.08795547485351562, 0.09159278869628906, 0.0952301025390625, 0.09886741638183594, 0.10250473022460938, 0.10614204406738281, 0.10977935791015625, 0.11341667175292969, 0.11705398559570312, 0.12069129943847656, 0.12432861328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 18.0, 22.0, 43.0, 60.0, 96.0, 115.0, 117.0, 151.0, 117.0, 84.0, 59.0, 43.0, 19.0, 11.0, 9.0, 10.0, 5.0, 4.0, 4.0, 0.0, 2.0], "bins": [-4.130890369415283, -4.047792434692383, -3.9646944999694824, -3.881596565246582, -3.7984986305236816, -3.715400457382202, -3.6323025226593018, -3.5492045879364014, -3.466106653213501, -3.3830087184906006, -3.2999107837677, -3.2168128490448, -3.1337146759033203, -3.05061674118042, -2.9675188064575195, -2.884420871734619, -2.8013229370117188, -2.7182250022888184, -2.635127067565918, -2.5520291328430176, -2.468931198120117, -2.3858330249786377, -2.3027350902557373, -2.219637155532837, -2.1365392208099365, -2.053441286087036, -1.9703433513641357, -1.8872452974319458, -1.8041473627090454, -1.721049427986145, -1.637951374053955, -1.5548534393310547, -1.4717552661895752, -1.3886573314666748, -1.3055593967437744, -1.2224613428115845, -1.139363408088684, -1.0562654733657837, -0.9731674790382385, -0.8900694847106934, -0.806971549987793, -0.7238736152648926, -0.6407756209373474, -0.5576776266098022, -0.47457969188690186, -0.3914817273616791, -0.3083837628364563, -0.22528576850891113, -0.14218783378601074, -0.059089869260787964, 0.024008095264434814, 0.10710605978965759, 0.19020402431488037, 0.27330198884010315, 0.3563999533653259, 0.4394979476928711, 0.5225958824157715, 0.6056938171386719, 0.688791811466217, 0.7718898057937622, 0.8549877405166626, 0.938085675239563, 1.021183729171753, 1.1042816638946533, 1.1873795986175537]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 4.0, 8.0, 10.0, 8.0, 4.0, 13.0, 14.0, 11.0, 17.0, 18.0, 25.0, 26.0, 24.0, 32.0, 39.0, 40.0, 40.0, 29.0, 41.0, 38.0, 32.0, 49.0, 50.0, 49.0, 48.0, 26.0, 25.0, 35.0, 27.0, 24.0, 29.0, 24.0, 23.0, 22.0, 17.0, 13.0, 8.0, 12.0, 8.0, 8.0, 8.0, 6.0, 6.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6128857135772705, -1.564487338066101, -1.516088843345642, -1.4676904678344727, -1.4192919731140137, -1.3708935976028442, -1.3224952220916748, -1.2740967273712158, -1.2256983518600464, -1.177299976348877, -1.128901481628418, -1.0805031061172485, -1.032104730606079, -0.9837062358856201, -0.9353078603744507, -0.8869094252586365, -0.8385109901428223, -0.7901125550270081, -0.7417141199111938, -0.6933157444000244, -0.6449173092842102, -0.596518874168396, -0.5481204986572266, -0.49972206354141235, -0.45132362842559814, -0.40292519330978394, -0.3545267879962921, -0.3061283826828003, -0.2577299475669861, -0.20933152735233307, -0.16093310713768005, -0.11253470182418823, -0.06413626670837402, -0.01573784649372101, 0.03266057372093201, 0.08105899393558502, 0.12945741415023804, 0.17785583436489105, 0.22625425457954407, 0.2746526598930359, 0.3230510950088501, 0.3714495301246643, 0.41984793543815613, 0.46824634075164795, 0.5166447758674622, 0.5650432109832764, 0.6134415864944458, 0.66184002161026, 0.7102384567260742, 0.7586368918418884, 0.8070353269577026, 0.8554337024688721, 0.9038321375846863, 0.9522305727005005, 1.00062894821167, 1.049027442932129, 1.0974258184432983, 1.1458241939544678, 1.1942226886749268, 1.2426210641860962, 1.2910194396972656, 1.3394179344177246, 1.387816309928894, 1.4362146854400635, 1.4846131801605225]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 11.0, 12.0, 11.0, 26.0, 37.0, 58.0, 77.0, 119.0, 212.0, 376.0, 722.0, 1543.0, 3463.0, 8239.0, 21265.0, 63758.0, 237497.0, 760903.0, 1392295.0, 1112261.0, 422194.0, 112685.0, 34297.0, 12438.0, 5148.0, 2295.0, 1071.0, 538.0, 301.0, 166.0, 84.0, 65.0, 36.0, 29.0, 19.0, 10.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2169189453125, -0.2077770233154297, -0.19863510131835938, -0.18949317932128906, -0.18035125732421875, -0.17120933532714844, -0.16206741333007812, -0.1529254913330078, -0.1437835693359375, -0.1346416473388672, -0.12549972534179688, -0.11635780334472656, -0.10721588134765625, -0.09807395935058594, -0.08893203735351562, -0.07979011535644531, -0.070648193359375, -0.06150627136230469, -0.052364349365234375, -0.04322242736816406, -0.03408050537109375, -0.024938583374023438, -0.015796661376953125, -0.0066547393798828125, 0.0024871826171875, 0.011629104614257812, 0.020771026611328125, 0.029912948608398438, 0.03905487060546875, 0.04819679260253906, 0.057338714599609375, 0.06648063659667969, 0.07562255859375, 0.08476448059082031, 0.09390640258789062, 0.10304832458496094, 0.11219024658203125, 0.12133216857910156, 0.13047409057617188, 0.1396160125732422, 0.1487579345703125, 0.1578998565673828, 0.16704177856445312, 0.17618370056152344, 0.18532562255859375, 0.19446754455566406, 0.20360946655273438, 0.2127513885498047, 0.221893310546875, 0.2310352325439453, 0.24017715454101562, 0.24931907653808594, 0.25846099853515625, 0.26760292053222656, 0.2767448425292969, 0.2858867645263672, 0.2950286865234375, 0.3041706085205078, 0.3133125305175781, 0.32245445251464844, 0.33159637451171875, 0.34073829650878906, 0.3498802185058594, 0.3590221405029297, 0.3681640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 5.0, 6.0, 9.0, 4.0, 14.0, 13.0, 14.0, 18.0, 22.0, 26.0, 18.0, 28.0, 28.0, 38.0, 31.0, 38.0, 40.0, 35.0, 29.0, 40.0, 49.0, 40.0, 35.0, 38.0, 35.0, 41.0, 37.0, 35.0, 24.0, 23.0, 26.0, 23.0, 23.0, 23.0, 14.0, 11.0, 12.0, 12.0, 10.0, 10.0, 5.0, 7.0, 6.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.19677734375, -0.1908130645751953, -0.18484878540039062, -0.17888450622558594, -0.17292022705078125, -0.16695594787597656, -0.16099166870117188, -0.1550273895263672, -0.1490631103515625, -0.1430988311767578, -0.13713455200195312, -0.13117027282714844, -0.12520599365234375, -0.11924171447753906, -0.11327743530273438, -0.10731315612792969, -0.101348876953125, -0.09538459777832031, -0.08942031860351562, -0.08345603942871094, -0.07749176025390625, -0.07152748107910156, -0.06556320190429688, -0.05959892272949219, -0.0536346435546875, -0.04767036437988281, -0.041706085205078125, -0.03574180603027344, -0.02977752685546875, -0.023813247680664062, -0.017848968505859375, -0.011884689331054688, -0.00592041015625, 4.38690185546875e-05, 0.006008148193359375, 0.011972427368164062, 0.01793670654296875, 0.023900985717773438, 0.029865264892578125, 0.03582954406738281, 0.0417938232421875, 0.04775810241699219, 0.053722381591796875, 0.05968666076660156, 0.06565093994140625, 0.07161521911621094, 0.07757949829101562, 0.08354377746582031, 0.089508056640625, 0.09547233581542969, 0.10143661499023438, 0.10740089416503906, 0.11336517333984375, 0.11932945251464844, 0.12529373168945312, 0.1312580108642578, 0.1372222900390625, 0.1431865692138672, 0.14915084838867188, 0.15511512756347656, 0.16107940673828125, 0.16704368591308594, 0.17300796508789062, 0.1789722442626953, 0.1849365234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 10.0, 4.0, 11.0, 12.0, 14.0, 27.0, 37.0, 45.0, 78.0, 109.0, 147.0, 283.0, 476.0, 830.0, 1854.0, 4171.0, 12384.0, 50770.0, 346683.0, 2881796.0, 775854.0, 89562.0, 18721.0, 5716.0, 2191.0, 1063.0, 553.0, 315.0, 176.0, 121.0, 79.0, 47.0, 47.0, 29.0, 27.0, 19.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.6123046875, -0.5956039428710938, -0.5789031982421875, -0.5622024536132812, -0.545501708984375, -0.5288009643554688, -0.5121002197265625, -0.49539947509765625, -0.47869873046875, -0.46199798583984375, -0.4452972412109375, -0.42859649658203125, -0.411895751953125, -0.39519500732421875, -0.3784942626953125, -0.36179351806640625, -0.3450927734375, -0.32839202880859375, -0.3116912841796875, -0.29499053955078125, -0.278289794921875, -0.26158905029296875, -0.2448883056640625, -0.22818756103515625, -0.21148681640625, -0.19478607177734375, -0.1780853271484375, -0.16138458251953125, -0.144683837890625, -0.12798309326171875, -0.1112823486328125, -0.09458160400390625, -0.077880859375, -0.06118011474609375, -0.0444793701171875, -0.02777862548828125, -0.011077880859375, 0.00562286376953125, 0.0223236083984375, 0.03902435302734375, 0.05572509765625, 0.07242584228515625, 0.0891265869140625, 0.10582733154296875, 0.122528076171875, 0.13922882080078125, 0.1559295654296875, 0.17263031005859375, 0.1893310546875, 0.20603179931640625, 0.2227325439453125, 0.23943328857421875, 0.256134033203125, 0.27283477783203125, 0.2895355224609375, 0.30623626708984375, 0.32293701171875, 0.33963775634765625, 0.3563385009765625, 0.37303924560546875, 0.389739990234375, 0.40644073486328125, 0.4231414794921875, 0.43984222412109375, 0.45654296875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 15.0, 17.0, 20.0, 24.0, 32.0, 63.0, 73.0, 94.0, 133.0, 185.0, 245.0, 321.0, 409.0, 434.0, 429.0, 371.0, 331.0, 234.0, 164.0, 121.0, 107.0, 59.0, 44.0, 26.0, 28.0, 19.0, 17.0, 9.0, 6.0, 2.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414794921875, -0.3998985290527344, -0.38500213623046875, -0.3701057434082031, -0.3552093505859375, -0.3403129577636719, -0.32541656494140625, -0.3105201721191406, -0.295623779296875, -0.2807273864746094, -0.26583099365234375, -0.2509346008300781, -0.2360382080078125, -0.22114181518554688, -0.20624542236328125, -0.19134902954101562, -0.17645263671875, -0.16155624389648438, -0.14665985107421875, -0.13176345825195312, -0.1168670654296875, -0.10197067260742188, -0.08707427978515625, -0.07217788696289062, -0.057281494140625, -0.042385101318359375, -0.02748870849609375, -0.012592315673828125, 0.0023040771484375, 0.017200469970703125, 0.03209686279296875, 0.046993255615234375, 0.0618896484375, 0.07678604125976562, 0.09168243408203125, 0.10657882690429688, 0.1214752197265625, 0.13637161254882812, 0.15126800537109375, 0.16616439819335938, 0.181060791015625, 0.19595718383789062, 0.21085357666015625, 0.22574996948242188, 0.2406463623046875, 0.2555427551269531, 0.27043914794921875, 0.2853355407714844, 0.30023193359375, 0.3151283264160156, 0.33002471923828125, 0.3449211120605469, 0.3598175048828125, 0.3747138977050781, 0.38961029052734375, 0.4045066833496094, 0.419403076171875, 0.4342994689941406, 0.44919586181640625, 0.4640922546386719, 0.4789886474609375, 0.4938850402832031, 0.5087814331054688, 0.5236778259277344, 0.53857421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 6.0, 18.0, 14.0, 27.0, 40.0, 56.0, 70.0, 91.0, 101.0, 121.0, 118.0, 104.0, 62.0, 49.0, 41.0, 22.0, 16.0, 7.0, 3.0, 5.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986452102661133, -2.839566469192505, -2.692681074142456, -2.545795440673828, -2.3989100456237793, -2.2520244121551514, -2.1051387786865234, -1.958253264427185, -1.8113677501678467, -1.6644822359085083, -1.51759672164917, -1.370711088180542, -1.2238255739212036, -1.0769400596618652, -0.9300544857978821, -0.7831689119338989, -0.6362833976745605, -0.4893978536128998, -0.342512309551239, -0.19562676548957825, -0.04874122142791748, 0.0981442928314209, 0.24502986669540405, 0.3919154405593872, 0.5388009548187256, 0.685686469078064, 0.8325720429420471, 0.9794576168060303, 1.1263431310653687, 1.273228645324707, 1.420114278793335, 1.5669997930526733, 1.7138848304748535, 1.860770344734192, 2.0076558589935303, 2.154541492462158, 2.301426887512207, 2.448312520980835, 2.595198154449463, 2.7420835494995117, 2.8889691829681396, 3.0358548164367676, 3.1827402114868164, 3.3296258449554443, 3.4765114784240723, 3.623396873474121, 3.770282506942749, 3.917168140411377, 4.064053535461426, 4.210938930511475, 4.357824802398682, 4.5047101974487305, 4.651595592498779, 4.798480987548828, 4.945366859436035, 5.092252254486084, 5.239137649536133, 5.386023044586182, 5.532908916473389, 5.6797943115234375, 5.826679706573486, 5.973565101623535, 6.120450973510742, 6.267336368560791, 6.414222240447998]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 11.0, 7.0, 12.0, 21.0, 18.0, 15.0, 25.0, 30.0, 35.0, 39.0, 45.0, 44.0, 56.0, 54.0, 46.0, 60.0, 51.0, 46.0, 55.0, 49.0, 30.0, 52.0, 33.0, 34.0, 30.0, 19.0, 17.0, 14.0, 7.0, 13.0, 7.0, 2.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.424018621444702, -2.350886583328247, -2.277754545211792, -2.204622507095337, -2.131490707397461, -2.058358669281006, -1.9852266311645508, -1.9120945930480957, -1.8389625549316406, -1.7658305168151855, -1.6926984786987305, -1.619566559791565, -1.5464345216751099, -1.4733024835586548, -1.4001705646514893, -1.3270385265350342, -1.253906488418579, -1.180774450302124, -1.107642412185669, -1.0345104932785034, -0.9613784551620483, -0.8882464170455933, -0.815114438533783, -0.7419824600219727, -0.6688504219055176, -0.5957183837890625, -0.5225864052772522, -0.4494543969631195, -0.3763223886489868, -0.3031903803348541, -0.23005837202072144, -0.15692639350891113, -0.08379459381103516, -0.010662585496902466, 0.062469422817230225, 0.13560143113136292, 0.2087334394454956, 0.2818654477596283, 0.354997456073761, 0.4281294345855713, 0.5012614727020264, 0.5743935108184814, 0.6475254893302917, 0.720657467842102, 0.7937895059585571, 0.8669215440750122, 0.9400535225868225, 1.0131855010986328, 1.086317539215088, 1.159449577331543, 1.232581615447998, 1.3057135343551636, 1.3788455724716187, 1.4519776105880737, 1.5251095294952393, 1.5982415676116943, 1.6713736057281494, 1.7445056438446045, 1.8176376819610596, 1.890769600868225, 1.9639016389846802, 2.0370335578918457, 2.110165596008301, 2.183297634124756, 2.256429672241211]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 11.0, 8.0, 20.0, 26.0, 29.0, 53.0, 75.0, 116.0, 174.0, 266.0, 464.0, 712.0, 1261.0, 2223.0, 4181.0, 8475.0, 17478.0, 40869.0, 96047.0, 212725.0, 301375.0, 201031.0, 89548.0, 37684.0, 16849.0, 7787.0, 3874.0, 2088.0, 1232.0, 668.0, 416.0, 288.0, 151.0, 106.0, 75.0, 61.0, 31.0, 22.0, 19.0, 15.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.21106910705566406, -0.20277786254882812, -0.1944866180419922, -0.18619537353515625, -0.1779041290283203, -0.16961288452148438, -0.16132164001464844, -0.1530303955078125, -0.14473915100097656, -0.13644790649414062, -0.1281566619873047, -0.11986541748046875, -0.11157417297363281, -0.10328292846679688, -0.09499168395996094, -0.086700439453125, -0.07840919494628906, -0.07011795043945312, -0.06182670593261719, -0.05353546142578125, -0.04524421691894531, -0.036952972412109375, -0.028661727905273438, -0.0203704833984375, -0.012079238891601562, -0.003787994384765625, 0.0045032501220703125, 0.01279449462890625, 0.021085739135742188, 0.029376983642578125, 0.03766822814941406, 0.04595947265625, 0.05425071716308594, 0.06254196166992188, 0.07083320617675781, 0.07912445068359375, 0.08741569519042969, 0.09570693969726562, 0.10399818420410156, 0.1122894287109375, 0.12058067321777344, 0.12887191772460938, 0.1371631622314453, 0.14545440673828125, 0.1537456512451172, 0.16203689575195312, 0.17032814025878906, 0.178619384765625, 0.18691062927246094, 0.19520187377929688, 0.2034931182861328, 0.21178436279296875, 0.2200756072998047, 0.22836685180664062, 0.23665809631347656, 0.2449493408203125, 0.25324058532714844, 0.2615318298339844, 0.2698230743408203, 0.27811431884765625, 0.2864055633544922, 0.2946968078613281, 0.30298805236816406, 0.311279296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 11.0, 10.0, 12.0, 12.0, 15.0, 19.0, 37.0, 32.0, 33.0, 28.0, 52.0, 37.0, 49.0, 43.0, 47.0, 54.0, 60.0, 48.0, 33.0, 46.0, 41.0, 34.0, 38.0, 34.0, 31.0, 23.0, 29.0, 29.0, 16.0, 14.0, 8.0, 8.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.2524833679199219, -0.24349212646484375, -0.23450088500976562, -0.2255096435546875, -0.21651840209960938, -0.20752716064453125, -0.19853591918945312, -0.189544677734375, -0.18055343627929688, -0.17156219482421875, -0.16257095336914062, -0.1535797119140625, -0.14458847045898438, -0.13559722900390625, -0.12660598754882812, -0.11761474609375, -0.10862350463867188, -0.09963226318359375, -0.09064102172851562, -0.0816497802734375, -0.07265853881835938, -0.06366729736328125, -0.054676055908203125, -0.045684814453125, -0.036693572998046875, -0.02770233154296875, -0.018711090087890625, -0.0097198486328125, -0.000728607177734375, 0.00826263427734375, 0.017253875732421875, 0.0262451171875, 0.035236358642578125, 0.04422760009765625, 0.053218841552734375, 0.0622100830078125, 0.07120132446289062, 0.08019256591796875, 0.08918380737304688, 0.098175048828125, 0.10716629028320312, 0.11615753173828125, 0.12514877319335938, 0.1341400146484375, 0.14313125610351562, 0.15212249755859375, 0.16111373901367188, 0.17010498046875, 0.17909622192382812, 0.18808746337890625, 0.19707870483398438, 0.2060699462890625, 0.21506118774414062, 0.22405242919921875, 0.23304367065429688, 0.242034912109375, 0.2510261535644531, 0.26001739501953125, 0.2690086364746094, 0.2779998779296875, 0.2869911193847656, 0.29598236083984375, 0.3049736022949219, 0.31396484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 0.0, 7.0, 7.0, 10.0, 13.0, 14.0, 21.0, 27.0, 50.0, 60.0, 77.0, 136.0, 272.0, 561.0, 1287.0, 3541.0, 13048.0, 77235.0, 675398.0, 237287.0, 29301.0, 6357.0, 2065.0, 823.0, 374.0, 223.0, 129.0, 74.0, 55.0, 31.0, 12.0, 14.0, 11.0, 7.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.51708984375, -0.5013008117675781, -0.48551177978515625, -0.4697227478027344, -0.4539337158203125, -0.4381446838378906, -0.42235565185546875, -0.4065666198730469, -0.390777587890625, -0.3749885559082031, -0.35919952392578125, -0.3434104919433594, -0.3276214599609375, -0.3118324279785156, -0.29604339599609375, -0.2802543640136719, -0.26446533203125, -0.24867630004882812, -0.23288726806640625, -0.21709823608398438, -0.2013092041015625, -0.18552017211914062, -0.16973114013671875, -0.15394210815429688, -0.138153076171875, -0.12236404418945312, -0.10657501220703125, -0.09078598022460938, -0.0749969482421875, -0.059207916259765625, -0.04341888427734375, -0.027629852294921875, -0.0118408203125, 0.003948211669921875, 0.01973724365234375, 0.035526275634765625, 0.0513153076171875, 0.06710433959960938, 0.08289337158203125, 0.09868240356445312, 0.114471435546875, 0.13026046752929688, 0.14604949951171875, 0.16183853149414062, 0.1776275634765625, 0.19341659545898438, 0.20920562744140625, 0.22499465942382812, 0.24078369140625, 0.2565727233886719, 0.27236175537109375, 0.2881507873535156, 0.3039398193359375, 0.3197288513183594, 0.33551788330078125, 0.3513069152832031, 0.367095947265625, 0.3828849792480469, 0.39867401123046875, 0.4144630432128906, 0.4302520751953125, 0.4460411071777344, 0.46183013916015625, 0.4776191711425781, 0.493408203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 7.0, 13.0, 14.0, 19.0, 22.0, 18.0, 24.0, 38.0, 53.0, 39.0, 45.0, 38.0, 43.0, 56.0, 44.0, 60.0, 40.0, 66.0, 39.0, 41.0, 50.0, 40.0, 27.0, 34.0, 24.0, 9.0, 25.0, 10.0, 14.0, 11.0, 8.0, 1.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.69580078125, -0.6740951538085938, -0.6523895263671875, -0.6306838989257812, -0.608978271484375, -0.5872726440429688, -0.5655670166015625, -0.5438613891601562, -0.52215576171875, -0.5004501342773438, -0.4787445068359375, -0.45703887939453125, -0.435333251953125, -0.41362762451171875, -0.3919219970703125, -0.37021636962890625, -0.3485107421875, -0.32680511474609375, -0.3050994873046875, -0.28339385986328125, -0.261688232421875, -0.23998260498046875, -0.2182769775390625, -0.19657135009765625, -0.17486572265625, -0.15316009521484375, -0.1314544677734375, -0.10974884033203125, -0.088043212890625, -0.06633758544921875, -0.0446319580078125, -0.02292633056640625, -0.001220703125, 0.02048492431640625, 0.0421905517578125, 0.06389617919921875, 0.085601806640625, 0.10730743408203125, 0.1290130615234375, 0.15071868896484375, 0.17242431640625, 0.19412994384765625, 0.2158355712890625, 0.23754119873046875, 0.259246826171875, 0.28095245361328125, 0.3026580810546875, 0.32436370849609375, 0.3460693359375, 0.36777496337890625, 0.3894805908203125, 0.41118621826171875, 0.432891845703125, 0.45459747314453125, 0.4763031005859375, 0.49800872802734375, 0.51971435546875, 0.5414199829101562, 0.5631256103515625, 0.5848312377929688, 0.606536865234375, 0.6282424926757812, 0.6499481201171875, 0.6716537475585938, 0.693359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 9.0, 6.0, 16.0, 15.0, 44.0, 65.0, 99.0, 162.0, 335.0, 1063.0, 7554.0, 710396.0, 321567.0, 5695.0, 884.0, 260.0, 132.0, 89.0, 64.0, 35.0, 18.0, 11.0, 4.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.4278221130371094, -0.41399383544921875, -0.4001655578613281, -0.3863372802734375, -0.3725090026855469, -0.35868072509765625, -0.3448524475097656, -0.331024169921875, -0.3171958923339844, -0.30336761474609375, -0.2895393371582031, -0.2757110595703125, -0.2618827819824219, -0.24805450439453125, -0.23422622680664062, -0.22039794921875, -0.20656967163085938, -0.19274139404296875, -0.17891311645507812, -0.1650848388671875, -0.15125656127929688, -0.13742828369140625, -0.12360000610351562, -0.109771728515625, -0.09594345092773438, -0.08211517333984375, -0.06828689575195312, -0.0544586181640625, -0.040630340576171875, -0.02680206298828125, -0.012973785400390625, 0.0008544921875, 0.014682769775390625, 0.02851104736328125, 0.042339324951171875, 0.0561676025390625, 0.06999588012695312, 0.08382415771484375, 0.09765243530273438, 0.111480712890625, 0.12530899047851562, 0.13913726806640625, 0.15296554565429688, 0.1667938232421875, 0.18062210083007812, 0.19445037841796875, 0.20827865600585938, 0.22210693359375, 0.23593521118164062, 0.24976348876953125, 0.2635917663574219, 0.2774200439453125, 0.2912483215332031, 0.30507659912109375, 0.3189048767089844, 0.332733154296875, 0.3465614318847656, 0.36038970947265625, 0.3742179870605469, 0.3880462646484375, 0.4018745422363281, 0.41570281982421875, 0.4295310974121094, 0.443359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 9.0, 14.0, 17.0, 26.0, 40.0, 42.0, 74.0, 88.0, 104.0, 116.0, 108.0, 83.0, 65.0, 60.0, 44.0, 36.0, 21.0, 14.0, 7.0, 2.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.5462359189987183e-05, -2.4281442165374756e-05, -2.310052514076233e-05, -2.1919608116149902e-05, -2.0738691091537476e-05, -1.955777406692505e-05, -1.8376857042312622e-05, -1.7195940017700195e-05, -1.601502299308777e-05, -1.4834105968475342e-05, -1.3653188943862915e-05, -1.2472271919250488e-05, -1.1291354894638062e-05, -1.0110437870025635e-05, -8.929520845413208e-06, -7.748603820800781e-06, -6.5676867961883545e-06, -5.386769771575928e-06, -4.205852746963501e-06, -3.0249357223510742e-06, -1.8440186977386475e-06, -6.631016731262207e-07, 5.178153514862061e-07, 1.6987323760986328e-06, 2.8796494007110596e-06, 4.060566425323486e-06, 5.241483449935913e-06, 6.42240047454834e-06, 7.603317499160767e-06, 8.784234523773193e-06, 9.96515154838562e-06, 1.1146068572998047e-05, 1.2326985597610474e-05, 1.35079026222229e-05, 1.4688819646835327e-05, 1.5869736671447754e-05, 1.705065369606018e-05, 1.8231570720672607e-05, 1.9412487745285034e-05, 2.059340476989746e-05, 2.1774321794509888e-05, 2.2955238819122314e-05, 2.413615584373474e-05, 2.5317072868347168e-05, 2.6497989892959595e-05, 2.767890691757202e-05, 2.8859823942184448e-05, 3.0040740966796875e-05, 3.12216579914093e-05, 3.240257501602173e-05, 3.3583492040634155e-05, 3.476440906524658e-05, 3.594532608985901e-05, 3.7126243114471436e-05, 3.830716013908386e-05, 3.948807716369629e-05, 4.0668994188308716e-05, 4.184991121292114e-05, 4.303082823753357e-05, 4.4211745262145996e-05, 4.539266228675842e-05, 4.657357931137085e-05, 4.7754496335983276e-05, 4.89354133605957e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 12.0, 27.0, 55.0, 95.0, 244.0, 705.0, 3029.0, 44103.0, 959052.0, 37312.0, 2718.0, 687.0, 240.0, 115.0, 78.0, 36.0, 19.0, 17.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.437744140625, -0.4242668151855469, -0.41078948974609375, -0.3973121643066406, -0.3838348388671875, -0.3703575134277344, -0.35688018798828125, -0.3434028625488281, -0.329925537109375, -0.3164482116699219, -0.30297088623046875, -0.2894935607910156, -0.2760162353515625, -0.2625389099121094, -0.24906158447265625, -0.23558425903320312, -0.22210693359375, -0.20862960815429688, -0.19515228271484375, -0.18167495727539062, -0.1681976318359375, -0.15472030639648438, -0.14124298095703125, -0.12776565551757812, -0.114288330078125, -0.10081100463867188, -0.08733367919921875, -0.07385635375976562, -0.0603790283203125, -0.046901702880859375, -0.03342437744140625, -0.019947052001953125, -0.0064697265625, 0.007007598876953125, 0.02048492431640625, 0.033962249755859375, 0.0474395751953125, 0.060916900634765625, 0.07439422607421875, 0.08787155151367188, 0.101348876953125, 0.11482620239257812, 0.12830352783203125, 0.14178085327148438, 0.1552581787109375, 0.16873550415039062, 0.18221282958984375, 0.19569015502929688, 0.20916748046875, 0.22264480590820312, 0.23612213134765625, 0.24959945678710938, 0.2630767822265625, 0.2765541076660156, 0.29003143310546875, 0.3035087585449219, 0.316986083984375, 0.3304634094238281, 0.34394073486328125, 0.3574180603027344, 0.3708953857421875, 0.3843727111816406, 0.39785003662109375, 0.4113273620605469, 0.4248046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 15.0, 26.0, 45.0, 81.0, 156.0, 230.0, 217.0, 94.0, 56.0, 31.0, 12.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4721260070800781, -0.45719146728515625, -0.4422569274902344, -0.4273223876953125, -0.4123878479003906, -0.39745330810546875, -0.3825187683105469, -0.367584228515625, -0.3526496887207031, -0.33771514892578125, -0.3227806091308594, -0.3078460693359375, -0.2929115295410156, -0.27797698974609375, -0.2630424499511719, -0.24810791015625, -0.23317337036132812, -0.21823883056640625, -0.20330429077148438, -0.1883697509765625, -0.17343521118164062, -0.15850067138671875, -0.14356613159179688, -0.128631591796875, -0.11369705200195312, -0.09876251220703125, -0.08382797241210938, -0.0688934326171875, -0.053958892822265625, -0.03902435302734375, -0.024089813232421875, -0.0091552734375, 0.005779266357421875, 0.02071380615234375, 0.035648345947265625, 0.0505828857421875, 0.06551742553710938, 0.08045196533203125, 0.09538650512695312, 0.110321044921875, 0.12525558471679688, 0.14019012451171875, 0.15512466430664062, 0.1700592041015625, 0.18499374389648438, 0.19992828369140625, 0.21486282348632812, 0.22979736328125, 0.24473190307617188, 0.25966644287109375, 0.2746009826660156, 0.2895355224609375, 0.3044700622558594, 0.31940460205078125, 0.3343391418457031, 0.349273681640625, 0.3642082214355469, 0.37914276123046875, 0.3940773010253906, 0.4090118408203125, 0.4239463806152344, 0.43888092041015625, 0.4538154602050781, 0.46875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 16.0, 21.0, 24.0, 41.0, 72.0, 77.0, 134.0, 148.0, 128.0, 95.0, 79.0, 49.0, 39.0, 21.0, 14.0, 12.0, 7.0, 4.0, 5.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.244434356689453, -2.130798578262329, -2.017162799835205, -1.903527021408081, -1.7898913621902466, -1.6762555837631226, -1.5626198053359985, -1.448984146118164, -1.33534836769104, -1.221712589263916, -1.108076810836792, -0.9944410920143127, -0.8808053731918335, -0.7671695947647095, -0.6535338163375854, -0.5398980975151062, -0.4262622594833374, -0.31262651085853577, -0.19899074733257294, -0.08535498380661011, 0.02828076481819153, 0.14191651344299316, 0.2555522918701172, 0.36918801069259644, 0.48282378911972046, 0.5964595675468445, 0.7100952863693237, 0.8237310647964478, 0.9373668432235718, 1.0510025024414062, 1.1646382808685303, 1.2782740592956543, 1.3919098377227783, 1.5055456161499023, 1.6191813945770264, 1.7328171730041504, 1.8464528322219849, 1.9600886106491089, 2.0737242698669434, 2.1873600482940674, 2.3009958267211914, 2.4146316051483154, 2.5282673835754395, 2.6419031620025635, 2.7555389404296875, 2.8691744804382324, 2.9828104972839355, 3.0964460372924805, 3.2100820541381836, 3.3237178325653076, 3.4373536109924316, 3.5509893894195557, 3.6646251678466797, 3.7782607078552246, 3.8918967247009277, 4.005532264709473, 4.119167804718018, 4.2328033447265625, 4.346439361572266, 4.4600749015808105, 4.573710918426514, 4.687346458435059, 4.800982475280762, 4.914618015289307, 5.02825403213501]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 10.0, 19.0, 14.0, 16.0, 19.0, 19.0, 42.0, 47.0, 48.0, 74.0, 70.0, 68.0, 75.0, 69.0, 64.0, 66.0, 40.0, 50.0, 33.0, 30.0, 36.0, 24.0, 14.0, 11.0, 6.0, 8.0, 7.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9931352138519287, -2.894886016845703, -2.7966365814208984, -2.6983871459960938, -2.600137948989868, -2.5018887519836426, -2.403639316558838, -2.305389881134033, -2.2071406841278076, -2.108891487121582, -2.0106420516967773, -1.9123927354812622, -1.814143419265747, -1.715894103050232, -1.6176447868347168, -1.5193954706192017, -1.4211461544036865, -1.3228968381881714, -1.2246475219726562, -1.1263982057571411, -1.028148889541626, -0.9298995733261108, -0.8316502571105957, -0.7334009408950806, -0.6351516246795654, -0.5369023084640503, -0.43865299224853516, -0.34040367603302, -0.24215435981750488, -0.14390504360198975, -0.04565572738647461, 0.05259358882904053, 0.15084266662597656, 0.2490919828414917, 0.34734129905700684, 0.445590615272522, 0.5438399314880371, 0.6420892477035522, 0.7403385639190674, 0.8385878801345825, 0.9368371963500977, 1.0350865125656128, 1.133335828781128, 1.231585144996643, 1.3298344612121582, 1.4280837774276733, 1.5263330936431885, 1.6245824098587036, 1.7228317260742188, 1.8210810422897339, 1.919330358505249, 2.0175795555114746, 2.1158289909362793, 2.214078426361084, 2.3123276233673096, 2.410576820373535, 2.50882625579834, 2.6070756912231445, 2.70532488822937, 2.8035740852355957, 2.9018235206604004, 3.000072956085205, 3.0983221530914307, 3.1965713500976562, 3.294820785522461]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 14.0, 9.0, 6.0, 9.0, 14.0, 14.0, 26.0, 28.0, 31.0, 42.0, 52.0, 71.0, 148.0, 227.0, 80.0, 55.0, 32.0, 31.0, 28.0, 19.0, 8.0, 10.0, 8.0, 6.0, 10.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.381103515625, -0.3696098327636719, -0.35811614990234375, -0.3466224670410156, -0.3351287841796875, -0.3236351013183594, -0.31214141845703125, -0.3006477355957031, -0.289154052734375, -0.2776603698730469, -0.26616668701171875, -0.2546730041503906, -0.2431793212890625, -0.23168563842773438, -0.22019195556640625, -0.20869827270507812, -0.19720458984375, -0.18571090698242188, -0.17421722412109375, -0.16272354125976562, -0.1512298583984375, -0.13973617553710938, -0.12824249267578125, -0.11674880981445312, -0.105255126953125, -0.09376144409179688, -0.08226776123046875, -0.07077407836914062, -0.0592803955078125, -0.047786712646484375, -0.03629302978515625, -0.024799346923828125, -0.0133056640625, -0.001811981201171875, 0.00968170166015625, 0.021175384521484375, 0.0326690673828125, 0.044162750244140625, 0.05565643310546875, 0.06715011596679688, 0.078643798828125, 0.09013748168945312, 0.10163116455078125, 0.11312484741210938, 0.1246185302734375, 0.13611221313476562, 0.14760589599609375, 0.15909957885742188, 0.17059326171875, 0.18208694458007812, 0.19358062744140625, 0.20507431030273438, 0.2165679931640625, 0.22806167602539062, 0.23955535888671875, 0.2510490417480469, 0.262542724609375, 0.2740364074707031, 0.28553009033203125, 0.2970237731933594, 0.3085174560546875, 0.3200111389160156, 0.33150482177734375, 0.3429985046386719, 0.3544921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 8.0, 21.0, 22.0, 42.0, 65.0, 133.0, 228.0, 565.0, 1584.0, 6420.0, 74690.0, 8283641.0, 16336.0, 3053.0, 920.0, 371.0, 204.0, 114.0, 51.0, 38.0, 19.0, 14.0, 17.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9379535913467407, -1.8796736001968384, -1.8213937282562256, -1.7631137371063232, -1.7048338651657104, -1.646553874015808, -1.5882740020751953, -1.529994010925293, -1.4717140197753906, -1.4134340286254883, -1.3551541566848755, -1.2968741655349731, -1.2385942935943604, -1.180314302444458, -1.1220343112945557, -1.0637544393539429, -1.00547456741333, -0.9471946358680725, -0.8889147043228149, -0.8306347131729126, -0.772354781627655, -0.7140748500823975, -0.6557949185371399, -0.5975149869918823, -0.53923499584198, -0.4809550642967224, -0.42267510294914246, -0.3643951714038849, -0.30611521005630493, -0.24783527851104736, -0.1895553469657898, -0.13127538561820984, -0.07299542427062988, -0.014715481549501419, 0.043564461171627045, 0.10184440016746521, 0.16012434661388397, 0.21840429306030273, 0.2766842246055603, 0.33496418595314026, 0.3932441174983978, 0.4515240490436554, 0.5098040103912354, 0.5680839419364929, 0.6263638734817505, 0.6846438646316528, 0.7429237365722656, 0.801203727722168, 0.8594836592674255, 0.9177635908126831, 0.9760435223579407, 1.0343234539031982, 1.0926034450531006, 1.150883436203003, 1.2091633081436157, 1.267443299293518, 1.3257231712341309, 1.3840031623840332, 1.442283034324646, 1.5005630254745483, 1.5588428974151611, 1.6171228885650635, 1.6754028797149658, 1.7336827516555786, 1.791962742805481]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4320980310440063, -1.3883832693099976, -1.3446685075759888, -1.3009538650512695, -1.2572391033172607, -1.213524341583252, -1.1698095798492432, -1.1260948181152344, -1.0823800563812256, -1.0386652946472168, -0.9949505925178528, -0.951235830783844, -0.90752112865448, -0.8638063669204712, -0.8200916051864624, -0.7763768434524536, -0.7326622009277344, -0.6889474391937256, -0.6452327370643616, -0.6015179753303528, -0.5578032732009888, -0.51408851146698, -0.4703737497329712, -0.4266590178012848, -0.3829442858695984, -0.339229553937912, -0.2955148220062256, -0.2518000602722168, -0.2080853283405304, -0.164370596408844, -0.1206558346748352, -0.0769411027431488, -0.03322649002075195, 0.010488249361515045, 0.05420298874378204, 0.09791773557662964, 0.14163246750831604, 0.18534719944000244, 0.22906196117401123, 0.27277669310569763, 0.31649142503738403, 0.36020615696907043, 0.40392088890075684, 0.4476356506347656, 0.491350382566452, 0.5350651144981384, 0.5787798762321472, 0.6224945783615112, 0.66620934009552, 0.7099241018295288, 0.7536388039588928, 0.7973535656929016, 0.8410682678222656, 0.8847830295562744, 0.9284977912902832, 0.972212553024292, 1.0159273147583008, 1.0596420764923096, 1.1033568382263184, 1.1470715999603271, 1.1907862424850464, 1.2345010042190552, 1.278215765953064, 1.3219305276870728, 1.365645170211792]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 5.0, 8.0, 7.0, 16.0, 15.0, 20.0, 23.0, 31.0, 35.0, 37.0, 74.0, 57.0, 62.0, 68.0, 87.0, 70.0, 58.0, 78.0, 44.0, 46.0, 35.0, 37.0, 25.0, 17.0, 12.0, 7.0, 1.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279541015625, -0.27188873291015625, -0.2642364501953125, -0.25658416748046875, -0.248931884765625, -0.24127960205078125, -0.2336273193359375, -0.22597503662109375, -0.21832275390625, -0.21067047119140625, -0.2030181884765625, -0.19536590576171875, -0.187713623046875, -0.18006134033203125, -0.1724090576171875, -0.16475677490234375, -0.1571044921875, -0.14945220947265625, -0.1417999267578125, -0.13414764404296875, -0.126495361328125, -0.11884307861328125, -0.1111907958984375, -0.10353851318359375, -0.09588623046875, -0.08823394775390625, -0.0805816650390625, -0.07292938232421875, -0.065277099609375, -0.05762481689453125, -0.0499725341796875, -0.04232025146484375, -0.03466796875, -0.02701568603515625, -0.0193634033203125, -0.01171112060546875, -0.004058837890625, 0.00359344482421875, 0.0112457275390625, 0.01889801025390625, 0.02655029296875, 0.03420257568359375, 0.0418548583984375, 0.04950714111328125, 0.057159423828125, 0.06481170654296875, 0.0724639892578125, 0.08011627197265625, 0.0877685546875, 0.09542083740234375, 0.1030731201171875, 0.11072540283203125, 0.118377685546875, 0.12602996826171875, 0.1336822509765625, 0.14133453369140625, 0.14898681640625, 0.15663909912109375, 0.1642913818359375, 0.17194366455078125, 0.179595947265625, 0.18724822998046875, 0.1949005126953125, 0.20255279541015625, 0.210205078125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 13.0, 17.0, 29.0, 34.0, 54.0, 76.0, 122.0, 180.0, 311.0, 540.0, 966.0, 1754.0, 3615.0, 7624.0, 17935.0, 50805.0, 192073.0, 172171.0, 45460.0, 16354.0, 6953.0, 3319.0, 1690.0, 894.0, 477.0, 298.0, 168.0, 124.0, 78.0, 37.0, 29.0, 16.0, 13.0, 8.0, 11.0, 6.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.532928466796875, -2.42718505859375, -2.321441650390625, -2.2156982421875, -2.109954833984375, -2.00421142578125, -1.898468017578125, -1.792724609375, -1.686981201171875, -1.58123779296875, -1.475494384765625, -1.3697509765625, -1.264007568359375, -1.15826416015625, -1.052520751953125, -0.94677734375, -0.841033935546875, -0.73529052734375, -0.629547119140625, -0.5238037109375, -0.418060302734375, -0.31231689453125, -0.206573486328125, -0.100830078125, 0.004913330078125, 0.11065673828125, 0.216400146484375, 0.3221435546875, 0.427886962890625, 0.53363037109375, 0.639373779296875, 0.7451171875, 0.850860595703125, 0.95660400390625, 1.062347412109375, 1.1680908203125, 1.273834228515625, 1.37957763671875, 1.485321044921875, 1.591064453125, 1.696807861328125, 1.80255126953125, 1.908294677734375, 2.0140380859375, 2.119781494140625, 2.22552490234375, 2.331268310546875, 2.43701171875, 2.542755126953125, 2.64849853515625, 2.754241943359375, 2.8599853515625, 2.965728759765625, 3.07147216796875, 3.177215576171875, 3.282958984375, 3.388702392578125, 3.49444580078125, 3.600189208984375, 3.7059326171875, 3.811676025390625, 3.91741943359375, 4.023162841796875, 4.12890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 13.0, 17.0, 15.0, 17.0, 18.0, 18.0, 27.0, 27.0, 34.0, 33.0, 37.0, 56.0, 49.0, 59.0, 51.0, 52.0, 61.0, 44.0, 51.0, 33.0, 36.0, 29.0, 37.0, 24.0, 21.0, 24.0, 24.0, 22.0, 10.0, 13.0, 11.0, 4.0, 2.0, 9.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.2611961364746094, -0.25237274169921875, -0.24354934692382812, -0.2347259521484375, -0.22590255737304688, -0.21707916259765625, -0.20825576782226562, -0.199432373046875, -0.19060897827148438, -0.18178558349609375, -0.17296218872070312, -0.1641387939453125, -0.15531539916992188, -0.14649200439453125, -0.13766860961914062, -0.12884521484375, -0.12002182006835938, -0.11119842529296875, -0.10237503051757812, -0.0935516357421875, -0.08472824096679688, -0.07590484619140625, -0.06708145141601562, -0.058258056640625, -0.049434661865234375, -0.04061126708984375, -0.031787872314453125, -0.0229644775390625, -0.014141082763671875, -0.00531768798828125, 0.003505706787109375, 0.0123291015625, 0.021152496337890625, 0.02997589111328125, 0.038799285888671875, 0.0476226806640625, 0.056446075439453125, 0.06526947021484375, 0.07409286499023438, 0.082916259765625, 0.09173965454101562, 0.10056304931640625, 0.10938644409179688, 0.1182098388671875, 0.12703323364257812, 0.13585662841796875, 0.14468002319335938, 0.15350341796875, 0.16232681274414062, 0.17115020751953125, 0.17997360229492188, 0.1887969970703125, 0.19762039184570312, 0.20644378662109375, 0.21526718139648438, 0.224090576171875, 0.23291397094726562, 0.24173736572265625, 0.2505607604980469, 0.2593841552734375, 0.2682075500488281, 0.27703094482421875, 0.2858543395996094, 0.294677734375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 11.0, 8.0, 18.0, 12.0, 11.0, 21.0, 22.0, 33.0, 41.0, 37.0, 52.0, 43.0, 39.0, 30.0, 22.0, 20.0, 13.0, 6.0, 13.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0747687816619873, -1.0402421951293945, -1.0057154893875122, -0.9711889028549194, -0.9366622567176819, -0.9021356105804443, -0.8676090240478516, -0.833082377910614, -0.7985557317733765, -0.7640290856361389, -0.7295024991035461, -0.6949758529663086, -0.660449206829071, -0.6259225606918335, -0.5913959741592407, -0.5568693280220032, -0.5223427414894104, -0.48781612515449524, -0.4532894790172577, -0.41876286268234253, -0.384236216545105, -0.3497096002101898, -0.31518298387527466, -0.2806563377380371, -0.24612972140312195, -0.2116030901670456, -0.17707645893096924, -0.14254984259605408, -0.10802321135997772, -0.07349658012390137, -0.038969963788986206, -0.004443332552909851, 0.030083298683166504, 0.06460992991924286, 0.09913655370473862, 0.13366317749023438, 0.16818980872631073, 0.20271643996238708, 0.23724305629730225, 0.2717697024345398, 0.30629631876945496, 0.3408229351043701, 0.37534958124160767, 0.4098761975765228, 0.444402813911438, 0.47892946004867554, 0.5134561061859131, 0.5479826927185059, 0.5825093388557434, 0.617035984992981, 0.6515625715255737, 0.6860892176628113, 0.7206158638000488, 0.7551424503326416, 0.7896690964698792, 0.8241957426071167, 0.8587223291397095, 0.893248975276947, 0.9277755618095398, 0.9623022079467773, 0.9968288540840149, 1.0313555002212524, 1.0658820867538452, 1.100408673286438, 1.1349353790283203]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 5.0, 1.0, 13.0, 1.0, 9.0, 11.0, 15.0, 16.0, 19.0, 23.0, 35.0, 34.0, 47.0, 40.0, 52.0, 33.0, 27.0, 17.0, 15.0, 8.0, 8.0, 4.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.28456449508667, -1.245125412940979, -1.205686330795288, -1.1662472486495972, -1.1268081665039062, -1.0873689651489258, -1.0479298830032349, -1.008490800857544, -0.969051718711853, -0.9296126365661621, -0.8901735544204712, -0.8507344126701355, -0.8112953305244446, -0.7718562483787537, -0.732417106628418, -0.692978024482727, -0.6535389423370361, -0.6140998601913452, -0.5746607780456543, -0.5352216362953186, -0.4957825541496277, -0.45634347200393677, -0.41690436005592346, -0.37746524810791016, -0.33802616596221924, -0.2985870838165283, -0.259147971868515, -0.2197088748216629, -0.1802697777748108, -0.14083068072795868, -0.10139158368110657, -0.06195247173309326, -0.022513389587402344, 0.016925707459449768, 0.05636480450630188, 0.09580390155315399, 0.1352429986000061, 0.17468209564685822, 0.21412119269371033, 0.25356030464172363, 0.29299938678741455, 0.33243846893310547, 0.3718775808811188, 0.4113166928291321, 0.450755774974823, 0.4901948571205139, 0.5296339988708496, 0.5690730810165405, 0.6085121631622314, 0.6479512453079224, 0.6873903274536133, 0.726829469203949, 0.7662685513496399, 0.8057076334953308, 0.8451467752456665, 0.8845858573913574, 0.9240249395370483, 0.9634640216827393, 1.0029031038284302, 1.042342185974121, 1.0817813873291016, 1.1212204694747925, 1.1606595516204834, 1.2000986337661743, 1.2395377159118652]}, "eval/loss": 3.0510671138763428, "eval/bleu": 1.5827445667544166e-18, "eval/runtime": 2619.9089, "eval/samples_per_second": 5.634, "eval/steps_per_second": 0.704, "train/train_runtime": 93795.5595, "train/train_samples_per_second": 6.633, "train/train_steps_per_second": 0.104, "train/total_flos": 0.0, "train/train_loss": 3.260483605049765} \ No newline at end of file +{"train/loss": 0.9251, "train/learning_rate": 3.2066153313506185e-07, "train/epoch": 3.0, "train/global_step": 9720, "_runtime": 93795, "_timestamp": 1651767884, "_step": 9739, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 41.0, 232.0, 466.0, 211.0, 43.0, 14.0, 1.0], "bins": [-22.81093406677246, -22.4266300201416, -22.042327880859375, -21.658023834228516, -21.27372169494629, -20.88941764831543, -20.505115509033203, -20.120811462402344, -19.736509323120117, -19.352205276489258, -18.96790313720703, -18.583599090576172, -18.199296951293945, -17.814992904663086, -17.43069076538086, -17.04638671875, -16.66208267211914, -16.27777862548828, -15.893476486206055, -15.509173393249512, -15.124870300292969, -14.740567207336426, -14.356264114379883, -13.971960067749023, -13.587657928466797, -13.203354835510254, -12.819051742553711, -12.434748649597168, -12.050445556640625, -11.666142463684082, -11.281839370727539, -10.89753532409668, -10.513232231140137, -10.128929138183594, -9.74462604522705, -9.360322952270508, -8.976019859313965, -8.591716766357422, -8.207412719726562, -7.823110103607178, -7.438807487487793, -7.05450439453125, -6.670201301574707, -6.285898208618164, -5.901595115661621, -5.517292022705078, -5.132988452911377, -4.748685359954834, -4.364382266998291, -3.980079174041748, -3.595776081085205, -3.211472749710083, -2.82716965675354, -2.442866563796997, -2.058563232421875, -1.674260139465332, -1.2899569272994995, -0.9056537747383118, -0.521350622177124, -0.1370474100112915, 0.24725568294525146, 0.6315587759017944, 1.0158621072769165, 1.4001652002334595, 1.7844682931900024]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 3.0, 8.0, 13.0, 11.0, 13.0, 15.0, 16.0, 22.0, 21.0, 24.0, 29.0, 26.0, 28.0, 39.0, 33.0, 41.0, 34.0, 32.0, 33.0, 47.0, 38.0, 41.0, 30.0, 35.0, 35.0, 43.0, 38.0, 31.0, 30.0, 23.0, 33.0, 16.0, 25.0, 16.0, 12.0, 19.0, 6.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 6.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.0006556510925293, -1.933129072189331, -1.8656026124954224, -1.7980761528015137, -1.7305495738983154, -1.6630229949951172, -1.5954965353012085, -1.5279700756072998, -1.4604434967041016, -1.3929169178009033, -1.3253904581069946, -1.257863998413086, -1.1903374195098877, -1.1228108406066895, -1.0552843809127808, -0.9877578616142273, -0.9202313423156738, -0.8527048230171204, -0.7851783037185669, -0.7176517844200134, -0.65012526512146, -0.5825987458229065, -0.515072226524353, -0.44754570722579956, -0.3800191879272461, -0.3124926686286926, -0.24496614933013916, -0.1774396300315857, -0.10991311073303223, -0.04238659143447876, 0.025139927864074707, 0.09266644716262817, 0.16019272804260254, 0.227719247341156, 0.2952457666397095, 0.36277228593826294, 0.4302988052368164, 0.4978253245353699, 0.5653518438339233, 0.6328783631324768, 0.7004048824310303, 0.7679314017295837, 0.8354579210281372, 0.9029844403266907, 0.9705109596252441, 1.0380375385284424, 1.105563998222351, 1.1730904579162598, 1.240617036819458, 1.3081436157226562, 1.375670075416565, 1.4431965351104736, 1.5107231140136719, 1.5782496929168701, 1.6457761526107788, 1.7133026123046875, 1.7808291912078857, 1.848355770111084, 1.9158822298049927, 1.9834086894989014, 2.0509352684020996, 2.118461847305298, 2.185988426208496, 2.2535147666931152, 2.3210413455963135]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 7.0, 8.0, 9.0, 10.0, 20.0, 21.0, 38.0, 62.0, 83.0, 124.0, 179.0, 285.0, 389.0, 552.0, 796.0, 1204.0, 1853.0, 3058.0, 5427.0, 9892.0, 19022.0, 38094.0, 82406.0, 219508.0, 868829.0, 2214707.0, 462620.0, 142770.0, 60228.0, 28659.0, 14034.0, 7695.0, 4267.0, 2619.0, 1648.0, 1032.0, 694.0, 471.0, 298.0, 220.0, 151.0, 92.0, 76.0, 41.0, 29.0, 27.0, 10.0, 8.0, 6.0, 5.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.96484375, -1.899993896484375, -1.83514404296875, -1.770294189453125, -1.7054443359375, -1.640594482421875, -1.57574462890625, -1.510894775390625, -1.446044921875, -1.381195068359375, -1.31634521484375, -1.251495361328125, -1.1866455078125, -1.121795654296875, -1.05694580078125, -0.992095947265625, -0.92724609375, -0.862396240234375, -0.79754638671875, -0.732696533203125, -0.6678466796875, -0.602996826171875, -0.53814697265625, -0.473297119140625, -0.408447265625, -0.343597412109375, -0.27874755859375, -0.213897705078125, -0.1490478515625, -0.084197998046875, -0.01934814453125, 0.045501708984375, 0.1103515625, 0.175201416015625, 0.24005126953125, 0.304901123046875, 0.3697509765625, 0.434600830078125, 0.49945068359375, 0.564300537109375, 0.629150390625, 0.694000244140625, 0.75885009765625, 0.823699951171875, 0.8885498046875, 0.953399658203125, 1.01824951171875, 1.083099365234375, 1.14794921875, 1.212799072265625, 1.27764892578125, 1.342498779296875, 1.4073486328125, 1.472198486328125, 1.53704833984375, 1.601898193359375, 1.666748046875, 1.731597900390625, 1.79644775390625, 1.861297607421875, 1.9261474609375, 1.990997314453125, 2.05584716796875, 2.120697021484375, 2.185546875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 10.0, 4.0, 9.0, 9.0, 13.0, 11.0, 14.0, 25.0, 22.0, 30.0, 15.0, 32.0, 40.0, 40.0, 37.0, 45.0, 26.0, 51.0, 47.0, 53.0, 48.0, 48.0, 44.0, 29.0, 52.0, 41.0, 29.0, 32.0, 21.0, 23.0, 21.0, 22.0, 14.0, 10.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.65625, -3.538665771484375, -3.42108154296875, -3.303497314453125, -3.1859130859375, -3.068328857421875, -2.95074462890625, -2.833160400390625, -2.715576171875, -2.597991943359375, -2.48040771484375, -2.362823486328125, -2.2452392578125, -2.127655029296875, -2.01007080078125, -1.892486572265625, -1.77490234375, -1.657318115234375, -1.53973388671875, -1.422149658203125, -1.3045654296875, -1.186981201171875, -1.06939697265625, -0.951812744140625, -0.834228515625, -0.716644287109375, -0.59906005859375, -0.481475830078125, -0.3638916015625, -0.246307373046875, -0.12872314453125, -0.011138916015625, 0.1064453125, 0.224029541015625, 0.34161376953125, 0.459197998046875, 0.5767822265625, 0.694366455078125, 0.81195068359375, 0.929534912109375, 1.047119140625, 1.164703369140625, 1.28228759765625, 1.399871826171875, 1.5174560546875, 1.635040283203125, 1.75262451171875, 1.870208740234375, 1.98779296875, 2.105377197265625, 2.22296142578125, 2.340545654296875, 2.4581298828125, 2.575714111328125, 2.69329833984375, 2.810882568359375, 2.928466796875, 3.046051025390625, 3.16363525390625, 3.281219482421875, 3.3988037109375, 3.516387939453125, 3.63397216796875, 3.751556396484375, 3.869140625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 3.0, 6.0, 7.0, 11.0, 11.0, 21.0, 35.0, 58.0, 86.0, 172.0, 1069.0, 4186925.0, 5374.0, 249.0, 95.0, 60.0, 26.0, 22.0, 30.0, 13.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-65.5625, -63.6708984375, -61.779296875, -59.8876953125, -57.99609375, -56.1044921875, -54.212890625, -52.3212890625, -50.4296875, -48.5380859375, -46.646484375, -44.7548828125, -42.86328125, -40.9716796875, -39.080078125, -37.1884765625, -35.296875, -33.4052734375, -31.513671875, -29.6220703125, -27.73046875, -25.8388671875, -23.947265625, -22.0556640625, -20.1640625, -18.2724609375, -16.380859375, -14.4892578125, -12.59765625, -10.7060546875, -8.814453125, -6.9228515625, -5.03125, -3.1396484375, -1.248046875, 0.6435546875, 2.53515625, 4.4267578125, 6.318359375, 8.2099609375, 10.1015625, 11.9931640625, 13.884765625, 15.7763671875, 17.66796875, 19.5595703125, 21.451171875, 23.3427734375, 25.234375, 27.1259765625, 29.017578125, 30.9091796875, 32.80078125, 34.6923828125, 36.583984375, 38.4755859375, 40.3671875, 42.2587890625, 44.150390625, 46.0419921875, 47.93359375, 49.8251953125, 51.716796875, 53.6083984375, 55.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 6.0, 6.0, 15.0, 18.0, 24.0, 26.0, 66.0, 92.0, 157.0, 682.0, 2059.0, 554.0, 142.0, 84.0, 49.0, 29.0, 22.0, 13.0, 13.0, 11.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.216796875, -2.14630126953125, -2.0758056640625, -2.00531005859375, -1.934814453125, -1.86431884765625, -1.7938232421875, -1.72332763671875, -1.65283203125, -1.58233642578125, -1.5118408203125, -1.44134521484375, -1.370849609375, -1.30035400390625, -1.2298583984375, -1.15936279296875, -1.0888671875, -1.01837158203125, -0.9478759765625, -0.87738037109375, -0.806884765625, -0.73638916015625, -0.6658935546875, -0.59539794921875, -0.52490234375, -0.45440673828125, -0.3839111328125, -0.31341552734375, -0.242919921875, -0.17242431640625, -0.1019287109375, -0.03143310546875, 0.0390625, 0.10955810546875, 0.1800537109375, 0.25054931640625, 0.321044921875, 0.39154052734375, 0.4620361328125, 0.53253173828125, 0.60302734375, 0.67352294921875, 0.7440185546875, 0.81451416015625, 0.885009765625, 0.95550537109375, 1.0260009765625, 1.09649658203125, 1.1669921875, 1.23748779296875, 1.3079833984375, 1.37847900390625, 1.448974609375, 1.51947021484375, 1.5899658203125, 1.66046142578125, 1.73095703125, 1.80145263671875, 1.8719482421875, 1.94244384765625, 2.012939453125, 2.08343505859375, 2.1539306640625, 2.22442626953125, 2.294921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 13.0, 26.0, 31.0, 35.0, 72.0, 82.0, 131.0, 130.0, 138.0, 111.0, 78.0, 52.0, 37.0, 24.0, 12.0, 9.0, 5.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-12.560930252075195, -12.301332473754883, -12.04173469543457, -11.782137870788574, -11.522540092468262, -11.26294231414795, -11.003345489501953, -10.74374771118164, -10.484149932861328, -10.224552154541016, -9.964954376220703, -9.705357551574707, -9.445759773254395, -9.186161994934082, -8.926565170288086, -8.666967391967773, -8.407369613647461, -8.147771835327148, -7.888174533843994, -7.62857723236084, -7.368979454040527, -7.109381675720215, -6.8497843742370605, -6.590187072753906, -6.330589294433594, -6.070991516113281, -5.811394214630127, -5.551796913146973, -5.29219913482666, -5.032601356506348, -4.773004055023193, -4.513406753540039, -4.253809928894043, -3.9942123889923096, -3.734614849090576, -3.4750173091888428, -3.2154197692871094, -2.955822229385376, -2.6962246894836426, -2.436627149581909, -2.177029609680176, -1.9174320697784424, -1.657834529876709, -1.3982369899749756, -1.1386394500732422, -0.8790419101715088, -0.6194443702697754, -0.359846830368042, -0.1002492904663086, 0.1593482494354248, 0.4189457893371582, 0.6785433292388916, 0.938140869140625, 1.1977384090423584, 1.4573359489440918, 1.7169334888458252, 1.9765310287475586, 2.236128568649292, 2.4957261085510254, 2.755323648452759, 3.014921188354492, 3.2745187282562256, 3.534116268157959, 3.7937138080596924, 4.053311347961426]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 9.0, 6.0, 10.0, 11.0, 16.0, 14.0, 16.0, 19.0, 18.0, 17.0, 29.0, 28.0, 34.0, 48.0, 40.0, 34.0, 31.0, 49.0, 33.0, 45.0, 38.0, 36.0, 44.0, 42.0, 32.0, 32.0, 29.0, 32.0, 32.0, 24.0, 27.0, 15.0, 20.0, 23.0, 11.0, 17.0, 5.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.888427495956421, -2.7885069847106934, -2.688586711883545, -2.5886662006378174, -2.488745927810669, -2.3888254165649414, -2.288905143737793, -2.1889846324920654, -2.089064121246338, -1.9891437292099, -1.889223337173462, -1.7893028259277344, -1.689382553100586, -1.5894620418548584, -1.4895416498184204, -1.3896212577819824, -1.289700984954834, -1.189780592918396, -1.089860200881958, -0.9899397492408752, -0.8900193572044373, -0.7900989651679993, -0.6901785135269165, -0.5902581214904785, -0.4903377294540405, -0.39041733741760254, -0.29049691557884216, -0.1905764937400818, -0.0906561017036438, 0.00926429033279419, 0.10918474197387695, 0.20910513401031494, 0.30902528762817383, 0.4089456796646118, 0.5088660717010498, 0.6087865233421326, 0.7087069153785706, 0.8086273074150085, 0.9085477590560913, 1.0084681510925293, 1.1083885431289673, 1.2083089351654053, 1.3082293272018433, 1.4081497192382812, 1.5080702304840088, 1.6079905033111572, 1.7079110145568848, 1.8078314065933228, 1.9077517986297607, 2.0076723098754883, 2.1075925827026367, 2.2075130939483643, 2.3074333667755127, 2.4073538780212402, 2.5072741508483887, 2.607194662094116, 2.7071151733398438, 2.8070356845855713, 2.9069559574127197, 3.0068764686584473, 3.1067967414855957, 3.2067172527313232, 3.306637763977051, 3.406558036804199, 3.5064783096313477]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 8.0, 16.0, 31.0, 47.0, 88.0, 148.0, 271.0, 435.0, 753.0, 1359.0, 2627.0, 5296.0, 11371.0, 26243.0, 65216.0, 173036.0, 349536.0, 248225.0, 96093.0, 37240.0, 15846.0, 7179.0, 3501.0, 1695.0, 932.0, 565.0, 317.0, 188.0, 131.0, 56.0, 20.0, 24.0, 13.0, 12.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.291015625, -1.24603271484375, -1.2010498046875, -1.15606689453125, -1.111083984375, -1.06610107421875, -1.0211181640625, -0.97613525390625, -0.93115234375, -0.88616943359375, -0.8411865234375, -0.79620361328125, -0.751220703125, -0.70623779296875, -0.6612548828125, -0.61627197265625, -0.5712890625, -0.52630615234375, -0.4813232421875, -0.43634033203125, -0.391357421875, -0.34637451171875, -0.3013916015625, -0.25640869140625, -0.21142578125, -0.16644287109375, -0.1214599609375, -0.07647705078125, -0.031494140625, 0.01348876953125, 0.0584716796875, 0.10345458984375, 0.1484375, 0.19342041015625, 0.2384033203125, 0.28338623046875, 0.328369140625, 0.37335205078125, 0.4183349609375, 0.46331787109375, 0.50830078125, 0.55328369140625, 0.5982666015625, 0.64324951171875, 0.688232421875, 0.73321533203125, 0.7781982421875, 0.82318115234375, 0.8681640625, 0.91314697265625, 0.9581298828125, 1.00311279296875, 1.048095703125, 1.09307861328125, 1.1380615234375, 1.18304443359375, 1.22802734375, 1.27301025390625, 1.3179931640625, 1.36297607421875, 1.407958984375, 1.45294189453125, 1.4979248046875, 1.54290771484375, 1.587890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 12.0, 9.0, 14.0, 19.0, 27.0, 19.0, 30.0, 32.0, 37.0, 41.0, 47.0, 64.0, 63.0, 50.0, 65.0, 54.0, 59.0, 55.0, 52.0, 56.0, 37.0, 42.0, 28.0, 25.0, 14.0, 9.0, 15.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.1015625, -3.98828125, -3.875, -3.76171875, -3.6484375, -3.53515625, -3.421875, -3.30859375, -3.1953125, -3.08203125, -2.96875, -2.85546875, -2.7421875, -2.62890625, -2.515625, -2.40234375, -2.2890625, -2.17578125, -2.0625, -1.94921875, -1.8359375, -1.72265625, -1.609375, -1.49609375, -1.3828125, -1.26953125, -1.15625, -1.04296875, -0.9296875, -0.81640625, -0.703125, -0.58984375, -0.4765625, -0.36328125, -0.25, -0.13671875, -0.0234375, 0.08984375, 0.203125, 0.31640625, 0.4296875, 0.54296875, 0.65625, 0.76953125, 0.8828125, 0.99609375, 1.109375, 1.22265625, 1.3359375, 1.44921875, 1.5625, 1.67578125, 1.7890625, 1.90234375, 2.015625, 2.12890625, 2.2421875, 2.35546875, 2.46875, 2.58203125, 2.6953125, 2.80859375, 2.921875, 3.03515625, 3.1484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 3.0, 11.0, 17.0, 21.0, 30.0, 42.0, 76.0, 101.0, 183.0, 418.0, 634.0, 1361.0, 3222.0, 8430.0, 25532.0, 94036.0, 378079.0, 394984.0, 99770.0, 26703.0, 8597.0, 3250.0, 1409.0, 724.0, 355.0, 188.0, 127.0, 78.0, 48.0, 36.0, 18.0, 21.0, 10.0, 9.0, 5.0, 2.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8125, -1.7607421875, -1.708984375, -1.6572265625, -1.60546875, -1.5537109375, -1.501953125, -1.4501953125, -1.3984375, -1.3466796875, -1.294921875, -1.2431640625, -1.19140625, -1.1396484375, -1.087890625, -1.0361328125, -0.984375, -0.9326171875, -0.880859375, -0.8291015625, -0.77734375, -0.7255859375, -0.673828125, -0.6220703125, -0.5703125, -0.5185546875, -0.466796875, -0.4150390625, -0.36328125, -0.3115234375, -0.259765625, -0.2080078125, -0.15625, -0.1044921875, -0.052734375, -0.0009765625, 0.05078125, 0.1025390625, 0.154296875, 0.2060546875, 0.2578125, 0.3095703125, 0.361328125, 0.4130859375, 0.46484375, 0.5166015625, 0.568359375, 0.6201171875, 0.671875, 0.7236328125, 0.775390625, 0.8271484375, 0.87890625, 0.9306640625, 0.982421875, 1.0341796875, 1.0859375, 1.1376953125, 1.189453125, 1.2412109375, 1.29296875, 1.3447265625, 1.396484375, 1.4482421875, 1.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 4.0, 7.0, 9.0, 11.0, 10.0, 15.0, 8.0, 24.0, 28.0, 30.0, 38.0, 33.0, 28.0, 38.0, 32.0, 41.0, 34.0, 45.0, 37.0, 47.0, 44.0, 54.0, 44.0, 41.0, 36.0, 25.0, 35.0, 34.0, 25.0, 17.0, 17.0, 13.0, 19.0, 13.0, 11.0, 8.0, 10.0, 12.0, 12.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.43597412109375, -5.2625732421875, -5.08917236328125, -4.915771484375, -4.74237060546875, -4.5689697265625, -4.39556884765625, -4.22216796875, -4.04876708984375, -3.8753662109375, -3.70196533203125, -3.528564453125, -3.35516357421875, -3.1817626953125, -3.00836181640625, -2.8349609375, -2.66156005859375, -2.4881591796875, -2.31475830078125, -2.141357421875, -1.96795654296875, -1.7945556640625, -1.62115478515625, -1.44775390625, -1.27435302734375, -1.1009521484375, -0.92755126953125, -0.754150390625, -0.58074951171875, -0.4073486328125, -0.23394775390625, -0.060546875, 0.11285400390625, 0.2862548828125, 0.45965576171875, 0.633056640625, 0.80645751953125, 0.9798583984375, 1.15325927734375, 1.32666015625, 1.50006103515625, 1.6734619140625, 1.84686279296875, 2.020263671875, 2.19366455078125, 2.3670654296875, 2.54046630859375, 2.7138671875, 2.88726806640625, 3.0606689453125, 3.23406982421875, 3.407470703125, 3.58087158203125, 3.7542724609375, 3.92767333984375, 4.10107421875, 4.27447509765625, 4.4478759765625, 4.62127685546875, 4.794677734375, 4.96807861328125, 5.1414794921875, 5.31488037109375, 5.48828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 2.0, 7.0, 14.0, 26.0, 37.0, 37.0, 57.0, 85.0, 121.0, 227.0, 306.0, 540.0, 838.0, 1482.0, 2504.0, 4760.0, 9445.0, 21136.0, 53814.0, 170990.0, 420848.0, 237123.0, 73071.0, 26541.0, 11585.0, 5552.0, 3031.0, 1710.0, 1020.0, 557.0, 346.0, 239.0, 154.0, 103.0, 67.0, 48.0, 45.0, 22.0, 20.0, 8.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.373779296875, -0.3619651794433594, -0.35015106201171875, -0.3383369445800781, -0.3265228271484375, -0.3147087097167969, -0.30289459228515625, -0.2910804748535156, -0.279266357421875, -0.2674522399902344, -0.25563812255859375, -0.24382400512695312, -0.2320098876953125, -0.22019577026367188, -0.20838165283203125, -0.19656753540039062, -0.18475341796875, -0.17293930053710938, -0.16112518310546875, -0.14931106567382812, -0.1374969482421875, -0.12568283081054688, -0.11386871337890625, -0.10205459594726562, -0.090240478515625, -0.07842636108398438, -0.06661224365234375, -0.054798126220703125, -0.0429840087890625, -0.031169891357421875, -0.01935577392578125, -0.007541656494140625, 0.0042724609375, 0.016086578369140625, 0.02790069580078125, 0.039714813232421875, 0.0515289306640625, 0.06334304809570312, 0.07515716552734375, 0.08697128295898438, 0.098785400390625, 0.11059951782226562, 0.12241363525390625, 0.13422775268554688, 0.1460418701171875, 0.15785598754882812, 0.16967010498046875, 0.18148422241210938, 0.19329833984375, 0.20511245727539062, 0.21692657470703125, 0.22874069213867188, 0.2405548095703125, 0.2523689270019531, 0.26418304443359375, 0.2759971618652344, 0.287811279296875, 0.2996253967285156, 0.31143951416015625, 0.3232536315917969, 0.3350677490234375, 0.3468818664550781, 0.35869598388671875, 0.3705101013183594, 0.38232421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 12.0, 14.0, 28.0, 20.0, 40.0, 66.0, 81.0, 106.0, 125.0, 142.0, 102.0, 76.0, 54.0, 28.0, 32.0, 21.0, 11.0, 10.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037741661071777344, -0.00036386027932167053, -0.0003503039479255676, -0.0003367476165294647, -0.0003231912851333618, -0.0003096349537372589, -0.000296078622341156, -0.0002825222909450531, -0.0002689659595489502, -0.0002554096281528473, -0.00024185329675674438, -0.00022829696536064148, -0.00021474063396453857, -0.00020118430256843567, -0.00018762797117233276, -0.00017407163977622986, -0.00016051530838012695, -0.00014695897698402405, -0.00013340264558792114, -0.00011984631419181824, -0.00010628998279571533, -9.273365139961243e-05, -7.917732000350952e-05, -6.562098860740662e-05, -5.206465721130371e-05, -3.8508325815200806e-05, -2.49519944190979e-05, -1.1395663022994995e-05, 2.16066837310791e-06, 1.5716999769210815e-05, 2.927333116531372e-05, 4.2829662561416626e-05, 5.638599395751953e-05, 6.994232535362244e-05, 8.349865674972534e-05, 9.705498814582825e-05, 0.00011061131954193115, 0.00012416765093803406, 0.00013772398233413696, 0.00015128031373023987, 0.00016483664512634277, 0.00017839297652244568, 0.00019194930791854858, 0.0002055056393146515, 0.0002190619707107544, 0.0002326183021068573, 0.0002461746335029602, 0.0002597309648990631, 0.000273287296295166, 0.0002868436276912689, 0.0003003999590873718, 0.00031395629048347473, 0.00032751262187957764, 0.00034106895327568054, 0.00035462528467178345, 0.00036818161606788635, 0.00038173794746398926, 0.00039529427886009216, 0.00040885061025619507, 0.000422406941652298, 0.0004359632730484009, 0.0004495196044445038, 0.0004630759358406067, 0.0004766322672367096, 0.0004901885986328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 14.0, 11.0, 11.0, 35.0, 40.0, 66.0, 108.0, 229.0, 976.0, 6056.0, 71367.0, 832968.0, 125746.0, 8947.0, 1273.0, 305.0, 124.0, 91.0, 50.0, 24.0, 19.0, 19.0, 9.0, 8.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.331939697265625, -1.28692626953125, -1.241912841796875, -1.1968994140625, -1.151885986328125, -1.10687255859375, -1.061859130859375, -1.016845703125, -0.971832275390625, -0.92681884765625, -0.881805419921875, -0.8367919921875, -0.791778564453125, -0.74676513671875, -0.701751708984375, -0.65673828125, -0.611724853515625, -0.56671142578125, -0.521697998046875, -0.4766845703125, -0.431671142578125, -0.38665771484375, -0.341644287109375, -0.296630859375, -0.251617431640625, -0.20660400390625, -0.161590576171875, -0.1165771484375, -0.071563720703125, -0.02655029296875, 0.018463134765625, 0.0634765625, 0.108489990234375, 0.15350341796875, 0.198516845703125, 0.2435302734375, 0.288543701171875, 0.33355712890625, 0.378570556640625, 0.423583984375, 0.468597412109375, 0.51361083984375, 0.558624267578125, 0.6036376953125, 0.648651123046875, 0.69366455078125, 0.738677978515625, 0.78369140625, 0.828704833984375, 0.87371826171875, 0.918731689453125, 0.9637451171875, 1.008758544921875, 1.05377197265625, 1.098785400390625, 1.143798828125, 1.188812255859375, 1.23382568359375, 1.278839111328125, 1.3238525390625, 1.368865966796875, 1.41387939453125, 1.458892822265625, 1.50390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 5.0, 1.0, 8.0, 4.0, 5.0, 17.0, 15.0, 16.0, 20.0, 29.0, 33.0, 42.0, 40.0, 50.0, 54.0, 68.0, 70.0, 59.0, 63.0, 69.0, 60.0, 46.0, 56.0, 27.0, 40.0, 30.0, 16.0, 17.0, 8.0, 12.0, 9.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1416015625, -0.1370220184326172, -0.13244247436523438, -0.12786293029785156, -0.12328338623046875, -0.11870384216308594, -0.11412429809570312, -0.10954475402832031, -0.1049652099609375, -0.10038566589355469, -0.09580612182617188, -0.09122657775878906, -0.08664703369140625, -0.08206748962402344, -0.07748794555664062, -0.07290840148925781, -0.068328857421875, -0.06374931335449219, -0.059169769287109375, -0.05459022521972656, -0.05001068115234375, -0.04543113708496094, -0.040851593017578125, -0.03627204895019531, -0.0316925048828125, -0.027112960815429688, -0.022533416748046875, -0.017953872680664062, -0.01337432861328125, -0.008794784545898438, -0.004215240478515625, 0.0003643035888671875, 0.00494384765625, 0.009523391723632812, 0.014102935791015625, 0.018682479858398438, 0.02326202392578125, 0.027841567993164062, 0.032421112060546875, 0.03700065612792969, 0.0415802001953125, 0.04615974426269531, 0.050739288330078125, 0.05531883239746094, 0.05989837646484375, 0.06447792053222656, 0.06905746459960938, 0.07363700866699219, 0.078216552734375, 0.08279609680175781, 0.08737564086914062, 0.09195518493652344, 0.09653472900390625, 0.10111427307128906, 0.10569381713867188, 0.11027336120605469, 0.1148529052734375, 0.11943244934082031, 0.12401199340820312, 0.12859153747558594, 0.13317108154296875, 0.13775062561035156, 0.14233016967773438, 0.1469097137451172, 0.1514892578125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 13.0, 33.0, 121.0, 350.0, 322.0, 110.0, 40.0, 15.0, 3.0, 1.0, 3.0], "bins": [-31.517847061157227, -30.963668823242188, -30.40949058532715, -29.855310440063477, -29.301132202148438, -28.7469539642334, -28.19277572631836, -27.63859748840332, -27.08441925048828, -26.530241012573242, -25.976062774658203, -25.42188262939453, -24.867704391479492, -24.313526153564453, -23.759347915649414, -23.205169677734375, -22.650989532470703, -22.096811294555664, -21.542633056640625, -20.988452911376953, -20.434274673461914, -19.880096435546875, -19.325918197631836, -18.771739959716797, -18.217559814453125, -17.663381576538086, -17.109203338623047, -16.555023193359375, -16.000844955444336, -15.446666717529297, -14.892488479614258, -14.338310241699219, -13.784130096435547, -13.229951858520508, -12.675772666931152, -12.121594429016113, -11.567415237426758, -11.013236999511719, -10.45905876159668, -9.90488052368164, -9.350701332092285, -8.796523094177246, -8.24234390258789, -7.688165664672852, -7.133986949920654, -6.579808235168457, -6.025629997253418, -5.471451282501221, -4.917272567749023, -4.363093852996826, -3.808915376663208, -3.25473690032959, -2.7005581855773926, -2.1463794708251953, -1.5922009944915771, -1.038022518157959, -0.4838438034057617, 0.070334792137146, 0.6245133876800537, 1.1786919832229614, 1.7328705787658691, 2.2870492935180664, 2.8412277698516846, 3.3954062461853027, 3.9495849609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 10.0, 17.0, 23.0, 28.0, 29.0, 25.0, 41.0, 35.0, 65.0, 64.0, 65.0, 64.0, 56.0, 69.0, 60.0, 52.0, 54.0, 44.0, 49.0, 42.0, 26.0, 25.0, 15.0, 9.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.441911697387695, -4.322793006896973, -4.203674793243408, -4.0845561027526855, -3.965437889099121, -3.8463194370269775, -3.727200984954834, -3.6080825328826904, -3.488964080810547, -3.3698456287384033, -3.2507271766662598, -3.131608724594116, -3.0124902725219727, -2.893371820449829, -2.7742533683776855, -2.655134916305542, -2.5360164642333984, -2.416898012161255, -2.2977795600891113, -2.1786611080169678, -2.059542655944824, -1.9404242038726807, -1.821305751800537, -1.7021872997283936, -1.583068609237671, -1.4639501571655273, -1.3448317050933838, -1.2257132530212402, -1.1065948009490967, -0.9874762892723083, -0.8683578372001648, -0.7492393851280212, -0.6301209926605225, -0.5110025405883789, -0.39188408851623535, -0.2727656066417694, -0.15364715456962585, -0.03452867269515991, 0.08458977937698364, 0.2037082314491272, 0.32282668352127075, 0.4419451355934143, 0.5610635876655579, 0.6801820993423462, 0.7993005514144897, 0.9184190034866333, 1.0375374555587769, 1.1566559076309204, 1.275774359703064, 1.3948928117752075, 1.514011263847351, 1.6331297159194946, 1.7522481679916382, 1.8713667392730713, 1.9904851913452148, 2.1096036434173584, 2.228722095489502, 2.3478405475616455, 2.466958999633789, 2.5860774517059326, 2.705195903778076, 2.8243143558502197, 2.9434328079223633, 3.062551259994507, 3.1816697120666504]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 9.0, 17.0, 26.0, 34.0, 74.0, 129.0, 257.0, 594.0, 1410.0, 3652.0, 10241.0, 35789.0, 192897.0, 631025.0, 131685.0, 27353.0, 8093.0, 2947.0, 1208.0, 529.0, 257.0, 131.0, 79.0, 47.0, 19.0, 13.0, 12.0, 11.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.263671875, -2.174560546875, -2.08544921875, -1.996337890625, -1.9072265625, -1.818115234375, -1.72900390625, -1.639892578125, -1.55078125, -1.461669921875, -1.37255859375, -1.283447265625, -1.1943359375, -1.105224609375, -1.01611328125, -0.927001953125, -0.837890625, -0.748779296875, -0.65966796875, -0.570556640625, -0.4814453125, -0.392333984375, -0.30322265625, -0.214111328125, -0.125, -0.035888671875, 0.05322265625, 0.142333984375, 0.2314453125, 0.320556640625, 0.40966796875, 0.498779296875, 0.587890625, 0.677001953125, 0.76611328125, 0.855224609375, 0.9443359375, 1.033447265625, 1.12255859375, 1.211669921875, 1.30078125, 1.389892578125, 1.47900390625, 1.568115234375, 1.6572265625, 1.746337890625, 1.83544921875, 1.924560546875, 2.013671875, 2.102783203125, 2.19189453125, 2.281005859375, 2.3701171875, 2.459228515625, 2.54833984375, 2.637451171875, 2.7265625, 2.815673828125, 2.90478515625, 2.993896484375, 3.0830078125, 3.172119140625, 3.26123046875, 3.350341796875, 3.439453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 4.0, 5.0, 9.0, 8.0, 5.0, 14.0, 24.0, 18.0, 20.0, 23.0, 24.0, 33.0, 30.0, 29.0, 42.0, 39.0, 43.0, 43.0, 46.0, 44.0, 32.0, 39.0, 42.0, 43.0, 44.0, 32.0, 31.0, 30.0, 27.0, 27.0, 21.0, 18.0, 16.0, 17.0, 17.0, 10.0, 10.0, 4.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-8.140625, -7.91253662109375, -7.6844482421875, -7.45635986328125, -7.228271484375, -7.00018310546875, -6.7720947265625, -6.54400634765625, -6.31591796875, -6.08782958984375, -5.8597412109375, -5.63165283203125, -5.403564453125, -5.17547607421875, -4.9473876953125, -4.71929931640625, -4.4912109375, -4.26312255859375, -4.0350341796875, -3.80694580078125, -3.578857421875, -3.35076904296875, -3.1226806640625, -2.89459228515625, -2.66650390625, -2.43841552734375, -2.2103271484375, -1.98223876953125, -1.754150390625, -1.52606201171875, -1.2979736328125, -1.06988525390625, -0.841796875, -0.61370849609375, -0.3856201171875, -0.15753173828125, 0.070556640625, 0.29864501953125, 0.5267333984375, 0.75482177734375, 0.98291015625, 1.21099853515625, 1.4390869140625, 1.66717529296875, 1.895263671875, 2.12335205078125, 2.3514404296875, 2.57952880859375, 2.8076171875, 3.03570556640625, 3.2637939453125, 3.49188232421875, 3.719970703125, 3.94805908203125, 4.1761474609375, 4.40423583984375, 4.63232421875, 4.86041259765625, 5.0885009765625, 5.31658935546875, 5.544677734375, 5.77276611328125, 6.0008544921875, 6.22894287109375, 6.45703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 12.0, 12.0, 12.0, 25.0, 31.0, 42.0, 56.0, 71.0, 102.0, 132.0, 222.0, 432.0, 1308.0, 10681.0, 573857.0, 449960.0, 9307.0, 1126.0, 394.0, 209.0, 144.0, 92.0, 65.0, 47.0, 44.0, 36.0, 21.0, 28.0, 8.0, 13.0, 8.0, 2.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.34765625, -7.12481689453125, -6.9019775390625, -6.67913818359375, -6.456298828125, -6.23345947265625, -6.0106201171875, -5.78778076171875, -5.56494140625, -5.34210205078125, -5.1192626953125, -4.89642333984375, -4.673583984375, -4.45074462890625, -4.2279052734375, -4.00506591796875, -3.7822265625, -3.55938720703125, -3.3365478515625, -3.11370849609375, -2.890869140625, -2.66802978515625, -2.4451904296875, -2.22235107421875, -1.99951171875, -1.77667236328125, -1.5538330078125, -1.33099365234375, -1.108154296875, -0.88531494140625, -0.6624755859375, -0.43963623046875, -0.216796875, 0.00604248046875, 0.2288818359375, 0.45172119140625, 0.674560546875, 0.89739990234375, 1.1202392578125, 1.34307861328125, 1.56591796875, 1.78875732421875, 2.0115966796875, 2.23443603515625, 2.457275390625, 2.68011474609375, 2.9029541015625, 3.12579345703125, 3.3486328125, 3.57147216796875, 3.7943115234375, 4.01715087890625, 4.239990234375, 4.46282958984375, 4.6856689453125, 4.90850830078125, 5.13134765625, 5.35418701171875, 5.5770263671875, 5.79986572265625, 6.022705078125, 6.24554443359375, 6.4683837890625, 6.69122314453125, 6.9140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 9.0, 6.0, 5.0, 11.0, 12.0, 13.0, 16.0, 18.0, 21.0, 25.0, 28.0, 19.0, 39.0, 34.0, 29.0, 38.0, 26.0, 44.0, 35.0, 41.0, 54.0, 45.0, 41.0, 27.0, 42.0, 33.0, 29.0, 31.0, 30.0, 27.0, 24.0, 17.0, 16.0, 21.0, 16.0, 17.0, 12.0, 7.0, 9.0, 1.0, 6.0, 1.0, 6.0, 5.0, 2.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.3046875, -7.06494140625, -6.8251953125, -6.58544921875, -6.345703125, -6.10595703125, -5.8662109375, -5.62646484375, -5.38671875, -5.14697265625, -4.9072265625, -4.66748046875, -4.427734375, -4.18798828125, -3.9482421875, -3.70849609375, -3.46875, -3.22900390625, -2.9892578125, -2.74951171875, -2.509765625, -2.27001953125, -2.0302734375, -1.79052734375, -1.55078125, -1.31103515625, -1.0712890625, -0.83154296875, -0.591796875, -0.35205078125, -0.1123046875, 0.12744140625, 0.3671875, 0.60693359375, 0.8466796875, 1.08642578125, 1.326171875, 1.56591796875, 1.8056640625, 2.04541015625, 2.28515625, 2.52490234375, 2.7646484375, 3.00439453125, 3.244140625, 3.48388671875, 3.7236328125, 3.96337890625, 4.203125, 4.44287109375, 4.6826171875, 4.92236328125, 5.162109375, 5.40185546875, 5.6416015625, 5.88134765625, 6.12109375, 6.36083984375, 6.6005859375, 6.84033203125, 7.080078125, 7.31982421875, 7.5595703125, 7.79931640625, 8.0390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 11.0, 29.0, 39.0, 54.0, 119.0, 214.0, 420.0, 1152.0, 3624.0, 16163.0, 129794.0, 815705.0, 66841.0, 10125.0, 2531.0, 913.0, 365.0, 178.0, 103.0, 50.0, 26.0, 27.0, 21.0, 13.0, 8.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.818359375, -0.7904891967773438, -0.7626190185546875, -0.7347488403320312, -0.706878662109375, -0.6790084838867188, -0.6511383056640625, -0.6232681274414062, -0.59539794921875, -0.5675277709960938, -0.5396575927734375, -0.5117874145507812, -0.483917236328125, -0.45604705810546875, -0.4281768798828125, -0.40030670166015625, -0.3724365234375, -0.34456634521484375, -0.3166961669921875, -0.28882598876953125, -0.260955810546875, -0.23308563232421875, -0.2052154541015625, -0.17734527587890625, -0.14947509765625, -0.12160491943359375, -0.0937347412109375, -0.06586456298828125, -0.037994384765625, -0.01012420654296875, 0.0177459716796875, 0.04561614990234375, 0.073486328125, 0.10135650634765625, 0.1292266845703125, 0.15709686279296875, 0.184967041015625, 0.21283721923828125, 0.2407073974609375, 0.26857757568359375, 0.29644775390625, 0.32431793212890625, 0.3521881103515625, 0.38005828857421875, 0.407928466796875, 0.43579864501953125, 0.4636688232421875, 0.49153900146484375, 0.5194091796875, 0.5472793579101562, 0.5751495361328125, 0.6030197143554688, 0.630889892578125, 0.6587600708007812, 0.6866302490234375, 0.7145004272460938, 0.74237060546875, 0.7702407836914062, 0.7981109619140625, 0.8259811401367188, 0.853851318359375, 0.8817214965820312, 0.9095916748046875, 0.9374618530273438, 0.96533203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 4.0, 10.0, 3.0, 6.0, 23.0, 42.0, 41.0, 66.0, 121.0, 150.0, 182.0, 101.0, 77.0, 47.0, 30.0, 21.0, 14.0, 13.0, 11.0, 7.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011426210403442383, -0.00011033471673727036, -0.00010640732944011688, -0.00010247994214296341, -9.855255484580994e-05, -9.462516754865646e-05, -9.069778025150299e-05, -8.677039295434952e-05, -8.284300565719604e-05, -7.891561836004257e-05, -7.49882310628891e-05, -7.106084376573563e-05, -6.713345646858215e-05, -6.320606917142868e-05, -5.927868187427521e-05, -5.5351294577121735e-05, -5.142390727996826e-05, -4.749651998281479e-05, -4.3569132685661316e-05, -3.964174538850784e-05, -3.571435809135437e-05, -3.17869707942009e-05, -2.7859583497047424e-05, -2.393219619989395e-05, -2.000480890274048e-05, -1.6077421605587006e-05, -1.2150034308433533e-05, -8.22264701128006e-06, -4.295259714126587e-06, -3.67872416973114e-07, 3.559514880180359e-06, 7.486902177333832e-06, 1.1414289474487305e-05, 1.5341676771640778e-05, 1.926906406879425e-05, 2.3196451365947723e-05, 2.7123838663101196e-05, 3.105122596025467e-05, 3.497861325740814e-05, 3.8906000554561615e-05, 4.283338785171509e-05, 4.676077514886856e-05, 5.0688162446022034e-05, 5.4615549743175507e-05, 5.854293704032898e-05, 6.247032433748245e-05, 6.639771163463593e-05, 7.03250989317894e-05, 7.425248622894287e-05, 7.817987352609634e-05, 8.210726082324982e-05, 8.603464812040329e-05, 8.996203541755676e-05, 9.388942271471024e-05, 9.781681001186371e-05, 0.00010174419730901718, 0.00010567158460617065, 0.00010959897190332413, 0.0001135263592004776, 0.00011745374649763107, 0.00012138113379478455, 0.00012530852109193802, 0.0001292359083890915, 0.00013316329568624496, 0.00013709068298339844]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 8.0, 7.0, 15.0, 13.0, 25.0, 46.0, 56.0, 109.0, 204.0, 300.0, 692.0, 1510.0, 4056.0, 12234.0, 49897.0, 519401.0, 394488.0, 47036.0, 11734.0, 3774.0, 1459.0, 685.0, 315.0, 194.0, 106.0, 67.0, 34.0, 21.0, 20.0, 7.0, 10.0, 9.0, 3.0, 1.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65283203125, -0.6317596435546875, -0.610687255859375, -0.5896148681640625, -0.56854248046875, -0.5474700927734375, -0.526397705078125, -0.5053253173828125, -0.4842529296875, -0.4631805419921875, -0.442108154296875, -0.4210357666015625, -0.39996337890625, -0.3788909912109375, -0.357818603515625, -0.3367462158203125, -0.315673828125, -0.2946014404296875, -0.273529052734375, -0.2524566650390625, -0.23138427734375, -0.2103118896484375, -0.189239501953125, -0.1681671142578125, -0.1470947265625, -0.1260223388671875, -0.104949951171875, -0.0838775634765625, -0.06280517578125, -0.0417327880859375, -0.020660400390625, 0.0004119873046875, 0.021484375, 0.0425567626953125, 0.063629150390625, 0.0847015380859375, 0.10577392578125, 0.1268463134765625, 0.147918701171875, 0.1689910888671875, 0.1900634765625, 0.2111358642578125, 0.232208251953125, 0.2532806396484375, 0.27435302734375, 0.2954254150390625, 0.316497802734375, 0.3375701904296875, 0.358642578125, 0.3797149658203125, 0.400787353515625, 0.4218597412109375, 0.44293212890625, 0.4640045166015625, 0.485076904296875, 0.5061492919921875, 0.5272216796875, 0.5482940673828125, 0.569366455078125, 0.5904388427734375, 0.61151123046875, 0.6325836181640625, 0.653656005859375, 0.6747283935546875, 0.69580078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 6.0, 8.0, 10.0, 10.0, 6.0, 11.0, 21.0, 35.0, 43.0, 51.0, 46.0, 105.0, 175.0, 120.0, 71.0, 49.0, 52.0, 28.0, 21.0, 18.0, 21.0, 19.0, 6.0, 5.0, 6.0, 6.0, 7.0, 4.0, 5.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.264404296875, -0.2572002410888672, -0.24999618530273438, -0.24279212951660156, -0.23558807373046875, -0.22838401794433594, -0.22117996215820312, -0.2139759063720703, -0.2067718505859375, -0.1995677947998047, -0.19236373901367188, -0.18515968322753906, -0.17795562744140625, -0.17075157165527344, -0.16354751586914062, -0.1563434600830078, -0.149139404296875, -0.1419353485107422, -0.13473129272460938, -0.12752723693847656, -0.12032318115234375, -0.11311912536621094, -0.10591506958007812, -0.09871101379394531, -0.0915069580078125, -0.08430290222167969, -0.07709884643554688, -0.06989479064941406, -0.06269073486328125, -0.05548667907714844, -0.048282623291015625, -0.04107856750488281, -0.03387451171875, -0.026670455932617188, -0.019466400146484375, -0.012262344360351562, -0.00505828857421875, 0.0021457672119140625, 0.009349822998046875, 0.016553878784179688, 0.0237579345703125, 0.030961990356445312, 0.038166046142578125, 0.04537010192871094, 0.05257415771484375, 0.05977821350097656, 0.06698226928710938, 0.07418632507324219, 0.081390380859375, 0.08859443664550781, 0.09579849243164062, 0.10300254821777344, 0.11020660400390625, 0.11741065979003906, 0.12461471557617188, 0.1318187713623047, 0.1390228271484375, 0.1462268829345703, 0.15343093872070312, 0.16063499450683594, 0.16783905029296875, 0.17504310607910156, 0.18224716186523438, 0.1894512176513672, 0.1966552734375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 61.0, 320.0, 473.0, 126.0, 25.0, 6.0, 2.0], "bins": [-75.66742706298828, -74.3896484375, -73.11187744140625, -71.8341064453125, -70.55632781982422, -69.27854919433594, -68.00077819824219, -66.72300720214844, -65.44522857666016, -64.16744995117188, -62.889678955078125, -61.61190414428711, -60.334129333496094, -59.05635452270508, -57.77857971191406, -56.50080490112305, -55.22303009033203, -53.945255279541016, -52.66748046875, -51.389705657958984, -50.11193084716797, -48.83415603637695, -47.55638122558594, -46.27860641479492, -45.000831604003906, -43.72305679321289, -42.445281982421875, -41.16750717163086, -39.889732360839844, -38.61195755004883, -37.33418273925781, -36.0564079284668, -34.77863693237305, -33.50086212158203, -32.223087310791016, -30.9453125, -29.667537689208984, -28.38976287841797, -27.111988067626953, -25.834213256835938, -24.55643653869629, -23.278661727905273, -22.000886917114258, -20.723112106323242, -19.445337295532227, -18.16756248474121, -16.889787673950195, -15.61201286315918, -14.334238052368164, -13.056463241577148, -11.778688430786133, -10.500913619995117, -9.223138809204102, -7.945363998413086, -6.66758918762207, -5.389814376831055, -4.112040042877197, -2.8342652320861816, -1.556490421295166, -0.2787156105041504, 0.9990592002868652, 2.276834011077881, 3.5546088218688965, 4.832383632659912, 6.110158443450928]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 13.0, 9.0, 9.0, 11.0, 14.0, 16.0, 19.0, 30.0, 21.0, 18.0, 34.0, 27.0, 41.0, 29.0, 23.0, 42.0, 42.0, 30.0, 41.0, 34.0, 45.0, 39.0, 37.0, 32.0, 27.0, 38.0, 27.0, 28.0, 32.0, 20.0, 24.0, 29.0, 24.0, 16.0, 11.0, 10.0, 11.0, 9.0, 7.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.042387962341309, -10.688484191894531, -10.334579467773438, -9.98067569732666, -9.626770973205566, -9.272867202758789, -8.918962478637695, -8.565058708190918, -8.21115493774414, -7.857250690460205, -7.5033464431762695, -7.149442672729492, -6.795538425445557, -6.441634178161621, -6.0877299308776855, -5.73382568359375, -5.3799214363098145, -5.026017189025879, -4.672112941741943, -4.318208694458008, -3.9643049240112305, -3.610400676727295, -3.2564964294433594, -2.902592420578003, -2.5486881732940674, -2.194783926010132, -1.8408799171447754, -1.4869756698608398, -1.1330715417861938, -0.7791674137115479, -0.4252631664276123, -0.07135915756225586, 0.2825450897216797, 0.6364492177963257, 0.9903534054756165, 1.3442575931549072, 1.6981617212295532, 2.052065849304199, 2.4059700965881348, 2.759874105453491, 3.1137783527374268, 3.4676826000213623, 3.8215866088867188, 4.175490856170654, 4.52939510345459, 4.883298873901367, 5.237203598022461, 5.591107368469238, 5.945011615753174, 6.298915863037109, 6.652820110321045, 7.0067243576049805, 7.360628128051758, 7.714532375335693, 8.068436622619629, 8.422340393066406, 8.7762451171875, 9.130148887634277, 9.484053611755371, 9.837957382202148, 10.191862106323242, 10.54576587677002, 10.899669647216797, 11.25357437133789, 11.607478141784668]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 6.0, 8.0, 25.0, 27.0, 45.0, 69.0, 119.0, 214.0, 394.0, 828.0, 1715.0, 4468.0, 12219.0, 42664.0, 295240.0, 3206520.0, 542674.0, 61423.0, 15583.0, 5547.0, 2299.0, 1073.0, 520.0, 290.0, 129.0, 80.0, 37.0, 18.0, 15.0, 9.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.4765625, -5.3309326171875, -5.185302734375, -5.0396728515625, -4.89404296875, -4.7484130859375, -4.602783203125, -4.4571533203125, -4.3115234375, -4.1658935546875, -4.020263671875, -3.8746337890625, -3.72900390625, -3.5833740234375, -3.437744140625, -3.2921142578125, -3.146484375, -3.0008544921875, -2.855224609375, -2.7095947265625, -2.56396484375, -2.4183349609375, -2.272705078125, -2.1270751953125, -1.9814453125, -1.8358154296875, -1.690185546875, -1.5445556640625, -1.39892578125, -1.2532958984375, -1.107666015625, -0.9620361328125, -0.81640625, -0.6707763671875, -0.525146484375, -0.3795166015625, -0.23388671875, -0.0882568359375, 0.057373046875, 0.2030029296875, 0.3486328125, 0.4942626953125, 0.639892578125, 0.7855224609375, 0.93115234375, 1.0767822265625, 1.222412109375, 1.3680419921875, 1.513671875, 1.6593017578125, 1.804931640625, 1.9505615234375, 2.09619140625, 2.2418212890625, 2.387451171875, 2.5330810546875, 2.6787109375, 2.8243408203125, 2.969970703125, 3.1156005859375, 3.26123046875, 3.4068603515625, 3.552490234375, 3.6981201171875, 3.84375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 10.0, 14.0, 17.0, 26.0, 57.0, 51.0, 71.0, 69.0, 84.0, 94.0, 112.0, 91.0, 79.0, 75.0, 55.0, 33.0, 29.0, 15.0, 12.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.171875, -7.9898681640625, -7.807861328125, -7.6258544921875, -7.44384765625, -7.2618408203125, -7.079833984375, -6.8978271484375, -6.7158203125, -6.5338134765625, -6.351806640625, -6.1697998046875, -5.98779296875, -5.8057861328125, -5.623779296875, -5.4417724609375, -5.259765625, -5.0777587890625, -4.895751953125, -4.7137451171875, -4.53173828125, -4.3497314453125, -4.167724609375, -3.9857177734375, -3.8037109375, -3.6217041015625, -3.439697265625, -3.2576904296875, -3.07568359375, -2.8936767578125, -2.711669921875, -2.5296630859375, -2.34765625, -2.1656494140625, -1.983642578125, -1.8016357421875, -1.61962890625, -1.4376220703125, -1.255615234375, -1.0736083984375, -0.8916015625, -0.7095947265625, -0.527587890625, -0.3455810546875, -0.16357421875, 0.0184326171875, 0.200439453125, 0.3824462890625, 0.564453125, 0.7464599609375, 0.928466796875, 1.1104736328125, 1.29248046875, 1.4744873046875, 1.656494140625, 1.8385009765625, 2.0205078125, 2.2025146484375, 2.384521484375, 2.5665283203125, 2.74853515625, 2.9305419921875, 3.112548828125, 3.2945556640625, 3.4765625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 12.0, 28.0, 57.0, 145.0, 999.0, 4190117.0, 2634.0, 185.0, 63.0, 17.0, 12.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-87.5, -85.661865234375, -83.82373046875, -81.985595703125, -80.1474609375, -78.309326171875, -76.47119140625, -74.633056640625, -72.794921875, -70.956787109375, -69.11865234375, -67.280517578125, -65.4423828125, -63.604248046875, -61.76611328125, -59.927978515625, -58.08984375, -56.251708984375, -54.41357421875, -52.575439453125, -50.7373046875, -48.899169921875, -47.06103515625, -45.222900390625, -43.384765625, -41.546630859375, -39.70849609375, -37.870361328125, -36.0322265625, -34.194091796875, -32.35595703125, -30.517822265625, -28.6796875, -26.841552734375, -25.00341796875, -23.165283203125, -21.3271484375, -19.489013671875, -17.65087890625, -15.812744140625, -13.974609375, -12.136474609375, -10.29833984375, -8.460205078125, -6.6220703125, -4.783935546875, -2.94580078125, -1.107666015625, 0.73046875, 2.568603515625, 4.40673828125, 6.244873046875, 8.0830078125, 9.921142578125, 11.75927734375, 13.597412109375, 15.435546875, 17.273681640625, 19.11181640625, 20.949951171875, 22.7880859375, 24.626220703125, 26.46435546875, 28.302490234375, 30.140625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 6.0, 2.0, 11.0, 25.0, 31.0, 35.0, 49.0, 99.0, 145.0, 307.0, 674.0, 1305.0, 684.0, 302.0, 145.0, 89.0, 67.0, 38.0, 19.0, 14.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6435546875, -1.59130859375, -1.5390625, -1.48681640625, -1.4345703125, -1.38232421875, -1.330078125, -1.27783203125, -1.2255859375, -1.17333984375, -1.12109375, -1.06884765625, -1.0166015625, -0.96435546875, -0.912109375, -0.85986328125, -0.8076171875, -0.75537109375, -0.703125, -0.65087890625, -0.5986328125, -0.54638671875, -0.494140625, -0.44189453125, -0.3896484375, -0.33740234375, -0.28515625, -0.23291015625, -0.1806640625, -0.12841796875, -0.076171875, -0.02392578125, 0.0283203125, 0.08056640625, 0.1328125, 0.18505859375, 0.2373046875, 0.28955078125, 0.341796875, 0.39404296875, 0.4462890625, 0.49853515625, 0.55078125, 0.60302734375, 0.6552734375, 0.70751953125, 0.759765625, 0.81201171875, 0.8642578125, 0.91650390625, 0.96875, 1.02099609375, 1.0732421875, 1.12548828125, 1.177734375, 1.22998046875, 1.2822265625, 1.33447265625, 1.38671875, 1.43896484375, 1.4912109375, 1.54345703125, 1.595703125, 1.64794921875, 1.7001953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 13.0, 21.0, 29.0, 68.0, 119.0, 195.0, 178.0, 178.0, 101.0, 54.0, 28.0, 9.0, 11.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.76431655883789, -15.431965827941895, -15.099614143371582, -14.767263412475586, -14.434911727905273, -14.102560997009277, -13.770210266113281, -13.437858581542969, -13.105507850646973, -12.773157119750977, -12.440805435180664, -12.108454704284668, -11.776103973388672, -11.44375228881836, -11.111401557922363, -10.779050827026367, -10.446699142456055, -10.114348411560059, -9.781996726989746, -9.44964599609375, -9.117294311523438, -8.784943580627441, -8.452592849731445, -8.120241165161133, -7.787890434265137, -7.455539226531982, -7.123188018798828, -6.790837287902832, -6.458486080169678, -6.126134872436523, -5.793784141540527, -5.461432933807373, -5.129082679748535, -4.796731472015381, -4.464380264282227, -4.1320295333862305, -3.799678325653076, -3.467327117919922, -3.1349761486053467, -2.8026251792907715, -2.470273971557617, -2.137922763824463, -1.8055717945098877, -1.473220705986023, -1.1408696174621582, -0.8085185289382935, -0.4761674404144287, -0.14381647109985352, 0.18853473663330078, 0.5208858251571655, 0.8532369136810303, 1.185588002204895, 1.5179390907287598, 1.8502901792526245, 2.1826412677764893, 2.5149922370910645, 2.8473434448242188, 3.179694652557373, 3.5120456218719482, 3.8443965911865234, 4.176747798919678, 4.509099006652832, 4.841449737548828, 5.173800945281982, 5.506152153015137]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 5.0, 5.0, 5.0, 6.0, 6.0, 18.0, 15.0, 25.0, 26.0, 47.0, 32.0, 46.0, 40.0, 59.0, 54.0, 62.0, 69.0, 60.0, 67.0, 62.0, 61.0, 53.0, 54.0, 30.0, 23.0, 18.0, 18.0, 13.0, 10.0, 4.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.992746829986572, -4.8575592041015625, -4.722371578216553, -4.587183475494385, -4.451995849609375, -4.316808223724365, -4.1816205978393555, -4.046432971954346, -3.911245107650757, -3.776057481765747, -3.640869617462158, -3.5056819915771484, -3.3704943656921387, -3.23530650138855, -3.10011887550354, -2.964931011199951, -2.8297433853149414, -2.6945557594299316, -2.5593678951263428, -2.424180269241333, -2.288992404937744, -2.1538047790527344, -2.0186171531677246, -1.8834294080734253, -1.748241662979126, -1.6130539178848267, -1.4778661727905273, -1.3426785469055176, -1.2074908018112183, -1.072303056716919, -0.9371153712272644, -0.8019276857376099, -0.6667399406433105, -0.5315521955490112, -0.3963645100593567, -0.26117679476737976, -0.12598907947540283, 0.009198665618896484, 0.14438635110855103, 0.27957403659820557, 0.4147617816925049, 0.5499495267868042, 0.6851372122764587, 0.8203248977661133, 0.9555126428604126, 1.090700387954712, 1.2258880138397217, 1.361075758934021, 1.4962635040283203, 1.6314512491226196, 1.766638994216919, 1.9018266201019287, 2.0370144844055176, 2.1722021102905273, 2.307389736175537, 2.442577362060547, 2.5777652263641357, 2.7129528522491455, 2.8481407165527344, 2.983328342437744, 3.118515968322754, 3.2537038326263428, 3.3888914585113525, 3.5240793228149414, 3.659266948699951]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 8.0, 10.0, 18.0, 25.0, 39.0, 40.0, 72.0, 108.0, 149.0, 260.0, 467.0, 679.0, 1155.0, 1990.0, 3574.0, 6718.0, 14377.0, 36318.0, 114518.0, 378253.0, 333452.0, 97491.0, 31672.0, 12803.0, 6281.0, 3305.0, 1877.0, 1102.0, 657.0, 407.0, 258.0, 171.0, 99.0, 61.0, 40.0, 28.0, 29.0, 9.0, 12.0, 2.0, 5.0, 0.0, 3.0, 5.0, 1.0, 1.0, 5.0], "bins": [-1.2734375, -1.2389602661132812, -1.2044830322265625, -1.1700057983398438, -1.135528564453125, -1.1010513305664062, -1.0665740966796875, -1.0320968627929688, -0.99761962890625, -0.9631423950195312, -0.9286651611328125, -0.8941879272460938, -0.859710693359375, -0.8252334594726562, -0.7907562255859375, -0.7562789916992188, -0.7218017578125, -0.6873245239257812, -0.6528472900390625, -0.6183700561523438, -0.583892822265625, -0.5494155883789062, -0.5149383544921875, -0.48046112060546875, -0.44598388671875, -0.41150665283203125, -0.3770294189453125, -0.34255218505859375, -0.308074951171875, -0.27359771728515625, -0.2391204833984375, -0.20464324951171875, -0.170166015625, -0.13568878173828125, -0.1012115478515625, -0.06673431396484375, -0.032257080078125, 0.00222015380859375, 0.0366973876953125, 0.07117462158203125, 0.10565185546875, 0.14012908935546875, 0.1746063232421875, 0.20908355712890625, 0.243560791015625, 0.27803802490234375, 0.3125152587890625, 0.34699249267578125, 0.3814697265625, 0.41594696044921875, 0.4504241943359375, 0.48490142822265625, 0.519378662109375, 0.5538558959960938, 0.5883331298828125, 0.6228103637695312, 0.65728759765625, 0.6917648315429688, 0.7262420654296875, 0.7607192993164062, 0.795196533203125, 0.8296737670898438, 0.8641510009765625, 0.8986282348632812, 0.93310546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 4.0, 11.0, 12.0, 18.0, 39.0, 24.0, 41.0, 55.0, 60.0, 77.0, 70.0, 82.0, 88.0, 79.0, 66.0, 82.0, 60.0, 40.0, 29.0, 21.0, 13.0, 11.0, 10.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.46484375, -4.346405029296875, -4.22796630859375, -4.109527587890625, -3.9910888671875, -3.872650146484375, -3.75421142578125, -3.635772705078125, -3.517333984375, -3.398895263671875, -3.28045654296875, -3.162017822265625, -3.0435791015625, -2.925140380859375, -2.80670166015625, -2.688262939453125, -2.56982421875, -2.451385498046875, -2.33294677734375, -2.214508056640625, -2.0960693359375, -1.977630615234375, -1.85919189453125, -1.740753173828125, -1.622314453125, -1.503875732421875, -1.38543701171875, -1.266998291015625, -1.1485595703125, -1.030120849609375, -0.91168212890625, -0.793243408203125, -0.6748046875, -0.556365966796875, -0.43792724609375, -0.319488525390625, -0.2010498046875, -0.082611083984375, 0.03582763671875, 0.154266357421875, 0.272705078125, 0.391143798828125, 0.50958251953125, 0.628021240234375, 0.7464599609375, 0.864898681640625, 0.98333740234375, 1.101776123046875, 1.22021484375, 1.338653564453125, 1.45709228515625, 1.575531005859375, 1.6939697265625, 1.812408447265625, 1.93084716796875, 2.049285888671875, 2.167724609375, 2.286163330078125, 2.40460205078125, 2.523040771484375, 2.6414794921875, 2.759918212890625, 2.87835693359375, 2.996795654296875, 3.115234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 8.0, 6.0, 6.0, 7.0, 11.0, 11.0, 20.0, 16.0, 33.0, 57.0, 65.0, 122.0, 162.0, 261.0, 454.0, 770.0, 1418.0, 2752.0, 5952.0, 13823.0, 40045.0, 147418.0, 470631.0, 260065.0, 66986.0, 21064.0, 8371.0, 3673.0, 1810.0, 991.0, 565.0, 312.0, 213.0, 134.0, 98.0, 53.0, 40.0, 38.0, 29.0, 18.0, 6.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-0.9599609375, -0.9306106567382812, -0.9012603759765625, -0.8719100952148438, -0.842559814453125, -0.8132095336914062, -0.7838592529296875, -0.7545089721679688, -0.72515869140625, -0.6958084106445312, -0.6664581298828125, -0.6371078491210938, -0.607757568359375, -0.5784072875976562, -0.5490570068359375, -0.5197067260742188, -0.4903564453125, -0.46100616455078125, -0.4316558837890625, -0.40230560302734375, -0.372955322265625, -0.34360504150390625, -0.3142547607421875, -0.28490447998046875, -0.25555419921875, -0.22620391845703125, -0.1968536376953125, -0.16750335693359375, -0.138153076171875, -0.10880279541015625, -0.0794525146484375, -0.05010223388671875, -0.020751953125, 0.00859832763671875, 0.0379486083984375, 0.06729888916015625, 0.096649169921875, 0.12599945068359375, 0.1553497314453125, 0.18470001220703125, 0.21405029296875, 0.24340057373046875, 0.2727508544921875, 0.30210113525390625, 0.331451416015625, 0.36080169677734375, 0.3901519775390625, 0.41950225830078125, 0.4488525390625, 0.47820281982421875, 0.5075531005859375, 0.5369033813476562, 0.566253662109375, 0.5956039428710938, 0.6249542236328125, 0.6543045043945312, 0.68365478515625, 0.7130050659179688, 0.7423553466796875, 0.7717056274414062, 0.801055908203125, 0.8304061889648438, 0.8597564697265625, 0.8891067504882812, 0.91845703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 8.0, 7.0, 6.0, 8.0, 12.0, 15.0, 15.0, 19.0, 20.0, 29.0, 28.0, 29.0, 35.0, 42.0, 31.0, 38.0, 45.0, 38.0, 46.0, 32.0, 46.0, 49.0, 41.0, 38.0, 40.0, 34.0, 30.0, 26.0, 23.0, 27.0, 18.0, 14.0, 10.0, 11.0, 11.0, 13.0, 13.0, 12.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.4140625, -3.30328369140625, -3.1925048828125, -3.08172607421875, -2.970947265625, -2.86016845703125, -2.7493896484375, -2.63861083984375, -2.52783203125, -2.41705322265625, -2.3062744140625, -2.19549560546875, -2.084716796875, -1.97393798828125, -1.8631591796875, -1.75238037109375, -1.6416015625, -1.53082275390625, -1.4200439453125, -1.30926513671875, -1.198486328125, -1.08770751953125, -0.9769287109375, -0.86614990234375, -0.75537109375, -0.64459228515625, -0.5338134765625, -0.42303466796875, -0.312255859375, -0.20147705078125, -0.0906982421875, 0.02008056640625, 0.130859375, 0.24163818359375, 0.3524169921875, 0.46319580078125, 0.573974609375, 0.68475341796875, 0.7955322265625, 0.90631103515625, 1.01708984375, 1.12786865234375, 1.2386474609375, 1.34942626953125, 1.460205078125, 1.57098388671875, 1.6817626953125, 1.79254150390625, 1.9033203125, 2.01409912109375, 2.1248779296875, 2.23565673828125, 2.346435546875, 2.45721435546875, 2.5679931640625, 2.67877197265625, 2.78955078125, 2.90032958984375, 3.0111083984375, 3.12188720703125, 3.232666015625, 3.34344482421875, 3.4542236328125, 3.56500244140625, 3.67578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 18.0, 14.0, 26.0, 39.0, 71.0, 136.0, 160.0, 290.0, 474.0, 831.0, 1614.0, 3300.0, 7315.0, 18005.0, 56233.0, 257369.0, 532304.0, 117515.0, 31218.0, 11637.0, 4852.0, 2283.0, 1221.0, 693.0, 347.0, 219.0, 130.0, 74.0, 50.0, 35.0, 26.0, 15.0, 7.0, 4.0, 9.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.35498046875, -0.34430694580078125, -0.3336334228515625, -0.32295989990234375, -0.312286376953125, -0.30161285400390625, -0.2909393310546875, -0.28026580810546875, -0.26959228515625, -0.25891876220703125, -0.2482452392578125, -0.23757171630859375, -0.226898193359375, -0.21622467041015625, -0.2055511474609375, -0.19487762451171875, -0.1842041015625, -0.17353057861328125, -0.1628570556640625, -0.15218353271484375, -0.141510009765625, -0.13083648681640625, -0.1201629638671875, -0.10948944091796875, -0.09881591796875, -0.08814239501953125, -0.0774688720703125, -0.06679534912109375, -0.056121826171875, -0.04544830322265625, -0.0347747802734375, -0.02410125732421875, -0.013427734375, -0.00275421142578125, 0.0079193115234375, 0.01859283447265625, 0.029266357421875, 0.03993988037109375, 0.0506134033203125, 0.06128692626953125, 0.07196044921875, 0.08263397216796875, 0.0933074951171875, 0.10398101806640625, 0.114654541015625, 0.12532806396484375, 0.1360015869140625, 0.14667510986328125, 0.1573486328125, 0.16802215576171875, 0.1786956787109375, 0.18936920166015625, 0.200042724609375, 0.21071624755859375, 0.2213897705078125, 0.23206329345703125, 0.24273681640625, 0.25341033935546875, 0.2640838623046875, 0.27475738525390625, 0.285430908203125, 0.29610443115234375, 0.3067779541015625, 0.31745147705078125, 0.328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 4.0, 7.0, 12.0, 30.0, 25.0, 51.0, 91.0, 123.0, 155.0, 153.0, 112.0, 63.0, 43.0, 38.0, 17.0, 16.0, 12.0, 7.0, 8.0, 7.0, 7.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002105236053466797, -0.00019943341612815857, -0.00018834322690963745, -0.00017725303769111633, -0.00016616284847259521, -0.0001550726592540741, -0.00014398247003555298, -0.00013289228081703186, -0.00012180209159851074, -0.00011071190237998962, -9.96217131614685e-05, -8.853152394294739e-05, -7.744133472442627e-05, -6.635114550590515e-05, -5.526095628738403e-05, -4.4170767068862915e-05, -3.30805778503418e-05, -2.199038863182068e-05, -1.090019941329956e-05, 1.8998980522155762e-07, 1.1280179023742676e-05, 2.2370368242263794e-05, 3.346055746078491e-05, 4.455074667930603e-05, 5.564093589782715e-05, 6.673112511634827e-05, 7.782131433486938e-05, 8.89115035533905e-05, 0.00010000169277191162, 0.00011109188199043274, 0.00012218207120895386, 0.00013327226042747498, 0.0001443624496459961, 0.0001554526388645172, 0.00016654282808303833, 0.00017763301730155945, 0.00018872320652008057, 0.00019981339573860168, 0.0002109035849571228, 0.00022199377417564392, 0.00023308396339416504, 0.00024417415261268616, 0.0002552643418312073, 0.0002663545310497284, 0.0002774447202682495, 0.00028853490948677063, 0.00029962509870529175, 0.00031071528792381287, 0.000321805477142334, 0.0003328956663608551, 0.0003439858555793762, 0.00035507604479789734, 0.00036616623401641846, 0.0003772564232349396, 0.0003883466124534607, 0.0003994368016719818, 0.00041052699089050293, 0.00042161718010902405, 0.00043270736932754517, 0.0004437975585460663, 0.0004548877477645874, 0.0004659779369831085, 0.00047706812620162964, 0.00048815831542015076, 0.0004992485046386719]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 7.0, 11.0, 17.0, 10.0, 22.0, 14.0, 32.0, 51.0, 62.0, 99.0, 210.0, 426.0, 978.0, 2767.0, 10401.0, 98433.0, 860371.0, 62425.0, 8180.0, 2253.0, 853.0, 413.0, 186.0, 100.0, 59.0, 38.0, 31.0, 22.0, 10.0, 10.0, 11.0, 12.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8740234375, -0.8470687866210938, -0.8201141357421875, -0.7931594848632812, -0.766204833984375, -0.7392501831054688, -0.7122955322265625, -0.6853408813476562, -0.65838623046875, -0.6314315795898438, -0.6044769287109375, -0.5775222778320312, -0.550567626953125, -0.5236129760742188, -0.4966583251953125, -0.46970367431640625, -0.4427490234375, -0.41579437255859375, -0.3888397216796875, -0.36188507080078125, -0.334930419921875, -0.30797576904296875, -0.2810211181640625, -0.25406646728515625, -0.22711181640625, -0.20015716552734375, -0.1732025146484375, -0.14624786376953125, -0.119293212890625, -0.09233856201171875, -0.0653839111328125, -0.03842926025390625, -0.011474609375, 0.01548004150390625, 0.0424346923828125, 0.06938934326171875, 0.096343994140625, 0.12329864501953125, 0.1502532958984375, 0.17720794677734375, 0.20416259765625, 0.23111724853515625, 0.2580718994140625, 0.28502655029296875, 0.311981201171875, 0.33893585205078125, 0.3658905029296875, 0.39284515380859375, 0.4197998046875, 0.44675445556640625, 0.4737091064453125, 0.5006637573242188, 0.527618408203125, 0.5545730590820312, 0.5815277099609375, 0.6084823608398438, 0.63543701171875, 0.6623916625976562, 0.6893463134765625, 0.7163009643554688, 0.743255615234375, 0.7702102661132812, 0.7971649169921875, 0.8241195678710938, 0.85107421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 7.0, 9.0, 9.0, 22.0, 12.0, 17.0, 23.0, 42.0, 40.0, 49.0, 67.0, 72.0, 70.0, 105.0, 80.0, 79.0, 56.0, 49.0, 37.0, 31.0, 28.0, 21.0, 13.0, 9.0, 9.0, 6.0, 7.0, 5.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08489990234375, -0.08214282989501953, -0.07938575744628906, -0.0766286849975586, -0.07387161254882812, -0.07111454010009766, -0.06835746765136719, -0.06560039520263672, -0.06284332275390625, -0.06008625030517578, -0.05732917785644531, -0.054572105407714844, -0.051815032958984375, -0.049057960510253906, -0.04630088806152344, -0.04354381561279297, -0.0407867431640625, -0.03802967071533203, -0.03527259826660156, -0.032515525817871094, -0.029758453369140625, -0.027001380920410156, -0.024244308471679688, -0.02148723602294922, -0.01873016357421875, -0.01597309112548828, -0.013216018676757812, -0.010458946228027344, -0.007701873779296875, -0.004944801330566406, -0.0021877288818359375, 0.0005693435668945312, 0.003326416015625, 0.006083488464355469, 0.008840560913085938, 0.011597633361816406, 0.014354705810546875, 0.017111778259277344, 0.019868850708007812, 0.02262592315673828, 0.02538299560546875, 0.02814006805419922, 0.030897140502929688, 0.033654212951660156, 0.036411285400390625, 0.039168357849121094, 0.04192543029785156, 0.04468250274658203, 0.0474395751953125, 0.05019664764404297, 0.05295372009277344, 0.055710792541503906, 0.058467864990234375, 0.061224937438964844, 0.06398200988769531, 0.06673908233642578, 0.06949615478515625, 0.07225322723388672, 0.07501029968261719, 0.07776737213134766, 0.08052444458007812, 0.0832815170288086, 0.08603858947753906, 0.08879566192626953, 0.091552734375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 32.0, 44.0, 103.0, 234.0, 246.0, 189.0, 62.0, 46.0, 22.0, 7.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.347467422485352, -12.080865859985352, -11.814263343811035, -11.547661781311035, -11.281060218811035, -11.014457702636719, -10.747856140136719, -10.481254577636719, -10.214653015136719, -9.948051452636719, -9.681448936462402, -9.414847373962402, -9.148245811462402, -8.881643295288086, -8.615041732788086, -8.348440170288086, -8.08183765411377, -7.815235614776611, -7.548634052276611, -7.282032012939453, -7.015430450439453, -6.748828411102295, -6.482226371765137, -6.215624809265137, -5.9490227699279785, -5.68242073059082, -5.41581916809082, -5.149217128753662, -4.882615089416504, -4.616013526916504, -4.349411487579346, -4.0828094482421875, -3.8162078857421875, -3.5496060848236084, -3.2830042839050293, -3.016402244567871, -2.749800443649292, -2.483198642730713, -2.2165966033935547, -1.9499948024749756, -1.6833930015563965, -1.4167912006378174, -1.1501892805099487, -0.8835874199867249, -0.616985559463501, -0.3503837585449219, -0.08378183841705322, 0.18282008171081543, 0.44942188262939453, 0.7160237431526184, 0.9826256036758423, 1.249227523803711, 1.51582932472229, 1.7824311256408691, 2.0490331649780273, 2.3156349658966064, 2.5822367668151855, 2.8488385677337646, 3.1154403686523438, 3.382042407989502, 3.648644208908081, 3.91524600982666, 4.181848049163818, 4.448450088500977, 4.715051651000977]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 5.0, 7.0, 19.0, 23.0, 29.0, 43.0, 61.0, 45.0, 60.0, 80.0, 74.0, 91.0, 91.0, 74.0, 75.0, 66.0, 47.0, 22.0, 32.0, 15.0, 13.0, 8.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.14798641204834, -4.033320426940918, -3.918654203414917, -3.803987979888916, -3.689321994781494, -3.574655771255493, -3.459989547729492, -3.3453235626220703, -3.2306575775146484, -3.1159913539886475, -3.0013253688812256, -2.8866591453552246, -2.7719931602478027, -2.6573269367218018, -2.542660713195801, -2.427994728088379, -2.313328504562378, -2.198662281036377, -2.083996295928955, -1.969330072402954, -1.8546640872955322, -1.7399978637695312, -1.6253317594528198, -1.5106656551361084, -1.395999550819397, -1.2813334465026855, -1.1666673421859741, -1.0520012378692627, -0.9373350739479065, -0.8226689696311951, -0.7080028057098389, -0.5933367013931274, -0.4786708354949951, -0.3640047311782837, -0.24933859705924988, -0.13467246294021606, -0.02000635862350464, 0.09465974569320679, 0.209325909614563, 0.3239920139312744, 0.43865811824798584, 0.5533242225646973, 0.6679903268814087, 0.7826564908027649, 0.8973225951194763, 1.011988639831543, 1.126654863357544, 1.2413209676742554, 1.3559870719909668, 1.4706531763076782, 1.5853192806243896, 1.6999855041503906, 1.8146514892578125, 1.9293177127838135, 2.0439839363098145, 2.1586499214172363, 2.273315906524658, 2.387982130050659, 2.502648115158081, 2.617314338684082, 2.731980323791504, 2.846646547317505, 2.961312770843506, 3.0759787559509277, 3.1906449794769287]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 12.0, 8.0, 19.0, 24.0, 30.0, 48.0, 94.0, 124.0, 210.0, 366.0, 604.0, 991.0, 1683.0, 3011.0, 5455.0, 10718.0, 22240.0, 60584.0, 360490.0, 459299.0, 72454.0, 24917.0, 11353.0, 5982.0, 3225.0, 1883.0, 1032.0, 636.0, 382.0, 246.0, 131.0, 111.0, 60.0, 51.0, 27.0, 18.0, 4.0, 8.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-2.4140625, -2.34521484375, -2.2763671875, -2.20751953125, -2.138671875, -2.06982421875, -2.0009765625, -1.93212890625, -1.86328125, -1.79443359375, -1.7255859375, -1.65673828125, -1.587890625, -1.51904296875, -1.4501953125, -1.38134765625, -1.3125, -1.24365234375, -1.1748046875, -1.10595703125, -1.037109375, -0.96826171875, -0.8994140625, -0.83056640625, -0.76171875, -0.69287109375, -0.6240234375, -0.55517578125, -0.486328125, -0.41748046875, -0.3486328125, -0.27978515625, -0.2109375, -0.14208984375, -0.0732421875, -0.00439453125, 0.064453125, 0.13330078125, 0.2021484375, 0.27099609375, 0.33984375, 0.40869140625, 0.4775390625, 0.54638671875, 0.615234375, 0.68408203125, 0.7529296875, 0.82177734375, 0.890625, 0.95947265625, 1.0283203125, 1.09716796875, 1.166015625, 1.23486328125, 1.3037109375, 1.37255859375, 1.44140625, 1.51025390625, 1.5791015625, 1.64794921875, 1.716796875, 1.78564453125, 1.8544921875, 1.92333984375, 1.9921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 13.0, 12.0, 16.0, 20.0, 15.0, 29.0, 23.0, 34.0, 49.0, 25.0, 46.0, 52.0, 42.0, 61.0, 40.0, 47.0, 42.0, 52.0, 46.0, 45.0, 29.0, 39.0, 23.0, 34.0, 22.0, 17.0, 18.0, 10.0, 15.0, 7.0, 13.0, 9.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.63671875, -5.4742431640625, -5.311767578125, -5.1492919921875, -4.98681640625, -4.8243408203125, -4.661865234375, -4.4993896484375, -4.3369140625, -4.1744384765625, -4.011962890625, -3.8494873046875, -3.68701171875, -3.5245361328125, -3.362060546875, -3.1995849609375, -3.037109375, -2.8746337890625, -2.712158203125, -2.5496826171875, -2.38720703125, -2.2247314453125, -2.062255859375, -1.8997802734375, -1.7373046875, -1.5748291015625, -1.412353515625, -1.2498779296875, -1.08740234375, -0.9249267578125, -0.762451171875, -0.5999755859375, -0.4375, -0.2750244140625, -0.112548828125, 0.0499267578125, 0.21240234375, 0.3748779296875, 0.537353515625, 0.6998291015625, 0.8623046875, 1.0247802734375, 1.187255859375, 1.3497314453125, 1.51220703125, 1.6746826171875, 1.837158203125, 1.9996337890625, 2.162109375, 2.3245849609375, 2.487060546875, 2.6495361328125, 2.81201171875, 2.9744873046875, 3.136962890625, 3.2994384765625, 3.4619140625, 3.6243896484375, 3.786865234375, 3.9493408203125, 4.11181640625, 4.2742919921875, 4.436767578125, 4.5992431640625, 4.76171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 1.0, 9.0, 8.0, 6.0, 15.0, 16.0, 19.0, 15.0, 27.0, 32.0, 30.0, 29.0, 47.0, 46.0, 68.0, 78.0, 331.0, 8335.0, 1032146.0, 6557.0, 277.0, 95.0, 57.0, 38.0, 38.0, 46.0, 17.0, 27.0, 25.0, 20.0, 19.0, 22.0, 10.0, 7.0, 4.0, 6.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.5625, -18.0535888671875, -17.544677734375, -17.0357666015625, -16.52685546875, -16.0179443359375, -15.509033203125, -15.0001220703125, -14.4912109375, -13.9822998046875, -13.473388671875, -12.9644775390625, -12.45556640625, -11.9466552734375, -11.437744140625, -10.9288330078125, -10.419921875, -9.9110107421875, -9.402099609375, -8.8931884765625, -8.38427734375, -7.8753662109375, -7.366455078125, -6.8575439453125, -6.3486328125, -5.8397216796875, -5.330810546875, -4.8218994140625, -4.31298828125, -3.8040771484375, -3.295166015625, -2.7862548828125, -2.27734375, -1.7684326171875, -1.259521484375, -0.7506103515625, -0.24169921875, 0.2672119140625, 0.776123046875, 1.2850341796875, 1.7939453125, 2.3028564453125, 2.811767578125, 3.3206787109375, 3.82958984375, 4.3385009765625, 4.847412109375, 5.3563232421875, 5.865234375, 6.3741455078125, 6.883056640625, 7.3919677734375, 7.90087890625, 8.4097900390625, 8.918701171875, 9.4276123046875, 9.9365234375, 10.4454345703125, 10.954345703125, 11.4632568359375, 11.97216796875, 12.4810791015625, 12.989990234375, 13.4989013671875, 14.0078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 3.0, 8.0, 14.0, 5.0, 11.0, 16.0, 19.0, 19.0, 33.0, 25.0, 33.0, 23.0, 39.0, 35.0, 51.0, 48.0, 51.0, 54.0, 37.0, 38.0, 41.0, 51.0, 36.0, 35.0, 46.0, 34.0, 18.0, 29.0, 23.0, 18.0, 22.0, 20.0, 12.0, 11.0, 5.0, 8.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.6875, -6.50421142578125, -6.3209228515625, -6.13763427734375, -5.954345703125, -5.77105712890625, -5.5877685546875, -5.40447998046875, -5.22119140625, -5.03790283203125, -4.8546142578125, -4.67132568359375, -4.488037109375, -4.30474853515625, -4.1214599609375, -3.93817138671875, -3.7548828125, -3.57159423828125, -3.3883056640625, -3.20501708984375, -3.021728515625, -2.83843994140625, -2.6551513671875, -2.47186279296875, -2.28857421875, -2.10528564453125, -1.9219970703125, -1.73870849609375, -1.555419921875, -1.37213134765625, -1.1888427734375, -1.00555419921875, -0.822265625, -0.63897705078125, -0.4556884765625, -0.27239990234375, -0.089111328125, 0.09417724609375, 0.2774658203125, 0.46075439453125, 0.64404296875, 0.82733154296875, 1.0106201171875, 1.19390869140625, 1.377197265625, 1.56048583984375, 1.7437744140625, 1.92706298828125, 2.1103515625, 2.29364013671875, 2.4769287109375, 2.66021728515625, 2.843505859375, 3.02679443359375, 3.2100830078125, 3.39337158203125, 3.57666015625, 3.75994873046875, 3.9432373046875, 4.12652587890625, 4.309814453125, 4.49310302734375, 4.6763916015625, 4.85968017578125, 5.04296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 7.0, 13.0, 8.0, 20.0, 25.0, 37.0, 59.0, 93.0, 139.0, 222.0, 365.0, 657.0, 1382.0, 3288.0, 9069.0, 32897.0, 703880.0, 254593.0, 27883.0, 8064.0, 2946.0, 1283.0, 632.0, 351.0, 217.0, 134.0, 83.0, 60.0, 40.0, 20.0, 23.0, 13.0, 6.0, 11.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2958984375, -1.256561279296875, -1.21722412109375, -1.177886962890625, -1.1385498046875, -1.099212646484375, -1.05987548828125, -1.020538330078125, -0.981201171875, -0.941864013671875, -0.90252685546875, -0.863189697265625, -0.8238525390625, -0.784515380859375, -0.74517822265625, -0.705841064453125, -0.66650390625, -0.627166748046875, -0.58782958984375, -0.548492431640625, -0.5091552734375, -0.469818115234375, -0.43048095703125, -0.391143798828125, -0.351806640625, -0.312469482421875, -0.27313232421875, -0.233795166015625, -0.1944580078125, -0.155120849609375, -0.11578369140625, -0.076446533203125, -0.037109375, 0.002227783203125, 0.04156494140625, 0.080902099609375, 0.1202392578125, 0.159576416015625, 0.19891357421875, 0.238250732421875, 0.277587890625, 0.316925048828125, 0.35626220703125, 0.395599365234375, 0.4349365234375, 0.474273681640625, 0.51361083984375, 0.552947998046875, 0.59228515625, 0.631622314453125, 0.67095947265625, 0.710296630859375, 0.7496337890625, 0.788970947265625, 0.82830810546875, 0.867645263671875, 0.906982421875, 0.946319580078125, 0.98565673828125, 1.024993896484375, 1.0643310546875, 1.103668212890625, 1.14300537109375, 1.182342529296875, 1.2216796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 2.0, 5.0, 8.0, 22.0, 16.0, 23.0, 30.0, 55.0, 114.0, 236.0, 226.0, 83.0, 65.0, 25.0, 19.0, 13.0, 5.0, 8.0, 7.0, 3.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016188621520996094, -0.0001572445034980774, -0.00015260279178619385, -0.0001479610800743103, -0.00014331936836242676, -0.0001386776566505432, -0.00013403594493865967, -0.00012939423322677612, -0.00012475252151489258, -0.00012011080980300903, -0.00011546909809112549, -0.00011082738637924194, -0.0001061856746673584, -0.00010154396295547485, -9.690225124359131e-05, -9.226053953170776e-05, -8.761882781982422e-05, -8.297711610794067e-05, -7.833540439605713e-05, -7.369369268417358e-05, -6.905198097229004e-05, -6.44102692604065e-05, -5.976855754852295e-05, -5.5126845836639404e-05, -5.048513412475586e-05, -4.5843422412872314e-05, -4.120171070098877e-05, -3.6559998989105225e-05, -3.191828727722168e-05, -2.7276575565338135e-05, -2.263486385345459e-05, -1.7993152141571045e-05, -1.33514404296875e-05, -8.709728717803955e-06, -4.06801700592041e-06, 5.736947059631348e-07, 5.21540641784668e-06, 9.857118129730225e-06, 1.449882984161377e-05, 1.9140541553497314e-05, 2.378225326538086e-05, 2.8423964977264404e-05, 3.306567668914795e-05, 3.7707388401031494e-05, 4.234910011291504e-05, 4.6990811824798584e-05, 5.163252353668213e-05, 5.6274235248565674e-05, 6.091594696044922e-05, 6.555765867233276e-05, 7.019937038421631e-05, 7.484108209609985e-05, 7.94827938079834e-05, 8.412450551986694e-05, 8.876621723175049e-05, 9.340792894363403e-05, 9.804964065551758e-05, 0.00010269135236740112, 0.00010733306407928467, 0.00011197477579116821, 0.00011661648750305176, 0.0001212581992149353, 0.00012589991092681885, 0.0001305416226387024, 0.00013518333435058594]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 1.0, 6.0, 12.0, 13.0, 12.0, 19.0, 25.0, 56.0, 56.0, 85.0, 92.0, 167.0, 301.0, 444.0, 869.0, 1661.0, 3638.0, 9532.0, 32619.0, 288354.0, 655372.0, 36902.0, 10306.0, 3903.0, 1795.0, 905.0, 555.0, 294.0, 197.0, 119.0, 82.0, 55.0, 30.0, 19.0, 17.0, 12.0, 5.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.028076171875, -0.99267578125, -0.957275390625, -0.921875, -0.886474609375, -0.85107421875, -0.815673828125, -0.7802734375, -0.744873046875, -0.70947265625, -0.674072265625, -0.638671875, -0.603271484375, -0.56787109375, -0.532470703125, -0.4970703125, -0.461669921875, -0.42626953125, -0.390869140625, -0.35546875, -0.320068359375, -0.28466796875, -0.249267578125, -0.2138671875, -0.178466796875, -0.14306640625, -0.107666015625, -0.072265625, -0.036865234375, -0.00146484375, 0.033935546875, 0.0693359375, 0.104736328125, 0.14013671875, 0.175537109375, 0.2109375, 0.246337890625, 0.28173828125, 0.317138671875, 0.3525390625, 0.387939453125, 0.42333984375, 0.458740234375, 0.494140625, 0.529541015625, 0.56494140625, 0.600341796875, 0.6357421875, 0.671142578125, 0.70654296875, 0.741943359375, 0.77734375, 0.812744140625, 0.84814453125, 0.883544921875, 0.9189453125, 0.954345703125, 0.98974609375, 1.025146484375, 1.060546875, 1.095947265625, 1.13134765625, 1.166748046875, 1.2021484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 4.0, 9.0, 16.0, 14.0, 13.0, 20.0, 30.0, 44.0, 88.0, 400.0, 142.0, 55.0, 37.0, 35.0, 21.0, 10.0, 15.0, 8.0, 6.0, 2.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5880203247070312, -0.5715484619140625, -0.5550765991210938, -0.538604736328125, -0.5221328735351562, -0.5056610107421875, -0.48918914794921875, -0.47271728515625, -0.45624542236328125, -0.4397735595703125, -0.42330169677734375, -0.406829833984375, -0.39035797119140625, -0.3738861083984375, -0.35741424560546875, -0.3409423828125, -0.32447052001953125, -0.3079986572265625, -0.29152679443359375, -0.275054931640625, -0.25858306884765625, -0.2421112060546875, -0.22563934326171875, -0.20916748046875, -0.19269561767578125, -0.1762237548828125, -0.15975189208984375, -0.143280029296875, -0.12680816650390625, -0.1103363037109375, -0.09386444091796875, -0.077392578125, -0.06092071533203125, -0.0444488525390625, -0.02797698974609375, -0.011505126953125, 0.00496673583984375, 0.0214385986328125, 0.03791046142578125, 0.05438232421875, 0.07085418701171875, 0.0873260498046875, 0.10379791259765625, 0.120269775390625, 0.13674163818359375, 0.1532135009765625, 0.16968536376953125, 0.1861572265625, 0.20262908935546875, 0.2191009521484375, 0.23557281494140625, 0.252044677734375, 0.26851654052734375, 0.2849884033203125, 0.30146026611328125, 0.31793212890625, 0.33440399169921875, 0.3508758544921875, 0.36734771728515625, 0.383819580078125, 0.40029144287109375, 0.4167633056640625, 0.43323516845703125, 0.44970703125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 9.0, 26.0, 58.0, 167.0, 315.0, 254.0, 106.0, 41.0, 15.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.3998908996582, -32.76668167114258, -32.13346862792969, -31.500259399414062, -30.867048263549805, -30.233837127685547, -29.60062599182129, -28.96741485595703, -28.334205627441406, -27.70099449157715, -27.06778335571289, -26.434574127197266, -25.801362991333008, -25.16815185546875, -24.534940719604492, -23.901729583740234, -23.26852035522461, -22.63530921936035, -22.002098083496094, -21.36888885498047, -20.73567771911621, -20.102466583251953, -19.469255447387695, -18.836044311523438, -18.20283317565918, -17.569622039794922, -16.936410903930664, -16.30320167541504, -15.669990539550781, -15.036779403686523, -14.403568267822266, -13.770358085632324, -13.1371488571167, -12.503937721252441, -11.8707275390625, -11.237516403198242, -10.6043062210083, -9.971095085144043, -9.337884902954102, -8.704673767089844, -8.071462631225586, -7.438251972198486, -6.805041313171387, -6.171830177307129, -5.5386199951171875, -4.90540885925293, -4.27219820022583, -3.6389875411987305, -3.005777359008789, -2.3725666999816895, -1.7393559217453003, -1.1061451435089111, -0.4729344844818115, 0.16027617454528809, 0.7934870719909668, 1.4266977310180664, 2.059908390045166, 2.6931190490722656, 3.3263297080993652, 3.959540605545044, 4.592751502990723, 5.225961685180664, 5.859172821044922, 6.4923834800720215, 7.125594139099121]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 11.0, 14.0, 17.0, 17.0, 14.0, 17.0, 28.0, 24.0, 31.0, 41.0, 33.0, 36.0, 45.0, 52.0, 47.0, 48.0, 43.0, 53.0, 49.0, 47.0, 31.0, 47.0, 35.0, 35.0, 27.0, 29.0, 28.0, 15.0, 12.0, 16.0, 16.0, 9.0, 9.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.205902099609375, -9.90009593963623, -9.594289779663086, -9.288483619689941, -8.982677459716797, -8.676871299743652, -8.371065139770508, -8.065258979797363, -7.759452819824219, -7.453646659851074, -7.14784049987793, -6.842034339904785, -6.536228179931641, -6.230422019958496, -5.924615859985352, -5.618809700012207, -5.3130035400390625, -5.007197380065918, -4.701391220092773, -4.395585060119629, -4.089778900146484, -3.78397274017334, -3.4781665802001953, -3.172360420227051, -2.8665542602539062, -2.5607481002807617, -2.254941940307617, -1.9491357803344727, -1.6433296203613281, -1.3375234603881836, -1.031717300415039, -0.7259111404418945, -0.42010498046875, -0.11429882049560547, 0.19150733947753906, 0.4973134994506836, 0.8031196594238281, 1.1089258193969727, 1.4147319793701172, 1.7205381393432617, 2.0263442993164062, 2.332150459289551, 2.6379566192626953, 2.94376277923584, 3.2495689392089844, 3.555375099182129, 3.8611812591552734, 4.166987419128418, 4.4727935791015625, 4.778599739074707, 5.084405899047852, 5.390212059020996, 5.696018218994141, 6.001824378967285, 6.30763053894043, 6.613436698913574, 6.919242858886719, 7.225049018859863, 7.530855178833008, 7.836661338806152, 8.142467498779297, 8.448273658752441, 8.754079818725586, 9.05988597869873, 9.365692138671875]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 6.0, 5.0, 9.0, 10.0, 17.0, 9.0, 13.0, 25.0, 38.0, 34.0, 63.0, 113.0, 199.0, 330.0, 718.0, 1531.0, 4072.0, 13613.0, 70164.0, 1661647.0, 2336200.0, 82939.0, 14835.0, 4480.0, 1664.0, 701.0, 348.0, 171.0, 103.0, 81.0, 42.0, 32.0, 21.0, 13.0, 10.0, 5.0, 6.0, 12.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.52886962890625, -5.3507080078125, -5.17254638671875, -4.994384765625, -4.81622314453125, -4.6380615234375, -4.45989990234375, -4.28173828125, -4.10357666015625, -3.9254150390625, -3.74725341796875, -3.569091796875, -3.39093017578125, -3.2127685546875, -3.03460693359375, -2.8564453125, -2.67828369140625, -2.5001220703125, -2.32196044921875, -2.143798828125, -1.96563720703125, -1.7874755859375, -1.60931396484375, -1.43115234375, -1.25299072265625, -1.0748291015625, -0.89666748046875, -0.718505859375, -0.54034423828125, -0.3621826171875, -0.18402099609375, -0.005859375, 0.17230224609375, 0.3504638671875, 0.52862548828125, 0.706787109375, 0.88494873046875, 1.0631103515625, 1.24127197265625, 1.41943359375, 1.59759521484375, 1.7757568359375, 1.95391845703125, 2.132080078125, 2.31024169921875, 2.4884033203125, 2.66656494140625, 2.8447265625, 3.02288818359375, 3.2010498046875, 3.37921142578125, 3.557373046875, 3.73553466796875, 3.9136962890625, 4.09185791015625, 4.27001953125, 4.44818115234375, 4.6263427734375, 4.80450439453125, 4.982666015625, 5.16082763671875, 5.3389892578125, 5.51715087890625, 5.6953125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 4.0, 24.0, 24.0, 30.0, 35.0, 55.0, 60.0, 72.0, 81.0, 88.0, 87.0, 77.0, 110.0, 69.0, 49.0, 41.0, 20.0, 22.0, 14.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2109375, -5.073486328125, -4.93603515625, -4.798583984375, -4.6611328125, -4.523681640625, -4.38623046875, -4.248779296875, -4.111328125, -3.973876953125, -3.83642578125, -3.698974609375, -3.5615234375, -3.424072265625, -3.28662109375, -3.149169921875, -3.01171875, -2.874267578125, -2.73681640625, -2.599365234375, -2.4619140625, -2.324462890625, -2.18701171875, -2.049560546875, -1.912109375, -1.774658203125, -1.63720703125, -1.499755859375, -1.3623046875, -1.224853515625, -1.08740234375, -0.949951171875, -0.8125, -0.675048828125, -0.53759765625, -0.400146484375, -0.2626953125, -0.125244140625, 0.01220703125, 0.149658203125, 0.287109375, 0.424560546875, 0.56201171875, 0.699462890625, 0.8369140625, 0.974365234375, 1.11181640625, 1.249267578125, 1.38671875, 1.524169921875, 1.66162109375, 1.799072265625, 1.9365234375, 2.073974609375, 2.21142578125, 2.348876953125, 2.486328125, 2.623779296875, 2.76123046875, 2.898681640625, 3.0361328125, 3.173583984375, 3.31103515625, 3.448486328125, 3.5859375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 16.0, 50.0, 280.0, 18906.0, 4173348.0, 1513.0, 128.0, 27.0, 8.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.046875, -22.967529296875, -21.88818359375, -20.808837890625, -19.7294921875, -18.650146484375, -17.57080078125, -16.491455078125, -15.412109375, -14.332763671875, -13.25341796875, -12.174072265625, -11.0947265625, -10.015380859375, -8.93603515625, -7.856689453125, -6.77734375, -5.697998046875, -4.61865234375, -3.539306640625, -2.4599609375, -1.380615234375, -0.30126953125, 0.778076171875, 1.857421875, 2.936767578125, 4.01611328125, 5.095458984375, 6.1748046875, 7.254150390625, 8.33349609375, 9.412841796875, 10.4921875, 11.571533203125, 12.65087890625, 13.730224609375, 14.8095703125, 15.888916015625, 16.96826171875, 18.047607421875, 19.126953125, 20.206298828125, 21.28564453125, 22.364990234375, 23.4443359375, 24.523681640625, 25.60302734375, 26.682373046875, 27.76171875, 28.841064453125, 29.92041015625, 30.999755859375, 32.0791015625, 33.158447265625, 34.23779296875, 35.317138671875, 36.396484375, 37.475830078125, 38.55517578125, 39.634521484375, 40.7138671875, 41.793212890625, 42.87255859375, 43.951904296875, 45.03125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 8.0, 4.0, 7.0, 11.0, 12.0, 24.0, 34.0, 33.0, 44.0, 60.0, 121.0, 172.0, 305.0, 521.0, 1050.0, 669.0, 338.0, 206.0, 138.0, 99.0, 68.0, 27.0, 30.0, 22.0, 13.0, 12.0, 9.0, 9.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.2490997314453125, -1.214019775390625, -1.1789398193359375, -1.14385986328125, -1.1087799072265625, -1.073699951171875, -1.0386199951171875, -1.0035400390625, -0.9684600830078125, -0.933380126953125, -0.8983001708984375, -0.86322021484375, -0.8281402587890625, -0.793060302734375, -0.7579803466796875, -0.722900390625, -0.6878204345703125, -0.652740478515625, -0.6176605224609375, -0.58258056640625, -0.5475006103515625, -0.512420654296875, -0.4773406982421875, -0.4422607421875, -0.4071807861328125, -0.372100830078125, -0.3370208740234375, -0.30194091796875, -0.2668609619140625, -0.231781005859375, -0.1967010498046875, -0.16162109375, -0.1265411376953125, -0.091461181640625, -0.0563812255859375, -0.02130126953125, 0.0137786865234375, 0.048858642578125, 0.0839385986328125, 0.1190185546875, 0.1540985107421875, 0.189178466796875, 0.2242584228515625, 0.25933837890625, 0.2944183349609375, 0.329498291015625, 0.3645782470703125, 0.399658203125, 0.4347381591796875, 0.469818115234375, 0.5048980712890625, 0.53997802734375, 0.5750579833984375, 0.610137939453125, 0.6452178955078125, 0.6802978515625, 0.7153778076171875, 0.750457763671875, 0.7855377197265625, 0.82061767578125, 0.8556976318359375, 0.890777587890625, 0.9258575439453125, 0.9609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 11.0, 18.0, 30.0, 33.0, 62.0, 75.0, 121.0, 146.0, 135.0, 114.0, 85.0, 52.0, 46.0, 18.0, 9.0, 11.0, 6.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.353464126586914, -7.154359817504883, -6.955255508422852, -6.75615119934082, -6.557046890258789, -6.357943058013916, -6.158838748931885, -5.9597344398498535, -5.760630130767822, -5.561525821685791, -5.36242151260376, -5.1633172035217285, -4.9642133712768555, -4.765109062194824, -4.566004753112793, -4.366900444030762, -4.1677961349487305, -3.968691825866699, -3.769587516784668, -3.570483446121216, -3.3713791370391846, -3.1722748279571533, -2.973170757293701, -2.77406644821167, -2.5749621391296387, -2.3758578300476074, -2.176753520965576, -1.977649450302124, -1.7785451412200928, -1.5794408321380615, -1.3803366422653198, -1.1812324523925781, -0.9821276664733887, -0.7830234169960022, -0.5839191675186157, -0.38481491804122925, -0.18571066856384277, 0.013393580913543701, 0.21249783039093018, 0.4116020202636719, 0.6107063293457031, 0.8098105788230896, 1.008914828300476, 1.2080190181732178, 1.407123327255249, 1.6062276363372803, 1.805331826210022, 2.0044360160827637, 2.203540325164795, 2.402644634246826, 2.6017489433288574, 2.8008530139923096, 2.999957323074341, 3.199061632156372, 3.398165702819824, 3.5972700119018555, 3.7963743209838867, 3.995478630065918, 4.194582939147949, 4.3936872482299805, 4.592791557312012, 4.791895389556885, 4.990999698638916, 5.190104007720947, 5.3892083168029785]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 0.0, 4.0, 3.0, 13.0, 10.0, 14.0, 12.0, 25.0, 27.0, 39.0, 37.0, 37.0, 45.0, 46.0, 52.0, 70.0, 69.0, 61.0, 57.0, 51.0, 54.0, 45.0, 41.0, 41.0, 26.0, 28.0, 22.0, 18.0, 19.0, 10.0, 6.0, 4.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.372010707855225, -4.262429714202881, -4.152849197387695, -4.043268203735352, -3.933687448501587, -3.8241066932678223, -3.7145259380340576, -3.604945182800293, -3.4953644275665283, -3.3857836723327637, -3.276202917098999, -3.1666221618652344, -3.0570411682128906, -2.947460412979126, -2.8378796577453613, -2.7282989025115967, -2.618718147277832, -2.5091373920440674, -2.3995566368103027, -2.289975643157959, -2.1803948879241943, -2.0708141326904297, -1.961233377456665, -1.8516526222229004, -1.7420716285705566, -1.632490873336792, -1.5229099988937378, -1.4133292436599731, -1.3037484884262085, -1.1941676139831543, -1.0845868587493896, -0.975006103515625, -0.8654253482818604, -0.7558445334434509, -0.6462637782096863, -0.5366829633712769, -0.4271021783351898, -0.3175213932991028, -0.20794057846069336, -0.09835982322692871, 0.011220991611480713, 0.12080178409814835, 0.23038257658481598, 0.3399633765220642, 0.44954416155815125, 0.5591249465942383, 0.6687057614326477, 0.7782865166664124, 0.8878673315048218, 0.9974481463432312, 1.1070289611816406, 1.2166097164154053, 1.32619047164917, 1.4357712268829346, 1.5453521013259888, 1.6549328565597534, 1.7645137310028076, 1.8740944862365723, 1.9836753606796265, 2.0932559967041016, 2.2028369903564453, 2.31241774559021, 2.4219985008239746, 2.5315792560577393, 2.641160011291504]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 7.0, 10.0, 18.0, 17.0, 29.0, 52.0, 104.0, 231.0, 540.0, 1607.0, 5843.0, 32101.0, 465609.0, 498980.0, 34519.0, 6094.0, 1707.0, 635.0, 229.0, 98.0, 52.0, 23.0, 15.0, 10.0, 5.0, 4.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.224609375, -1.182403564453125, -1.14019775390625, -1.097991943359375, -1.0557861328125, -1.013580322265625, -0.97137451171875, -0.929168701171875, -0.886962890625, -0.844757080078125, -0.80255126953125, -0.760345458984375, -0.7181396484375, -0.675933837890625, -0.63372802734375, -0.591522216796875, -0.54931640625, -0.507110595703125, -0.46490478515625, -0.422698974609375, -0.3804931640625, -0.338287353515625, -0.29608154296875, -0.253875732421875, -0.211669921875, -0.169464111328125, -0.12725830078125, -0.085052490234375, -0.0428466796875, -0.000640869140625, 0.04156494140625, 0.083770751953125, 0.1259765625, 0.168182373046875, 0.21038818359375, 0.252593994140625, 0.2947998046875, 0.337005615234375, 0.37921142578125, 0.421417236328125, 0.463623046875, 0.505828857421875, 0.54803466796875, 0.590240478515625, 0.6324462890625, 0.674652099609375, 0.71685791015625, 0.759063720703125, 0.80126953125, 0.843475341796875, 0.88568115234375, 0.927886962890625, 0.9700927734375, 1.012298583984375, 1.05450439453125, 1.096710205078125, 1.138916015625, 1.181121826171875, 1.22332763671875, 1.265533447265625, 1.3077392578125, 1.349945068359375, 1.39215087890625, 1.434356689453125, 1.4765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 9.0, 14.0, 15.0, 25.0, 42.0, 33.0, 59.0, 79.0, 69.0, 88.0, 97.0, 93.0, 87.0, 75.0, 57.0, 57.0, 24.0, 26.0, 18.0, 10.0, 6.0, 6.0, 8.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.277313232421875, -4.17181396484375, -4.066314697265625, -3.9608154296875, -3.855316162109375, -3.74981689453125, -3.644317626953125, -3.538818359375, -3.433319091796875, -3.32781982421875, -3.222320556640625, -3.1168212890625, -3.011322021484375, -2.90582275390625, -2.800323486328125, -2.69482421875, -2.589324951171875, -2.48382568359375, -2.378326416015625, -2.2728271484375, -2.167327880859375, -2.06182861328125, -1.956329345703125, -1.850830078125, -1.745330810546875, -1.63983154296875, -1.534332275390625, -1.4288330078125, -1.323333740234375, -1.21783447265625, -1.112335205078125, -1.0068359375, -0.901336669921875, -0.79583740234375, -0.690338134765625, -0.5848388671875, -0.479339599609375, -0.37384033203125, -0.268341064453125, -0.162841796875, -0.057342529296875, 0.04815673828125, 0.153656005859375, 0.2591552734375, 0.364654541015625, 0.47015380859375, 0.575653076171875, 0.68115234375, 0.786651611328125, 0.89215087890625, 0.997650146484375, 1.1031494140625, 1.208648681640625, 1.31414794921875, 1.419647216796875, 1.525146484375, 1.630645751953125, 1.73614501953125, 1.841644287109375, 1.9471435546875, 2.052642822265625, 2.15814208984375, 2.263641357421875, 2.369140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 9.0, 9.0, 23.0, 33.0, 57.0, 84.0, 127.0, 228.0, 430.0, 881.0, 2146.0, 5343.0, 15867.0, 63566.0, 343031.0, 482565.0, 99776.0, 22375.0, 6983.0, 2690.0, 1174.0, 516.0, 255.0, 148.0, 104.0, 46.0, 21.0, 20.0, 11.0, 6.0, 5.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6122970581054688, -0.5932464599609375, -0.5741958618164062, -0.555145263671875, -0.5360946655273438, -0.5170440673828125, -0.49799346923828125, -0.47894287109375, -0.45989227294921875, -0.4408416748046875, -0.42179107666015625, -0.402740478515625, -0.38368988037109375, -0.3646392822265625, -0.34558868408203125, -0.3265380859375, -0.30748748779296875, -0.2884368896484375, -0.26938629150390625, -0.250335693359375, -0.23128509521484375, -0.2122344970703125, -0.19318389892578125, -0.17413330078125, -0.15508270263671875, -0.1360321044921875, -0.11698150634765625, -0.097930908203125, -0.07888031005859375, -0.0598297119140625, -0.04077911376953125, -0.021728515625, -0.00267791748046875, 0.0163726806640625, 0.03542327880859375, 0.054473876953125, 0.07352447509765625, 0.0925750732421875, 0.11162567138671875, 0.13067626953125, 0.14972686767578125, 0.1687774658203125, 0.18782806396484375, 0.206878662109375, 0.22592926025390625, 0.2449798583984375, 0.26403045654296875, 0.2830810546875, 0.30213165283203125, 0.3211822509765625, 0.34023284912109375, 0.359283447265625, 0.37833404541015625, 0.3973846435546875, 0.41643524169921875, 0.43548583984375, 0.45453643798828125, 0.4735870361328125, 0.49263763427734375, 0.511688232421875, 0.5307388305664062, 0.5497894287109375, 0.5688400268554688, 0.587890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 9.0, 9.0, 13.0, 13.0, 15.0, 26.0, 19.0, 36.0, 33.0, 41.0, 50.0, 46.0, 59.0, 70.0, 58.0, 61.0, 56.0, 55.0, 53.0, 47.0, 43.0, 35.0, 26.0, 36.0, 16.0, 17.0, 11.0, 14.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53515625, -3.4093017578125, -3.283447265625, -3.1575927734375, -3.03173828125, -2.9058837890625, -2.780029296875, -2.6541748046875, -2.5283203125, -2.4024658203125, -2.276611328125, -2.1507568359375, -2.02490234375, -1.8990478515625, -1.773193359375, -1.6473388671875, -1.521484375, -1.3956298828125, -1.269775390625, -1.1439208984375, -1.01806640625, -0.8922119140625, -0.766357421875, -0.6405029296875, -0.5146484375, -0.3887939453125, -0.262939453125, -0.1370849609375, -0.01123046875, 0.1146240234375, 0.240478515625, 0.3663330078125, 0.4921875, 0.6180419921875, 0.743896484375, 0.8697509765625, 0.99560546875, 1.1214599609375, 1.247314453125, 1.3731689453125, 1.4990234375, 1.6248779296875, 1.750732421875, 1.8765869140625, 2.00244140625, 2.1282958984375, 2.254150390625, 2.3800048828125, 2.505859375, 2.6317138671875, 2.757568359375, 2.8834228515625, 3.00927734375, 3.1351318359375, 3.260986328125, 3.3868408203125, 3.5126953125, 3.6385498046875, 3.764404296875, 3.8902587890625, 4.01611328125, 4.1419677734375, 4.267822265625, 4.3936767578125, 4.51953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 20.0, 25.0, 37.0, 66.0, 91.0, 152.0, 271.0, 517.0, 891.0, 1761.0, 3407.0, 7594.0, 20829.0, 75326.0, 378474.0, 431378.0, 88468.0, 22913.0, 8504.0, 3674.0, 1885.0, 1026.0, 507.0, 274.0, 153.0, 104.0, 65.0, 38.0, 33.0, 19.0, 12.0, 7.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.22216796875, -0.21632957458496094, -0.21049118041992188, -0.2046527862548828, -0.19881439208984375, -0.1929759979248047, -0.18713760375976562, -0.18129920959472656, -0.1754608154296875, -0.16962242126464844, -0.16378402709960938, -0.1579456329345703, -0.15210723876953125, -0.1462688446044922, -0.14043045043945312, -0.13459205627441406, -0.128753662109375, -0.12291526794433594, -0.11707687377929688, -0.11123847961425781, -0.10540008544921875, -0.09956169128417969, -0.09372329711914062, -0.08788490295410156, -0.0820465087890625, -0.07620811462402344, -0.07036972045898438, -0.06453132629394531, -0.05869293212890625, -0.05285453796386719, -0.047016143798828125, -0.04117774963378906, -0.03533935546875, -0.029500961303710938, -0.023662567138671875, -0.017824172973632812, -0.01198577880859375, -0.0061473846435546875, -0.000308990478515625, 0.0055294036865234375, 0.0113677978515625, 0.017206192016601562, 0.023044586181640625, 0.028882980346679688, 0.03472137451171875, 0.04055976867675781, 0.046398162841796875, 0.05223655700683594, 0.058074951171875, 0.06391334533691406, 0.06975173950195312, 0.07559013366699219, 0.08142852783203125, 0.08726692199707031, 0.09310531616210938, 0.09894371032714844, 0.1047821044921875, 0.11062049865722656, 0.11645889282226562, 0.12229728698730469, 0.12813568115234375, 0.1339740753173828, 0.13981246948242188, 0.14565086364746094, 0.1514892578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 9.0, 19.0, 25.0, 33.0, 41.0, 70.0, 101.0, 102.0, 132.0, 120.0, 91.0, 70.0, 52.0, 35.0, 25.0, 19.0, 15.0, 4.0, 4.0, 9.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011783838272094727, -0.00011319946497678757, -0.00010856054723262787, -0.00010392162948846817, -9.928271174430847e-05, -9.464379400014877e-05, -9.000487625598907e-05, -8.536595851182938e-05, -8.072704076766968e-05, -7.608812302350998e-05, -7.144920527935028e-05, -6.681028753519058e-05, -6.217136979103088e-05, -5.7532452046871185e-05, -5.289353430271149e-05, -4.825461655855179e-05, -4.361569881439209e-05, -3.897678107023239e-05, -3.433786332607269e-05, -2.9698945581912994e-05, -2.5060027837753296e-05, -2.0421110093593597e-05, -1.57821923494339e-05, -1.11432746052742e-05, -6.504356861114502e-06, -1.8654391169548035e-06, 2.773478627204895e-06, 7.4123963713645935e-06, 1.2051314115524292e-05, 1.669023185968399e-05, 2.132914960384369e-05, 2.5968067348003387e-05, 3.0606985092163086e-05, 3.5245902836322784e-05, 3.988482058048248e-05, 4.452373832464218e-05, 4.916265606880188e-05, 5.380157381296158e-05, 5.844049155712128e-05, 6.307940930128098e-05, 6.771832704544067e-05, 7.235724478960037e-05, 7.699616253376007e-05, 8.163508027791977e-05, 8.627399802207947e-05, 9.091291576623917e-05, 9.555183351039886e-05, 0.00010019075125455856, 0.00010482966899871826, 0.00010946858674287796, 0.00011410750448703766, 0.00011874642223119736, 0.00012338533997535706, 0.00012802425771951675, 0.00013266317546367645, 0.00013730209320783615, 0.00014194101095199585, 0.00014657992869615555, 0.00015121884644031525, 0.00015585776418447495, 0.00016049668192863464, 0.00016513559967279434, 0.00016977451741695404, 0.00017441343516111374, 0.00017905235290527344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 13.0, 4.0, 14.0, 12.0, 15.0, 23.0, 36.0, 67.0, 66.0, 137.0, 188.0, 366.0, 647.0, 1184.0, 2266.0, 4590.0, 10643.0, 29567.0, 108000.0, 451810.0, 327216.0, 73766.0, 21596.0, 8270.0, 3830.0, 1847.0, 956.0, 546.0, 320.0, 180.0, 126.0, 74.0, 54.0, 40.0, 23.0, 10.0, 12.0, 9.0, 12.0, 7.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166259765625, -0.16049957275390625, -0.1547393798828125, -0.14897918701171875, -0.143218994140625, -0.13745880126953125, -0.1316986083984375, -0.12593841552734375, -0.12017822265625, -0.11441802978515625, -0.1086578369140625, -0.10289764404296875, -0.097137451171875, -0.09137725830078125, -0.0856170654296875, -0.07985687255859375, -0.0740966796875, -0.06833648681640625, -0.0625762939453125, -0.05681610107421875, -0.051055908203125, -0.04529571533203125, -0.0395355224609375, -0.03377532958984375, -0.02801513671875, -0.02225494384765625, -0.0164947509765625, -0.01073455810546875, -0.004974365234375, 0.00078582763671875, 0.0065460205078125, 0.01230621337890625, 0.01806640625, 0.02382659912109375, 0.0295867919921875, 0.03534698486328125, 0.041107177734375, 0.04686737060546875, 0.0526275634765625, 0.05838775634765625, 0.06414794921875, 0.06990814208984375, 0.0756683349609375, 0.08142852783203125, 0.087188720703125, 0.09294891357421875, 0.0987091064453125, 0.10446929931640625, 0.1102294921875, 0.11598968505859375, 0.1217498779296875, 0.12751007080078125, 0.133270263671875, 0.13903045654296875, 0.1447906494140625, 0.15055084228515625, 0.15631103515625, 0.16207122802734375, 0.1678314208984375, 0.17359161376953125, 0.179351806640625, 0.18511199951171875, 0.1908721923828125, 0.19663238525390625, 0.202392578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 12.0, 12.0, 22.0, 10.0, 18.0, 38.0, 42.0, 39.0, 56.0, 82.0, 86.0, 94.0, 93.0, 80.0, 69.0, 63.0, 47.0, 38.0, 22.0, 21.0, 14.0, 9.0, 9.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037109375, -0.03561687469482422, -0.03412437438964844, -0.032631874084472656, -0.031139373779296875, -0.029646873474121094, -0.028154373168945312, -0.02666187286376953, -0.02516937255859375, -0.02367687225341797, -0.022184371948242188, -0.020691871643066406, -0.019199371337890625, -0.017706871032714844, -0.016214370727539062, -0.014721870422363281, -0.0132293701171875, -0.011736869812011719, -0.010244369506835938, -0.008751869201660156, -0.007259368896484375, -0.005766868591308594, -0.0042743682861328125, -0.0027818679809570312, -0.00128936767578125, 0.00020313262939453125, 0.0016956329345703125, 0.0031881332397460938, 0.004680633544921875, 0.006173133850097656, 0.0076656341552734375, 0.009158134460449219, 0.010650634765625, 0.012143135070800781, 0.013635635375976562, 0.015128135681152344, 0.016620635986328125, 0.018113136291503906, 0.019605636596679688, 0.02109813690185547, 0.02259063720703125, 0.02408313751220703, 0.025575637817382812, 0.027068138122558594, 0.028560638427734375, 0.030053138732910156, 0.03154563903808594, 0.03303813934326172, 0.0345306396484375, 0.03602313995361328, 0.03751564025878906, 0.039008140563964844, 0.040500640869140625, 0.041993141174316406, 0.04348564147949219, 0.04497814178466797, 0.04647064208984375, 0.04796314239501953, 0.04945564270019531, 0.050948143005371094, 0.052440643310546875, 0.053933143615722656, 0.05542564392089844, 0.05691814422607422, 0.05841064453125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 10.0, 7.0, 19.0, 26.0, 39.0, 66.0, 94.0, 175.0, 165.0, 137.0, 104.0, 72.0, 31.0, 17.0, 10.0, 8.0, 7.0, 4.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.084479808807373, -4.936653137207031, -4.7888264656066895, -4.641000270843506, -4.493173599243164, -4.345346927642822, -4.1975202560424805, -4.049693584442139, -3.901867151260376, -3.754040479660034, -3.6062140464782715, -3.4583873748779297, -3.310560703277588, -3.162734270095825, -3.0149075984954834, -2.8670811653137207, -2.719254493713379, -2.571427822113037, -2.4236013889312744, -2.2757747173309326, -2.12794828414917, -1.9801216125488281, -1.8322949409484863, -1.684468388557434, -1.5366418361663818, -1.3888152837753296, -1.2409887313842773, -1.0931620597839355, -0.9453355073928833, -0.797508955001831, -0.649682343006134, -0.501855731010437, -0.35402917861938477, -0.20620259642601013, -0.0583760142326355, 0.08945056796073914, 0.23727715015411377, 0.385103702545166, 0.532930314540863, 0.6807569265365601, 0.8285834789276123, 0.9764100313186646, 1.1242365837097168, 1.2720632553100586, 1.4198898077011108, 1.567716360092163, 1.7155430316925049, 1.8633695840835571, 2.0111961364746094, 2.159022808074951, 2.306849241256714, 2.4546759128570557, 2.6025023460388184, 2.75032901763916, 2.898155689239502, 3.0459823608398438, 3.1938087940216064, 3.3416354656219482, 3.489461898803711, 3.6372885704040527, 3.7851152420043945, 3.9329416751861572, 4.08076810836792, 4.228594779968262, 4.3764214515686035]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 17.0, 13.0, 22.0, 28.0, 39.0, 51.0, 50.0, 51.0, 68.0, 85.0, 95.0, 68.0, 79.0, 62.0, 55.0, 55.0, 35.0, 33.0, 22.0, 22.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4835197925567627, -3.3976821899414062, -3.31184458732605, -3.2260069847106934, -3.140169620513916, -3.0543320178985596, -2.968494415283203, -2.8826568126678467, -2.7968192100524902, -2.710981607437134, -2.6251440048217773, -2.539306640625, -2.4534690380096436, -2.367631435394287, -2.2817938327789307, -2.195956230163574, -2.110118865966797, -2.0242812633514404, -1.9384437799453735, -1.852606177330017, -1.7667686939239502, -1.6809310913085938, -1.5950934886932373, -1.5092558860778809, -1.423418402671814, -1.3375808000564575, -1.2517433166503906, -1.1659057140350342, -1.0800681114196777, -0.9942306280136108, -0.9083930253982544, -0.8225554823875427, -0.7367181777954102, -0.6508806347846985, -0.5650430917739868, -0.47920548915863037, -0.3933679461479187, -0.30753040313720703, -0.22169280052185059, -0.13585525751113892, -0.050017714500427246, 0.03581984341144562, 0.12165740132331848, 0.20749497413635254, 0.2933325171470642, 0.3791700601577759, 0.4650076627731323, 0.550845205783844, 0.6366827487945557, 0.7225202918052673, 0.808357834815979, 0.8941954374313354, 0.9800329804420471, 1.0658705234527588, 1.1517081260681152, 1.2375457286834717, 1.3233832120895386, 1.409220814704895, 1.495058298110962, 1.5808959007263184, 1.6667335033416748, 1.7525709867477417, 1.8384085893630981, 1.924246072769165, 2.0100836753845215]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 8.0, 14.0, 22.0, 42.0, 65.0, 157.0, 244.0, 519.0, 1053.0, 2354.0, 6112.0, 19030.0, 79613.0, 644098.0, 238707.0, 38524.0, 11053.0, 3887.0, 1583.0, 687.0, 370.0, 178.0, 88.0, 51.0, 29.0, 22.0, 9.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.19921875, -3.09173583984375, -2.9842529296875, -2.87677001953125, -2.769287109375, -2.66180419921875, -2.5543212890625, -2.44683837890625, -2.33935546875, -2.23187255859375, -2.1243896484375, -2.01690673828125, -1.909423828125, -1.80194091796875, -1.6944580078125, -1.58697509765625, -1.4794921875, -1.37200927734375, -1.2645263671875, -1.15704345703125, -1.049560546875, -0.94207763671875, -0.8345947265625, -0.72711181640625, -0.61962890625, -0.51214599609375, -0.4046630859375, -0.29718017578125, -0.189697265625, -0.08221435546875, 0.0252685546875, 0.13275146484375, 0.240234375, 0.34771728515625, 0.4552001953125, 0.56268310546875, 0.670166015625, 0.77764892578125, 0.8851318359375, 0.99261474609375, 1.10009765625, 1.20758056640625, 1.3150634765625, 1.42254638671875, 1.530029296875, 1.63751220703125, 1.7449951171875, 1.85247802734375, 1.9599609375, 2.06744384765625, 2.1749267578125, 2.28240966796875, 2.389892578125, 2.49737548828125, 2.6048583984375, 2.71234130859375, 2.81982421875, 2.92730712890625, 3.0347900390625, 3.14227294921875, 3.249755859375, 3.35723876953125, 3.4647216796875, 3.57220458984375, 3.6796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 4.0, 8.0, 11.0, 11.0, 14.0, 10.0, 32.0, 23.0, 33.0, 35.0, 43.0, 70.0, 60.0, 57.0, 78.0, 56.0, 54.0, 71.0, 41.0, 49.0, 49.0, 39.0, 34.0, 21.0, 22.0, 18.0, 13.0, 7.0, 5.0, 12.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-6.9296875, -6.764923095703125, -6.60015869140625, -6.435394287109375, -6.2706298828125, -6.105865478515625, -5.94110107421875, -5.776336669921875, -5.611572265625, -5.446807861328125, -5.28204345703125, -5.117279052734375, -4.9525146484375, -4.787750244140625, -4.62298583984375, -4.458221435546875, -4.29345703125, -4.128692626953125, -3.96392822265625, -3.799163818359375, -3.6343994140625, -3.469635009765625, -3.30487060546875, -3.140106201171875, -2.975341796875, -2.810577392578125, -2.64581298828125, -2.481048583984375, -2.3162841796875, -2.151519775390625, -1.98675537109375, -1.821990966796875, -1.6572265625, -1.492462158203125, -1.32769775390625, -1.162933349609375, -0.9981689453125, -0.833404541015625, -0.66864013671875, -0.503875732421875, -0.339111328125, -0.174346923828125, -0.00958251953125, 0.155181884765625, 0.3199462890625, 0.484710693359375, 0.64947509765625, 0.814239501953125, 0.97900390625, 1.143768310546875, 1.30853271484375, 1.473297119140625, 1.6380615234375, 1.802825927734375, 1.96759033203125, 2.132354736328125, 2.297119140625, 2.461883544921875, 2.62664794921875, 2.791412353515625, 2.9561767578125, 3.120941162109375, 3.28570556640625, 3.450469970703125, 3.615234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 12.0, 12.0, 14.0, 14.0, 16.0, 22.0, 21.0, 21.0, 25.0, 26.0, 27.0, 24.0, 33.0, 41.0, 47.0, 88.0, 342.0, 5564.0, 915583.0, 123997.0, 1963.0, 218.0, 76.0, 38.0, 30.0, 25.0, 20.0, 33.0, 26.0, 16.0, 20.0, 19.0, 18.0, 15.0, 14.0, 8.0, 11.0, 9.0, 8.0, 10.0, 10.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.0078125, -9.67236328125, -9.3369140625, -9.00146484375, -8.666015625, -8.33056640625, -7.9951171875, -7.65966796875, -7.32421875, -6.98876953125, -6.6533203125, -6.31787109375, -5.982421875, -5.64697265625, -5.3115234375, -4.97607421875, -4.640625, -4.30517578125, -3.9697265625, -3.63427734375, -3.298828125, -2.96337890625, -2.6279296875, -2.29248046875, -1.95703125, -1.62158203125, -1.2861328125, -0.95068359375, -0.615234375, -0.27978515625, 0.0556640625, 0.39111328125, 0.7265625, 1.06201171875, 1.3974609375, 1.73291015625, 2.068359375, 2.40380859375, 2.7392578125, 3.07470703125, 3.41015625, 3.74560546875, 4.0810546875, 4.41650390625, 4.751953125, 5.08740234375, 5.4228515625, 5.75830078125, 6.09375, 6.42919921875, 6.7646484375, 7.10009765625, 7.435546875, 7.77099609375, 8.1064453125, 8.44189453125, 8.77734375, 9.11279296875, 9.4482421875, 9.78369140625, 10.119140625, 10.45458984375, 10.7900390625, 11.12548828125, 11.4609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 13.0, 21.0, 20.0, 17.0, 12.0, 21.0, 30.0, 23.0, 21.0, 27.0, 29.0, 27.0, 42.0, 34.0, 37.0, 43.0, 42.0, 44.0, 38.0, 31.0, 50.0, 24.0, 27.0, 24.0, 22.0, 34.0, 22.0, 22.0, 19.0, 23.0, 20.0, 17.0, 13.0, 6.0, 10.0, 14.0, 8.0, 11.0, 5.0, 10.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.630859375, -3.502593994140625, -3.37432861328125, -3.246063232421875, -3.1177978515625, -2.989532470703125, -2.86126708984375, -2.733001708984375, -2.604736328125, -2.476470947265625, -2.34820556640625, -2.219940185546875, -2.0916748046875, -1.963409423828125, -1.83514404296875, -1.706878662109375, -1.57861328125, -1.450347900390625, -1.32208251953125, -1.193817138671875, -1.0655517578125, -0.937286376953125, -0.80902099609375, -0.680755615234375, -0.552490234375, -0.424224853515625, -0.29595947265625, -0.167694091796875, -0.0394287109375, 0.088836669921875, 0.21710205078125, 0.345367431640625, 0.4736328125, 0.601898193359375, 0.73016357421875, 0.858428955078125, 0.9866943359375, 1.114959716796875, 1.24322509765625, 1.371490478515625, 1.499755859375, 1.628021240234375, 1.75628662109375, 1.884552001953125, 2.0128173828125, 2.141082763671875, 2.26934814453125, 2.397613525390625, 2.52587890625, 2.654144287109375, 2.78240966796875, 2.910675048828125, 3.0389404296875, 3.167205810546875, 3.29547119140625, 3.423736572265625, 3.552001953125, 3.680267333984375, 3.80853271484375, 3.936798095703125, 4.0650634765625, 4.193328857421875, 4.32159423828125, 4.449859619140625, 4.578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 7.0, 21.0, 24.0, 35.0, 85.0, 145.0, 298.0, 627.0, 1408.0, 4508.0, 20673.0, 259957.0, 711070.0, 39692.0, 6552.0, 1915.0, 751.0, 331.0, 154.0, 98.0, 55.0, 40.0, 23.0, 19.0, 8.0, 12.0, 2.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1396484375, -1.0904388427734375, -1.041229248046875, -0.9920196533203125, -0.94281005859375, -0.8936004638671875, -0.844390869140625, -0.7951812744140625, -0.7459716796875, -0.6967620849609375, -0.647552490234375, -0.5983428955078125, -0.54913330078125, -0.4999237060546875, -0.450714111328125, -0.4015045166015625, -0.352294921875, -0.3030853271484375, -0.253875732421875, -0.2046661376953125, -0.15545654296875, -0.1062469482421875, -0.057037353515625, -0.0078277587890625, 0.0413818359375, 0.0905914306640625, 0.139801025390625, 0.1890106201171875, 0.23822021484375, 0.2874298095703125, 0.336639404296875, 0.3858489990234375, 0.43505859375, 0.4842681884765625, 0.533477783203125, 0.5826873779296875, 0.63189697265625, 0.6811065673828125, 0.730316162109375, 0.7795257568359375, 0.8287353515625, 0.8779449462890625, 0.927154541015625, 0.9763641357421875, 1.02557373046875, 1.0747833251953125, 1.123992919921875, 1.1732025146484375, 1.222412109375, 1.2716217041015625, 1.320831298828125, 1.3700408935546875, 1.41925048828125, 1.4684600830078125, 1.517669677734375, 1.5668792724609375, 1.6160888671875, 1.6652984619140625, 1.714508056640625, 1.7637176513671875, 1.81292724609375, 1.8621368408203125, 1.911346435546875, 1.9605560302734375, 2.009765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 7.0, 15.0, 15.0, 25.0, 35.0, 47.0, 71.0, 107.0, 182.0, 142.0, 118.0, 76.0, 33.0, 31.0, 18.0, 19.0, 14.0, 12.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002149343490600586, -0.00020877830684185028, -0.00020262226462364197, -0.00019646622240543365, -0.00019031018018722534, -0.00018415413796901703, -0.00017799809575080872, -0.0001718420535326004, -0.0001656860113143921, -0.00015952996909618378, -0.00015337392687797546, -0.00014721788465976715, -0.00014106184244155884, -0.00013490580022335052, -0.0001287497580051422, -0.0001225937157869339, -0.00011643767356872559, -0.00011028163135051727, -0.00010412558913230896, -9.796954691410065e-05, -9.181350469589233e-05, -8.565746247768402e-05, -7.950142025947571e-05, -7.33453780412674e-05, -6.718933582305908e-05, -6.103329360485077e-05, -5.4877251386642456e-05, -4.872120916843414e-05, -4.256516695022583e-05, -3.640912473201752e-05, -3.0253082513809204e-05, -2.409704029560089e-05, -1.7940998077392578e-05, -1.1784955859184265e-05, -5.628913640975952e-06, 5.271285772323608e-07, 6.683170795440674e-06, 1.2839213013648987e-05, 1.89952552318573e-05, 2.5151297450065613e-05, 3.1307339668273926e-05, 3.746338188648224e-05, 4.361942410469055e-05, 4.9775466322898865e-05, 5.593150854110718e-05, 6.208755075931549e-05, 6.82435929775238e-05, 7.439963519573212e-05, 8.055567741394043e-05, 8.671171963214874e-05, 9.286776185035706e-05, 9.902380406856537e-05, 0.00010517984628677368, 0.000111335888504982, 0.00011749193072319031, 0.00012364797294139862, 0.00012980401515960693, 0.00013596005737781525, 0.00014211609959602356, 0.00014827214181423187, 0.00015442818403244019, 0.0001605842262506485, 0.0001667402684688568, 0.00017289631068706512, 0.00017905235290527344]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 11.0, 17.0, 25.0, 44.0, 47.0, 92.0, 147.0, 218.0, 359.0, 613.0, 1109.0, 2104.0, 4314.0, 10179.0, 30302.0, 145194.0, 678716.0, 128470.0, 28017.0, 9730.0, 4184.0, 2006.0, 1115.0, 565.0, 323.0, 197.0, 133.0, 104.0, 55.0, 45.0, 24.0, 26.0, 14.0, 9.0, 8.0, 3.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.033203125, -1.0040740966796875, -0.974945068359375, -0.9458160400390625, -0.91668701171875, -0.8875579833984375, -0.858428955078125, -0.8292999267578125, -0.8001708984375, -0.7710418701171875, -0.741912841796875, -0.7127838134765625, -0.68365478515625, -0.6545257568359375, -0.625396728515625, -0.5962677001953125, -0.567138671875, -0.5380096435546875, -0.508880615234375, -0.4797515869140625, -0.45062255859375, -0.4214935302734375, -0.392364501953125, -0.3632354736328125, -0.3341064453125, -0.3049774169921875, -0.275848388671875, -0.2467193603515625, -0.21759033203125, -0.1884613037109375, -0.159332275390625, -0.1302032470703125, -0.10107421875, -0.0719451904296875, -0.042816162109375, -0.0136871337890625, 0.01544189453125, 0.0445709228515625, 0.073699951171875, 0.1028289794921875, 0.1319580078125, 0.1610870361328125, 0.190216064453125, 0.2193450927734375, 0.24847412109375, 0.2776031494140625, 0.306732177734375, 0.3358612060546875, 0.364990234375, 0.3941192626953125, 0.423248291015625, 0.4523773193359375, 0.48150634765625, 0.5106353759765625, 0.539764404296875, 0.5688934326171875, 0.5980224609375, 0.6271514892578125, 0.656280517578125, 0.6854095458984375, 0.71453857421875, 0.7436676025390625, 0.772796630859375, 0.8019256591796875, 0.8310546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 9.0, 2.0, 7.0, 7.0, 12.0, 22.0, 39.0, 42.0, 53.0, 89.0, 151.0, 187.0, 146.0, 76.0, 44.0, 34.0, 22.0, 17.0, 9.0, 10.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6259765625, -0.6065673828125, -0.587158203125, -0.5677490234375, -0.54833984375, -0.5289306640625, -0.509521484375, -0.4901123046875, -0.470703125, -0.4512939453125, -0.431884765625, -0.4124755859375, -0.39306640625, -0.3736572265625, -0.354248046875, -0.3348388671875, -0.3154296875, -0.2960205078125, -0.276611328125, -0.2572021484375, -0.23779296875, -0.2183837890625, -0.198974609375, -0.1795654296875, -0.16015625, -0.1407470703125, -0.121337890625, -0.1019287109375, -0.08251953125, -0.0631103515625, -0.043701171875, -0.0242919921875, -0.0048828125, 0.0145263671875, 0.033935546875, 0.0533447265625, 0.07275390625, 0.0921630859375, 0.111572265625, 0.1309814453125, 0.150390625, 0.1697998046875, 0.189208984375, 0.2086181640625, 0.22802734375, 0.2474365234375, 0.266845703125, 0.2862548828125, 0.3056640625, 0.3250732421875, 0.344482421875, 0.3638916015625, 0.38330078125, 0.4027099609375, 0.422119140625, 0.4415283203125, 0.4609375, 0.4803466796875, 0.499755859375, 0.5191650390625, 0.53857421875, 0.5579833984375, 0.577392578125, 0.5968017578125, 0.6162109375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 12.0, 15.0, 9.0, 16.0, 42.0, 40.0, 59.0, 88.0, 129.0, 130.0, 105.0, 98.0, 78.0, 61.0, 34.0, 17.0, 13.0, 17.0, 9.0, 6.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.66705322265625, -7.446164608001709, -7.225276470184326, -7.004387855529785, -6.783499240875244, -6.562610626220703, -6.34172248840332, -6.120833873748779, -5.899945259094238, -5.679056644439697, -5.4581685066223145, -5.237279891967773, -5.016391277313232, -4.795502662658691, -4.574614524841309, -4.353725910186768, -4.132837295532227, -3.9119489192962646, -3.6910603046417236, -3.4701719284057617, -3.2492833137512207, -3.028394937515259, -2.807506561279297, -2.586617946624756, -2.365729808807373, -2.144841432571411, -1.9239528179168701, -1.7030644416809082, -1.4821758270263672, -1.2612874507904053, -1.0403989553451538, -0.8195104598999023, -0.5986218452453613, -0.37773334980010986, -0.1568448841571808, 0.06404358148574829, 0.28493207693099976, 0.5058205127716064, 0.7267090082168579, 0.9475975036621094, 1.1684859991073608, 1.3893744945526123, 1.6102629899978638, 1.8311514854431152, 2.052039861679077, 2.272928237915039, 2.49381685256958, 2.714705467224121, 2.935593843460083, 3.156482219696045, 3.377370834350586, 3.598259210586548, 3.819147825241089, 4.040036201477051, 4.260924816131592, 4.481813430786133, 4.702701568603516, 4.923590183258057, 5.1444783210754395, 5.3653669357299805, 5.5862555503845215, 5.8071441650390625, 6.028032302856445, 6.248920917510986, 6.469809532165527]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 4.0, 8.0, 7.0, 11.0, 8.0, 11.0, 12.0, 21.0, 12.0, 21.0, 24.0, 31.0, 31.0, 39.0, 41.0, 41.0, 40.0, 52.0, 33.0, 48.0, 40.0, 32.0, 37.0, 40.0, 35.0, 36.0, 34.0, 31.0, 27.0, 32.0, 25.0, 27.0, 20.0, 11.0, 14.0, 14.0, 14.0, 3.0, 5.0, 4.0, 10.0, 1.0, 3.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.317837238311768, -7.08499002456665, -6.852142810821533, -6.619295597076416, -6.386447906494141, -6.153600692749023, -5.920753479003906, -5.687906265258789, -5.455059051513672, -5.222211837768555, -4.9893646240234375, -4.75651741027832, -4.523670196533203, -4.290822982788086, -4.0579752922058105, -3.8251280784606934, -3.592280864715576, -3.359433650970459, -3.126586437225342, -2.8937389850616455, -2.6608917713165283, -2.428044557571411, -2.195197105407715, -1.9623498916625977, -1.7295026779174805, -1.4966554641723633, -1.2638081312179565, -1.0309607982635498, -0.7981135845184326, -0.5652663707733154, -0.3324190378189087, -0.09957170486450195, 0.13327550888061523, 0.3661227822303772, 0.5989700555801392, 0.8318173289299011, 1.064664602279663, 1.2975118160247803, 1.530359148979187, 1.7632064819335938, 1.996053695678711, 2.228900909423828, 2.4617481231689453, 2.6945955753326416, 2.927442789077759, 3.160290002822876, 3.3931374549865723, 3.6259846687316895, 3.8588318824768066, 4.091679096221924, 4.324526309967041, 4.557373523712158, 4.790221214294434, 5.023068428039551, 5.255915641784668, 5.488762855529785, 5.721610069274902, 5.9544572830200195, 6.187304496765137, 6.420151710510254, 6.652998924255371, 6.885846138000488, 7.118693828582764, 7.351541042327881, 7.584388256072998]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 3.0, 8.0, 8.0, 17.0, 20.0, 30.0, 26.0, 72.0, 85.0, 156.0, 293.0, 640.0, 1775.0, 6013.0, 31885.0, 641030.0, 3408779.0, 87095.0, 11616.0, 2821.0, 941.0, 414.0, 203.0, 109.0, 64.0, 48.0, 29.0, 27.0, 12.0, 10.0, 8.0, 8.0, 5.0, 8.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.1796875, -6.9698486328125, -6.760009765625, -6.5501708984375, -6.34033203125, -6.1304931640625, -5.920654296875, -5.7108154296875, -5.5009765625, -5.2911376953125, -5.081298828125, -4.8714599609375, -4.66162109375, -4.4517822265625, -4.241943359375, -4.0321044921875, -3.822265625, -3.6124267578125, -3.402587890625, -3.1927490234375, -2.98291015625, -2.7730712890625, -2.563232421875, -2.3533935546875, -2.1435546875, -1.9337158203125, -1.723876953125, -1.5140380859375, -1.30419921875, -1.0943603515625, -0.884521484375, -0.6746826171875, -0.46484375, -0.2550048828125, -0.045166015625, 0.1646728515625, 0.37451171875, 0.5843505859375, 0.794189453125, 1.0040283203125, 1.2138671875, 1.4237060546875, 1.633544921875, 1.8433837890625, 2.05322265625, 2.2630615234375, 2.472900390625, 2.6827392578125, 2.892578125, 3.1024169921875, 3.312255859375, 3.5220947265625, 3.73193359375, 3.9417724609375, 4.151611328125, 4.3614501953125, 4.5712890625, 4.7811279296875, 4.990966796875, 5.2008056640625, 5.41064453125, 5.6204833984375, 5.830322265625, 6.0401611328125, 6.25]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 7.0, 6.0, 10.0, 19.0, 25.0, 26.0, 32.0, 59.0, 56.0, 61.0, 80.0, 84.0, 82.0, 70.0, 64.0, 61.0, 52.0, 51.0, 35.0, 26.0, 17.0, 13.0, 13.0, 13.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.908203125, -3.808563232421875, -3.70892333984375, -3.609283447265625, -3.5096435546875, -3.410003662109375, -3.31036376953125, -3.210723876953125, -3.111083984375, -3.011444091796875, -2.91180419921875, -2.812164306640625, -2.7125244140625, -2.612884521484375, -2.51324462890625, -2.413604736328125, -2.31396484375, -2.214324951171875, -2.11468505859375, -2.015045166015625, -1.9154052734375, -1.815765380859375, -1.71612548828125, -1.616485595703125, -1.516845703125, -1.417205810546875, -1.31756591796875, -1.217926025390625, -1.1182861328125, -1.018646240234375, -0.91900634765625, -0.819366455078125, -0.7197265625, -0.620086669921875, -0.52044677734375, -0.420806884765625, -0.3211669921875, -0.221527099609375, -0.12188720703125, -0.022247314453125, 0.077392578125, 0.177032470703125, 0.27667236328125, 0.376312255859375, 0.4759521484375, 0.575592041015625, 0.67523193359375, 0.774871826171875, 0.87451171875, 0.974151611328125, 1.07379150390625, 1.173431396484375, 1.2730712890625, 1.372711181640625, 1.47235107421875, 1.571990966796875, 1.671630859375, 1.771270751953125, 1.87091064453125, 1.970550537109375, 2.0701904296875, 2.169830322265625, 2.26947021484375, 2.369110107421875, 2.46875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 3.0, 4.0, 12.0, 15.0, 31.0, 43.0, 113.0, 308.0, 1645.0, 53296.0, 4120618.0, 16792.0, 969.0, 219.0, 98.0, 43.0, 22.0, 21.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -9.880859375, -9.37109375, -8.861328125, -8.3515625, -7.841796875, -7.33203125, -6.822265625, -6.3125, -5.802734375, -5.29296875, -4.783203125, -4.2734375, -3.763671875, -3.25390625, -2.744140625, -2.234375, -1.724609375, -1.21484375, -0.705078125, -0.1953125, 0.314453125, 0.82421875, 1.333984375, 1.84375, 2.353515625, 2.86328125, 3.373046875, 3.8828125, 4.392578125, 4.90234375, 5.412109375, 5.921875, 6.431640625, 6.94140625, 7.451171875, 7.9609375, 8.470703125, 8.98046875, 9.490234375, 10.0, 10.509765625, 11.01953125, 11.529296875, 12.0390625, 12.548828125, 13.05859375, 13.568359375, 14.078125, 14.587890625, 15.09765625, 15.607421875, 16.1171875, 16.626953125, 17.13671875, 17.646484375, 18.15625, 18.666015625, 19.17578125, 19.685546875, 20.1953125, 20.705078125, 21.21484375, 21.724609375, 22.234375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 3.0, 9.0, 6.0, 9.0, 17.0, 26.0, 22.0, 31.0, 43.0, 75.0, 99.0, 120.0, 153.0, 226.0, 407.0, 727.0, 751.0, 420.0, 273.0, 188.0, 133.0, 65.0, 70.0, 49.0, 35.0, 18.0, 21.0, 22.0, 7.0, 13.0, 4.0, 2.0, 9.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89794921875, -0.8680801391601562, -0.8382110595703125, -0.8083419799804688, -0.778472900390625, -0.7486038208007812, -0.7187347412109375, -0.6888656616210938, -0.65899658203125, -0.6291275024414062, -0.5992584228515625, -0.5693893432617188, -0.539520263671875, -0.5096511840820312, -0.4797821044921875, -0.44991302490234375, -0.4200439453125, -0.39017486572265625, -0.3603057861328125, -0.33043670654296875, -0.300567626953125, -0.27069854736328125, -0.2408294677734375, -0.21096038818359375, -0.18109130859375, -0.15122222900390625, -0.1213531494140625, -0.09148406982421875, -0.061614990234375, -0.03174591064453125, -0.0018768310546875, 0.02799224853515625, 0.057861328125, 0.08773040771484375, 0.1175994873046875, 0.14746856689453125, 0.177337646484375, 0.20720672607421875, 0.2370758056640625, 0.26694488525390625, 0.29681396484375, 0.32668304443359375, 0.3565521240234375, 0.38642120361328125, 0.416290283203125, 0.44615936279296875, 0.4760284423828125, 0.5058975219726562, 0.5357666015625, 0.5656356811523438, 0.5955047607421875, 0.6253738403320312, 0.655242919921875, 0.6851119995117188, 0.7149810791015625, 0.7448501586914062, 0.77471923828125, 0.8045883178710938, 0.8344573974609375, 0.8643264770507812, 0.894195556640625, 0.9240646362304688, 0.9539337158203125, 0.9838027954101562, 1.013671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 16.0, 11.0, 15.0, 28.0, 28.0, 52.0, 64.0, 71.0, 100.0, 107.0, 118.0, 75.0, 69.0, 59.0, 36.0, 34.0, 21.0, 21.0, 8.0, 13.0, 14.0, 7.0, 0.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.490677356719971, -4.362713813781738, -4.234749794006348, -4.106786251068115, -3.9788224697113037, -3.850858688354492, -3.7228951454162598, -3.5949313640594482, -3.4669675827026367, -3.339003801345825, -3.2110402584075928, -3.0830764770507812, -2.9551126956939697, -2.827148914337158, -2.699185371398926, -2.5712215900421143, -2.443258047103882, -2.3152942657470703, -2.187330722808838, -2.0593669414520264, -1.9314031600952148, -1.8034394979476929, -1.675475835800171, -1.5475120544433594, -1.4195483922958374, -1.2915847301483154, -1.163620948791504, -1.035657286643982, -0.9076935648918152, -0.7797298431396484, -0.6517661809921265, -0.5238024592399597, -0.39583897590637207, -0.2678752541542053, -0.13991156220436096, -0.011947870254516602, 0.11601585149765015, 0.2439795732498169, 0.37194323539733887, 0.4999069571495056, 0.6278706789016724, 0.7558344006538391, 0.8837981224060059, 1.0117617845535278, 1.1397254467010498, 1.2676892280578613, 1.3956528902053833, 1.5236165523529053, 1.6515803337097168, 1.7795439958572388, 1.9075077772140503, 2.0354714393615723, 2.163435220718384, 2.2913990020751953, 2.4193625450134277, 2.5473263263702393, 2.675290107727051, 2.8032538890838623, 2.9312174320220947, 3.0591812133789062, 3.1871449947357178, 3.3151087760925293, 3.4430723190307617, 3.5710361003875732, 3.6989996433258057]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 12.0, 13.0, 9.0, 13.0, 23.0, 35.0, 32.0, 29.0, 41.0, 55.0, 66.0, 61.0, 53.0, 63.0, 67.0, 55.0, 41.0, 56.0, 55.0, 42.0, 27.0, 28.0, 22.0, 23.0, 17.0, 21.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.8028132915496826, -3.7039666175842285, -3.6051201820373535, -3.5062735080718994, -3.4074270725250244, -3.3085803985595703, -3.2097339630126953, -3.110887289047241, -3.012040615081787, -2.913193941116333, -2.814347505569458, -2.715500831604004, -2.616654396057129, -2.517807722091675, -2.4189610481262207, -2.3201146125793457, -2.2212681770324707, -2.1224215030670166, -2.0235750675201416, -1.9247283935546875, -1.825881838798523, -1.7270352840423584, -1.6281887292861938, -1.5293421745300293, -1.4304955005645752, -1.3316489458084106, -1.232802391052246, -1.133955717086792, -1.0351091623306274, -0.9362626075744629, -0.8374160528182983, -0.738569438457489, -0.6397228240966797, -0.5408762693405151, -0.4420296549797058, -0.34318310022354126, -0.24433651566505432, -0.14548993110656738, -0.04664337635040283, 0.052203238010406494, 0.15104979276657104, 0.24989637732505798, 0.3487429618835449, 0.4475895166397095, 0.546436071395874, 0.6452826857566833, 0.7441292405128479, 0.8429758548736572, 0.9418224096298218, 1.0406689643859863, 1.1395155191421509, 1.2383620738983154, 1.3372087478637695, 1.436055302619934, 1.5349018573760986, 1.6337485313415527, 1.7325949668884277, 1.8314415216445923, 1.9302880764007568, 2.029134750366211, 2.127981185913086, 2.22682785987854, 2.325674533843994, 2.424520969390869, 2.5233676433563232]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 7.0, 13.0, 36.0, 22.0, 42.0, 62.0, 101.0, 153.0, 290.0, 549.0, 1260.0, 3028.0, 9263.0, 40415.0, 293162.0, 577431.0, 96677.0, 17533.0, 4918.0, 1746.0, 829.0, 407.0, 206.0, 133.0, 83.0, 43.0, 36.0, 21.0, 17.0, 12.0, 10.0, 4.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7158203125, -0.692901611328125, -0.66998291015625, -0.647064208984375, -0.6241455078125, -0.601226806640625, -0.57830810546875, -0.555389404296875, -0.532470703125, -0.509552001953125, -0.48663330078125, -0.463714599609375, -0.4407958984375, -0.417877197265625, -0.39495849609375, -0.372039794921875, -0.34912109375, -0.326202392578125, -0.30328369140625, -0.280364990234375, -0.2574462890625, -0.234527587890625, -0.21160888671875, -0.188690185546875, -0.165771484375, -0.142852783203125, -0.11993408203125, -0.097015380859375, -0.0740966796875, -0.051177978515625, -0.02825927734375, -0.005340576171875, 0.017578125, 0.040496826171875, 0.06341552734375, 0.086334228515625, 0.1092529296875, 0.132171630859375, 0.15509033203125, 0.178009033203125, 0.200927734375, 0.223846435546875, 0.24676513671875, 0.269683837890625, 0.2926025390625, 0.315521240234375, 0.33843994140625, 0.361358642578125, 0.38427734375, 0.407196044921875, 0.43011474609375, 0.453033447265625, 0.4759521484375, 0.498870849609375, 0.52178955078125, 0.544708251953125, 0.567626953125, 0.590545654296875, 0.61346435546875, 0.636383056640625, 0.6593017578125, 0.682220458984375, 0.70513916015625, 0.728057861328125, 0.7509765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 7.0, 14.0, 14.0, 23.0, 24.0, 22.0, 44.0, 44.0, 51.0, 56.0, 67.0, 77.0, 59.0, 69.0, 55.0, 64.0, 57.0, 51.0, 35.0, 32.0, 31.0, 22.0, 21.0, 16.0, 14.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.24609375, -2.17523193359375, -2.1043701171875, -2.03350830078125, -1.962646484375, -1.89178466796875, -1.8209228515625, -1.75006103515625, -1.67919921875, -1.60833740234375, -1.5374755859375, -1.46661376953125, -1.395751953125, -1.32489013671875, -1.2540283203125, -1.18316650390625, -1.1123046875, -1.04144287109375, -0.9705810546875, -0.89971923828125, -0.828857421875, -0.75799560546875, -0.6871337890625, -0.61627197265625, -0.54541015625, -0.47454833984375, -0.4036865234375, -0.33282470703125, -0.261962890625, -0.19110107421875, -0.1202392578125, -0.04937744140625, 0.021484375, 0.09234619140625, 0.1632080078125, 0.23406982421875, 0.304931640625, 0.37579345703125, 0.4466552734375, 0.51751708984375, 0.58837890625, 0.65924072265625, 0.7301025390625, 0.80096435546875, 0.871826171875, 0.94268798828125, 1.0135498046875, 1.08441162109375, 1.1552734375, 1.22613525390625, 1.2969970703125, 1.36785888671875, 1.438720703125, 1.50958251953125, 1.5804443359375, 1.65130615234375, 1.72216796875, 1.79302978515625, 1.8638916015625, 1.93475341796875, 2.005615234375, 2.07647705078125, 2.1473388671875, 2.21820068359375, 2.2890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 8.0, 19.0, 19.0, 24.0, 34.0, 54.0, 91.0, 113.0, 221.0, 344.0, 637.0, 1262.0, 2637.0, 5809.0, 16577.0, 58124.0, 238949.0, 464340.0, 190392.0, 45623.0, 13358.0, 5119.0, 2238.0, 1010.0, 584.0, 347.0, 191.0, 140.0, 85.0, 57.0, 40.0, 21.0, 14.0, 19.0, 12.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.49609375, -0.4828338623046875, -0.469573974609375, -0.4563140869140625, -0.44305419921875, -0.4297943115234375, -0.416534423828125, -0.4032745361328125, -0.3900146484375, -0.3767547607421875, -0.363494873046875, -0.3502349853515625, -0.33697509765625, -0.3237152099609375, -0.310455322265625, -0.2971954345703125, -0.283935546875, -0.2706756591796875, -0.257415771484375, -0.2441558837890625, -0.23089599609375, -0.2176361083984375, -0.204376220703125, -0.1911163330078125, -0.1778564453125, -0.1645965576171875, -0.151336669921875, -0.1380767822265625, -0.12481689453125, -0.1115570068359375, -0.098297119140625, -0.0850372314453125, -0.07177734375, -0.0585174560546875, -0.045257568359375, -0.0319976806640625, -0.01873779296875, -0.0054779052734375, 0.007781982421875, 0.0210418701171875, 0.0343017578125, 0.0475616455078125, 0.060821533203125, 0.0740814208984375, 0.08734130859375, 0.1006011962890625, 0.113861083984375, 0.1271209716796875, 0.140380859375, 0.1536407470703125, 0.166900634765625, 0.1801605224609375, 0.19342041015625, 0.2066802978515625, 0.219940185546875, 0.2332000732421875, 0.2464599609375, 0.2597198486328125, 0.272979736328125, 0.2862396240234375, 0.29949951171875, 0.3127593994140625, 0.326019287109375, 0.3392791748046875, 0.3525390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 10.0, 5.0, 7.0, 12.0, 17.0, 26.0, 18.0, 20.0, 20.0, 38.0, 33.0, 41.0, 51.0, 58.0, 54.0, 61.0, 71.0, 58.0, 51.0, 50.0, 46.0, 38.0, 39.0, 37.0, 27.0, 29.0, 28.0, 14.0, 9.0, 11.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.17578125, -4.061065673828125, -3.94635009765625, -3.831634521484375, -3.7169189453125, -3.602203369140625, -3.48748779296875, -3.372772216796875, -3.258056640625, -3.143341064453125, -3.02862548828125, -2.913909912109375, -2.7991943359375, -2.684478759765625, -2.56976318359375, -2.455047607421875, -2.34033203125, -2.225616455078125, -2.11090087890625, -1.996185302734375, -1.8814697265625, -1.766754150390625, -1.65203857421875, -1.537322998046875, -1.422607421875, -1.307891845703125, -1.19317626953125, -1.078460693359375, -0.9637451171875, -0.849029541015625, -0.73431396484375, -0.619598388671875, -0.5048828125, -0.390167236328125, -0.27545166015625, -0.160736083984375, -0.0460205078125, 0.068695068359375, 0.18341064453125, 0.298126220703125, 0.412841796875, 0.527557373046875, 0.64227294921875, 0.756988525390625, 0.8717041015625, 0.986419677734375, 1.10113525390625, 1.215850830078125, 1.33056640625, 1.445281982421875, 1.55999755859375, 1.674713134765625, 1.7894287109375, 1.904144287109375, 2.01885986328125, 2.133575439453125, 2.248291015625, 2.363006591796875, 2.47772216796875, 2.592437744140625, 2.7071533203125, 2.821868896484375, 2.93658447265625, 3.051300048828125, 3.166015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 14.0, 7.0, 7.0, 15.0, 19.0, 48.0, 47.0, 88.0, 155.0, 321.0, 589.0, 1228.0, 2783.0, 7110.0, 22831.0, 104706.0, 494179.0, 329133.0, 60742.0, 15220.0, 5202.0, 2078.0, 937.0, 456.0, 224.0, 161.0, 87.0, 62.0, 28.0, 32.0, 11.0, 14.0, 4.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.20654296875, -0.20093536376953125, -0.1953277587890625, -0.18972015380859375, -0.184112548828125, -0.17850494384765625, -0.1728973388671875, -0.16728973388671875, -0.16168212890625, -0.15607452392578125, -0.1504669189453125, -0.14485931396484375, -0.139251708984375, -0.13364410400390625, -0.1280364990234375, -0.12242889404296875, -0.1168212890625, -0.11121368408203125, -0.1056060791015625, -0.09999847412109375, -0.094390869140625, -0.08878326416015625, -0.0831756591796875, -0.07756805419921875, -0.07196044921875, -0.06635284423828125, -0.0607452392578125, -0.05513763427734375, -0.049530029296875, -0.04392242431640625, -0.0383148193359375, -0.03270721435546875, -0.027099609375, -0.02149200439453125, -0.0158843994140625, -0.01027679443359375, -0.004669189453125, 0.00093841552734375, 0.0065460205078125, 0.01215362548828125, 0.01776123046875, 0.02336883544921875, 0.0289764404296875, 0.03458404541015625, 0.040191650390625, 0.04579925537109375, 0.0514068603515625, 0.05701446533203125, 0.0626220703125, 0.06822967529296875, 0.0738372802734375, 0.07944488525390625, 0.085052490234375, 0.09066009521484375, 0.0962677001953125, 0.10187530517578125, 0.10748291015625, 0.11309051513671875, 0.1186981201171875, 0.12430572509765625, 0.129913330078125, 0.13552093505859375, 0.1411285400390625, 0.14673614501953125, 0.15234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 9.0, 11.0, 13.0, 11.0, 16.0, 31.0, 26.0, 29.0, 37.0, 56.0, 61.0, 81.0, 66.0, 79.0, 74.0, 66.0, 66.0, 46.0, 42.0, 43.0, 37.0, 23.0, 18.0, 8.0, 13.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.208917617797852e-05, -8.940789848566055e-05, -8.672662079334259e-05, -8.404534310102463e-05, -8.136406540870667e-05, -7.86827877163887e-05, -7.600151002407074e-05, -7.332023233175278e-05, -7.063895463943481e-05, -6.795767694711685e-05, -6.527639925479889e-05, -6.259512156248093e-05, -5.9913843870162964e-05, -5.7232566177845e-05, -5.455128848552704e-05, -5.1870010793209076e-05, -4.918873310089111e-05, -4.650745540857315e-05, -4.382617771625519e-05, -4.1144900023937225e-05, -3.846362233161926e-05, -3.57823446393013e-05, -3.310106694698334e-05, -3.0419789254665375e-05, -2.7738511562347412e-05, -2.505723387002945e-05, -2.2375956177711487e-05, -1.9694678485393524e-05, -1.701340079307556e-05, -1.4332123100757599e-05, -1.1650845408439636e-05, -8.969567716121674e-06, -6.288290023803711e-06, -3.6070123314857483e-06, -9.257346391677856e-07, 1.755543053150177e-06, 4.43682074546814e-06, 7.118098437786102e-06, 9.799376130104065e-06, 1.2480653822422028e-05, 1.516193151473999e-05, 1.7843209207057953e-05, 2.0524486899375916e-05, 2.3205764591693878e-05, 2.588704228401184e-05, 2.8568319976329803e-05, 3.1249597668647766e-05, 3.393087536096573e-05, 3.661215305328369e-05, 3.9293430745601654e-05, 4.197470843791962e-05, 4.465598613023758e-05, 4.733726382255554e-05, 5.0018541514873505e-05, 5.269981920719147e-05, 5.538109689950943e-05, 5.806237459182739e-05, 6.0743652284145355e-05, 6.342492997646332e-05, 6.610620766878128e-05, 6.878748536109924e-05, 7.14687630534172e-05, 7.415004074573517e-05, 7.683131843805313e-05, 7.95125961303711e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 14.0, 19.0, 37.0, 44.0, 76.0, 195.0, 400.0, 777.0, 1872.0, 5334.0, 22871.0, 282742.0, 671391.0, 49536.0, 8487.0, 2671.0, 1034.0, 482.0, 253.0, 125.0, 64.0, 49.0, 22.0, 20.0, 10.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.32990264892578125, -0.3199615478515625, -0.31002044677734375, -0.300079345703125, -0.29013824462890625, -0.2801971435546875, -0.27025604248046875, -0.26031494140625, -0.25037384033203125, -0.2404327392578125, -0.23049163818359375, -0.220550537109375, -0.21060943603515625, -0.2006683349609375, -0.19072723388671875, -0.1807861328125, -0.17084503173828125, -0.1609039306640625, -0.15096282958984375, -0.141021728515625, -0.13108062744140625, -0.1211395263671875, -0.11119842529296875, -0.10125732421875, -0.09131622314453125, -0.0813751220703125, -0.07143402099609375, -0.061492919921875, -0.05155181884765625, -0.0416107177734375, -0.03166961669921875, -0.021728515625, -0.01178741455078125, -0.0018463134765625, 0.00809478759765625, 0.018035888671875, 0.02797698974609375, 0.0379180908203125, 0.04785919189453125, 0.05780029296875, 0.06774139404296875, 0.0776824951171875, 0.08762359619140625, 0.097564697265625, 0.10750579833984375, 0.1174468994140625, 0.12738800048828125, 0.1373291015625, 0.14727020263671875, 0.1572113037109375, 0.16715240478515625, 0.177093505859375, 0.18703460693359375, 0.1969757080078125, 0.20691680908203125, 0.21685791015625, 0.22679901123046875, 0.2367401123046875, 0.24668121337890625, 0.256622314453125, 0.26656341552734375, 0.2765045166015625, 0.28644561767578125, 0.29638671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 8.0, 13.0, 22.0, 27.0, 36.0, 69.0, 82.0, 152.0, 166.0, 150.0, 107.0, 51.0, 38.0, 23.0, 13.0, 6.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.0611572265625, -0.05908203125, -0.0570068359375, -0.054931640625, -0.0528564453125, -0.05078125, -0.0487060546875, -0.046630859375, -0.0445556640625, -0.04248046875, -0.0404052734375, -0.038330078125, -0.0362548828125, -0.0341796875, -0.0321044921875, -0.030029296875, -0.0279541015625, -0.02587890625, -0.0238037109375, -0.021728515625, -0.0196533203125, -0.017578125, -0.0155029296875, -0.013427734375, -0.0113525390625, -0.00927734375, -0.0072021484375, -0.005126953125, -0.0030517578125, -0.0009765625, 0.0010986328125, 0.003173828125, 0.0052490234375, 0.00732421875, 0.0093994140625, 0.011474609375, 0.0135498046875, 0.015625, 0.0177001953125, 0.019775390625, 0.0218505859375, 0.02392578125, 0.0260009765625, 0.028076171875, 0.0301513671875, 0.0322265625, 0.0343017578125, 0.036376953125, 0.0384521484375, 0.04052734375, 0.0426025390625, 0.044677734375, 0.0467529296875, 0.048828125, 0.0509033203125, 0.052978515625, 0.0550537109375, 0.05712890625, 0.0592041015625, 0.061279296875, 0.0633544921875, 0.0654296875, 0.0675048828125, 0.069580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 8.0, 8.0, 19.0, 24.0, 33.0, 31.0, 70.0, 88.0, 118.0, 107.0, 127.0, 82.0, 65.0, 55.0, 36.0, 30.0, 17.0, 18.0, 16.0, 8.0, 5.0, 6.0, 1.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.2435925006866455, -3.153115749359131, -3.062638998031616, -2.9721622467041016, -2.881685256958008, -2.791208505630493, -2.7007317543029785, -2.610255002975464, -2.519778251647949, -2.4293015003204346, -2.33882474899292, -2.2483479976654053, -2.1578712463378906, -2.067394256591797, -1.9769175052642822, -1.8864407539367676, -1.795964002609253, -1.7054872512817383, -1.6150104999542236, -1.5245336294174194, -1.4340568780899048, -1.3435801267623901, -1.253103256225586, -1.1626265048980713, -1.0721497535705566, -0.981673002243042, -0.8911961913108826, -0.8007193803787231, -0.7102426290512085, -0.6197658777236938, -0.5292890667915344, -0.438812255859375, -0.34833574295043945, -0.2578589618206024, -0.16738218069076538, -0.07690539956092834, 0.013571381568908691, 0.10404816269874573, 0.19452494382858276, 0.2850017547607422, 0.37547850608825684, 0.46595528721809387, 0.5564320683479309, 0.6469088792800903, 0.737385630607605, 0.8278623819351196, 0.918339192867279, 1.0088160037994385, 1.0992927551269531, 1.1897695064544678, 1.2802462577819824, 1.3707231283187866, 1.4611998796463013, 1.551676630973816, 1.6421535015106201, 1.7326302528381348, 1.8231070041656494, 1.913583755493164, 2.0040605068206787, 2.0945372581481934, 2.185014247894287, 2.2754909992218018, 2.3659677505493164, 2.456444501876831, 2.5469212532043457]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 12.0, 12.0, 20.0, 22.0, 35.0, 28.0, 46.0, 57.0, 59.0, 79.0, 64.0, 74.0, 91.0, 46.0, 66.0, 70.0, 45.0, 28.0, 33.0, 27.0, 20.0, 17.0, 14.0, 11.0, 5.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.759587049484253, -2.686246871948242, -2.6129066944122314, -2.5395665168762207, -2.46622633934021, -2.392886161804199, -2.3195459842681885, -2.2462058067321777, -2.172865629196167, -2.0995254516601562, -2.0261852741241455, -1.9528450965881348, -1.879504919052124, -1.8061647415161133, -1.7328245639801025, -1.6594843864440918, -1.5861440896987915, -1.5128039121627808, -1.43946373462677, -1.3661235570907593, -1.2927833795547485, -1.2194432020187378, -1.1461029052734375, -1.0727627277374268, -0.9994226098060608, -0.92608243227005, -0.8527422547340393, -0.7794020175933838, -0.706061840057373, -0.6327216625213623, -0.5593814849853516, -0.4860413074493408, -0.41270124912261963, -0.3393610715866089, -0.26602089405059814, -0.19268068671226501, -0.11934050917625427, -0.04600033164024353, 0.0273398756980896, 0.10068005323410034, 0.17402023077011108, 0.24736040830612183, 0.32070058584213257, 0.3940407931804657, 0.46738097071647644, 0.5407211780548096, 0.6140613555908203, 0.687401533126831, 0.7607417106628418, 0.8340818881988525, 0.9074220657348633, 0.980762243270874, 1.0541024208068848, 1.1274425983428955, 1.2007827758789062, 1.274122953414917, 1.3474631309509277, 1.4208033084869385, 1.4941434860229492, 1.56748366355896, 1.6408238410949707, 1.7141640186309814, 1.7875041961669922, 1.860844373703003, 1.9341846704483032]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 14.0, 20.0, 28.0, 29.0, 48.0, 65.0, 110.0, 158.0, 310.0, 509.0, 912.0, 1704.0, 3366.0, 7353.0, 18630.0, 60834.0, 296499.0, 507023.0, 103733.0, 27608.0, 10160.0, 4573.0, 2173.0, 1164.0, 631.0, 348.0, 188.0, 121.0, 83.0, 52.0, 25.0, 21.0, 19.0, 14.0, 4.0, 8.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84765625, -2.75634765625, -2.6650390625, -2.57373046875, -2.482421875, -2.39111328125, -2.2998046875, -2.20849609375, -2.1171875, -2.02587890625, -1.9345703125, -1.84326171875, -1.751953125, -1.66064453125, -1.5693359375, -1.47802734375, -1.38671875, -1.29541015625, -1.2041015625, -1.11279296875, -1.021484375, -0.93017578125, -0.8388671875, -0.74755859375, -0.65625, -0.56494140625, -0.4736328125, -0.38232421875, -0.291015625, -0.19970703125, -0.1083984375, -0.01708984375, 0.07421875, 0.16552734375, 0.2568359375, 0.34814453125, 0.439453125, 0.53076171875, 0.6220703125, 0.71337890625, 0.8046875, 0.89599609375, 0.9873046875, 1.07861328125, 1.169921875, 1.26123046875, 1.3525390625, 1.44384765625, 1.53515625, 1.62646484375, 1.7177734375, 1.80908203125, 1.900390625, 1.99169921875, 2.0830078125, 2.17431640625, 2.265625, 2.35693359375, 2.4482421875, 2.53955078125, 2.630859375, 2.72216796875, 2.8134765625, 2.90478515625, 2.99609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 5.0, 9.0, 3.0, 5.0, 16.0, 13.0, 12.0, 19.0, 27.0, 25.0, 26.0, 32.0, 37.0, 51.0, 62.0, 53.0, 65.0, 66.0, 75.0, 61.0, 46.0, 38.0, 44.0, 34.0, 28.0, 23.0, 15.0, 22.0, 20.0, 19.0, 11.0, 5.0, 12.0, 7.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.28125, -4.14056396484375, -3.9998779296875, -3.85919189453125, -3.718505859375, -3.57781982421875, -3.4371337890625, -3.29644775390625, -3.15576171875, -3.01507568359375, -2.8743896484375, -2.73370361328125, -2.593017578125, -2.45233154296875, -2.3116455078125, -2.17095947265625, -2.0302734375, -1.88958740234375, -1.7489013671875, -1.60821533203125, -1.467529296875, -1.32684326171875, -1.1861572265625, -1.04547119140625, -0.90478515625, -0.76409912109375, -0.6234130859375, -0.48272705078125, -0.342041015625, -0.20135498046875, -0.0606689453125, 0.08001708984375, 0.220703125, 0.36138916015625, 0.5020751953125, 0.64276123046875, 0.783447265625, 0.92413330078125, 1.0648193359375, 1.20550537109375, 1.34619140625, 1.48687744140625, 1.6275634765625, 1.76824951171875, 1.908935546875, 2.04962158203125, 2.1903076171875, 2.33099365234375, 2.4716796875, 2.61236572265625, 2.7530517578125, 2.89373779296875, 3.034423828125, 3.17510986328125, 3.3157958984375, 3.45648193359375, 3.59716796875, 3.73785400390625, 3.8785400390625, 4.01922607421875, 4.159912109375, 4.30059814453125, 4.4412841796875, 4.58197021484375, 4.72265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 9.0, 8.0, 14.0, 11.0, 15.0, 11.0, 17.0, 16.0, 26.0, 24.0, 23.0, 34.0, 24.0, 52.0, 45.0, 48.0, 104.0, 411.0, 5130.0, 725483.0, 312707.0, 3478.0, 354.0, 82.0, 62.0, 42.0, 33.0, 32.0, 25.0, 31.0, 27.0, 23.0, 12.0, 12.0, 22.0, 13.0, 11.0, 12.0, 13.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0], "bins": [-11.5546875, -11.19287109375, -10.8310546875, -10.46923828125, -10.107421875, -9.74560546875, -9.3837890625, -9.02197265625, -8.66015625, -8.29833984375, -7.9365234375, -7.57470703125, -7.212890625, -6.85107421875, -6.4892578125, -6.12744140625, -5.765625, -5.40380859375, -5.0419921875, -4.68017578125, -4.318359375, -3.95654296875, -3.5947265625, -3.23291015625, -2.87109375, -2.50927734375, -2.1474609375, -1.78564453125, -1.423828125, -1.06201171875, -0.7001953125, -0.33837890625, 0.0234375, 0.38525390625, 0.7470703125, 1.10888671875, 1.470703125, 1.83251953125, 2.1943359375, 2.55615234375, 2.91796875, 3.27978515625, 3.6416015625, 4.00341796875, 4.365234375, 4.72705078125, 5.0888671875, 5.45068359375, 5.8125, 6.17431640625, 6.5361328125, 6.89794921875, 7.259765625, 7.62158203125, 7.9833984375, 8.34521484375, 8.70703125, 9.06884765625, 9.4306640625, 9.79248046875, 10.154296875, 10.51611328125, 10.8779296875, 11.23974609375, 11.6015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 5.0, 7.0, 12.0, 7.0, 14.0, 17.0, 20.0, 21.0, 23.0, 15.0, 26.0, 33.0, 34.0, 38.0, 27.0, 27.0, 36.0, 45.0, 41.0, 39.0, 32.0, 40.0, 31.0, 43.0, 34.0, 28.0, 30.0, 31.0, 25.0, 23.0, 26.0, 21.0, 14.0, 22.0, 11.0, 12.0, 19.0, 8.0, 11.0, 2.0, 6.0, 5.0, 2.0, 4.0, 0.0, 6.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.77734375, -3.65057373046875, -3.5238037109375, -3.39703369140625, -3.270263671875, -3.14349365234375, -3.0167236328125, -2.88995361328125, -2.76318359375, -2.63641357421875, -2.5096435546875, -2.38287353515625, -2.256103515625, -2.12933349609375, -2.0025634765625, -1.87579345703125, -1.7490234375, -1.62225341796875, -1.4954833984375, -1.36871337890625, -1.241943359375, -1.11517333984375, -0.9884033203125, -0.86163330078125, -0.73486328125, -0.60809326171875, -0.4813232421875, -0.35455322265625, -0.227783203125, -0.10101318359375, 0.0257568359375, 0.15252685546875, 0.279296875, 0.40606689453125, 0.5328369140625, 0.65960693359375, 0.786376953125, 0.91314697265625, 1.0399169921875, 1.16668701171875, 1.29345703125, 1.42022705078125, 1.5469970703125, 1.67376708984375, 1.800537109375, 1.92730712890625, 2.0540771484375, 2.18084716796875, 2.3076171875, 2.43438720703125, 2.5611572265625, 2.68792724609375, 2.814697265625, 2.94146728515625, 3.0682373046875, 3.19500732421875, 3.32177734375, 3.44854736328125, 3.5753173828125, 3.70208740234375, 3.828857421875, 3.95562744140625, 4.0823974609375, 4.20916748046875, 4.3359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 15.0, 23.0, 19.0, 50.0, 90.0, 139.0, 247.0, 488.0, 943.0, 2012.0, 5286.0, 18294.0, 114226.0, 736898.0, 138859.0, 20778.0, 5824.0, 2265.0, 1002.0, 484.0, 243.0, 136.0, 83.0, 48.0, 34.0, 16.0, 13.0, 14.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2421875, -1.2028045654296875, -1.163421630859375, -1.1240386962890625, -1.08465576171875, -1.0452728271484375, -1.005889892578125, -0.9665069580078125, -0.9271240234375, -0.8877410888671875, -0.848358154296875, -0.8089752197265625, -0.76959228515625, -0.7302093505859375, -0.690826416015625, -0.6514434814453125, -0.612060546875, -0.5726776123046875, -0.533294677734375, -0.4939117431640625, -0.45452880859375, -0.4151458740234375, -0.375762939453125, -0.3363800048828125, -0.2969970703125, -0.2576141357421875, -0.218231201171875, -0.1788482666015625, -0.13946533203125, -0.1000823974609375, -0.060699462890625, -0.0213165283203125, 0.01806640625, 0.0574493408203125, 0.096832275390625, 0.1362152099609375, 0.17559814453125, 0.2149810791015625, 0.254364013671875, 0.2937469482421875, 0.3331298828125, 0.3725128173828125, 0.411895751953125, 0.4512786865234375, 0.49066162109375, 0.5300445556640625, 0.569427490234375, 0.6088104248046875, 0.648193359375, 0.6875762939453125, 0.726959228515625, 0.7663421630859375, 0.80572509765625, 0.8451080322265625, 0.884490966796875, 0.9238739013671875, 0.9632568359375, 1.0026397705078125, 1.042022705078125, 1.0814056396484375, 1.12078857421875, 1.1601715087890625, 1.199554443359375, 1.2389373779296875, 1.2783203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 2.0, 7.0, 8.0, 8.0, 8.0, 11.0, 16.0, 17.0, 34.0, 60.0, 65.0, 75.0, 84.0, 135.0, 90.0, 77.0, 61.0, 60.0, 44.0, 32.0, 18.0, 19.0, 11.0, 10.0, 10.0, 4.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00015783309936523438, -0.00015268847346305847, -0.00014754384756088257, -0.00014239922165870667, -0.00013725459575653076, -0.00013210996985435486, -0.00012696534395217896, -0.00012182071805000305, -0.00011667609214782715, -0.00011153146624565125, -0.00010638684034347534, -0.00010124221444129944, -9.609758853912354e-05, -9.095296263694763e-05, -8.580833673477173e-05, -8.066371083259583e-05, -7.551908493041992e-05, -7.037445902824402e-05, -6.522983312606812e-05, -6.008520722389221e-05, -5.494058132171631e-05, -4.9795955419540405e-05, -4.46513295173645e-05, -3.95067036151886e-05, -3.4362077713012695e-05, -2.9217451810836792e-05, -2.407282590866089e-05, -1.8928200006484985e-05, -1.3783574104309082e-05, -8.638948202133179e-06, -3.4943222999572754e-06, 1.650303602218628e-06, 6.794929504394531e-06, 1.1939555406570435e-05, 1.7084181308746338e-05, 2.222880721092224e-05, 2.7373433113098145e-05, 3.251805901527405e-05, 3.766268491744995e-05, 4.2807310819625854e-05, 4.795193672180176e-05, 5.309656262397766e-05, 5.8241188526153564e-05, 6.338581442832947e-05, 6.853044033050537e-05, 7.367506623268127e-05, 7.881969213485718e-05, 8.396431803703308e-05, 8.910894393920898e-05, 9.425356984138489e-05, 9.939819574356079e-05, 0.0001045428216457367, 0.0001096874475479126, 0.0001148320734500885, 0.0001199766993522644, 0.0001251213252544403, 0.0001302659511566162, 0.00013541057705879211, 0.00014055520296096802, 0.00014569982886314392, 0.00015084445476531982, 0.00015598908066749573, 0.00016113370656967163, 0.00016627833247184753, 0.00017142295837402344]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 5.0, 4.0, 8.0, 10.0, 5.0, 24.0, 29.0, 40.0, 51.0, 76.0, 132.0, 197.0, 320.0, 546.0, 1049.0, 2164.0, 5183.0, 14551.0, 58375.0, 384336.0, 480786.0, 72006.0, 17373.0, 6005.0, 2515.0, 1161.0, 603.0, 368.0, 212.0, 134.0, 90.0, 59.0, 34.0, 24.0, 24.0, 17.0, 15.0, 8.0, 9.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.96728515625, -0.9361495971679688, -0.9050140380859375, -0.8738784790039062, -0.842742919921875, -0.8116073608398438, -0.7804718017578125, -0.7493362426757812, -0.71820068359375, -0.6870651245117188, -0.6559295654296875, -0.6247940063476562, -0.593658447265625, -0.5625228881835938, -0.5313873291015625, -0.5002517700195312, -0.4691162109375, -0.43798065185546875, -0.4068450927734375, -0.37570953369140625, -0.344573974609375, -0.31343841552734375, -0.2823028564453125, -0.25116729736328125, -0.22003173828125, -0.18889617919921875, -0.1577606201171875, -0.12662506103515625, -0.095489501953125, -0.06435394287109375, -0.0332183837890625, -0.00208282470703125, 0.029052734375, 0.06018829345703125, 0.0913238525390625, 0.12245941162109375, 0.153594970703125, 0.18473052978515625, 0.2158660888671875, 0.24700164794921875, 0.27813720703125, 0.30927276611328125, 0.3404083251953125, 0.37154388427734375, 0.402679443359375, 0.43381500244140625, 0.4649505615234375, 0.49608612060546875, 0.5272216796875, 0.5583572387695312, 0.5894927978515625, 0.6206283569335938, 0.651763916015625, 0.6828994750976562, 0.7140350341796875, 0.7451705932617188, 0.77630615234375, 0.8074417114257812, 0.8385772705078125, 0.8697128295898438, 0.900848388671875, 0.9319839477539062, 0.9631195068359375, 0.9942550659179688, 1.025390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 8.0, 6.0, 8.0, 21.0, 21.0, 22.0, 29.0, 28.0, 60.0, 78.0, 87.0, 94.0, 107.0, 83.0, 76.0, 75.0, 54.0, 36.0, 30.0, 17.0, 14.0, 4.0, 6.0, 6.0, 10.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3915596008300781, -0.37662506103515625, -0.3616905212402344, -0.3467559814453125, -0.3318214416503906, -0.31688690185546875, -0.3019523620605469, -0.287017822265625, -0.2720832824707031, -0.25714874267578125, -0.24221420288085938, -0.2272796630859375, -0.21234512329101562, -0.19741058349609375, -0.18247604370117188, -0.16754150390625, -0.15260696411132812, -0.13767242431640625, -0.12273788452148438, -0.1078033447265625, -0.09286880493164062, -0.07793426513671875, -0.06299972534179688, -0.048065185546875, -0.033130645751953125, -0.01819610595703125, -0.003261566162109375, 0.0116729736328125, 0.026607513427734375, 0.04154205322265625, 0.056476593017578125, 0.0714111328125, 0.08634567260742188, 0.10128021240234375, 0.11621475219726562, 0.1311492919921875, 0.14608383178710938, 0.16101837158203125, 0.17595291137695312, 0.190887451171875, 0.20582199096679688, 0.22075653076171875, 0.23569107055664062, 0.2506256103515625, 0.2655601501464844, 0.28049468994140625, 0.2954292297363281, 0.31036376953125, 0.3252983093261719, 0.34023284912109375, 0.3551673889160156, 0.3701019287109375, 0.3850364685058594, 0.39997100830078125, 0.4149055480957031, 0.429840087890625, 0.4447746276855469, 0.45970916748046875, 0.4746437072753906, 0.4895782470703125, 0.5045127868652344, 0.5194473266601562, 0.5343818664550781, 0.54931640625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 10.0, 11.0, 20.0, 35.0, 52.0, 128.0, 207.0, 203.0, 152.0, 73.0, 52.0, 25.0, 16.0, 11.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.38946008682251, -5.03520393371582, -4.680947780609131, -4.326691627502441, -3.972435712814331, -3.6181795597076416, -3.2639236450195312, -2.909667491912842, -2.5554113388061523, -2.201155185699463, -1.846899151802063, -1.492643117904663, -1.1383869647979736, -0.7841308116912842, -0.42987489700317383, -0.07561874389648438, 0.2786374092102051, 0.6328935027122498, 0.9871495962142944, 1.3414056301116943, 1.6956617832183838, 2.0499179363250732, 2.4041738510131836, 2.758430004119873, 3.1126861572265625, 3.466942310333252, 3.8211984634399414, 4.175454139709473, 4.52971076965332, 4.883966445922852, 5.238222599029541, 5.5924787521362305, 5.946735382080078, 6.300991535186768, 6.655247688293457, 7.009503364562988, 7.363759994506836, 7.718015670776367, 8.072271347045898, 8.426527976989746, 8.780784606933594, 9.135040283203125, 9.489296913146973, 9.843552589416504, 10.197809219360352, 10.552064895629883, 10.906320571899414, 11.260577201843262, 11.614832878112793, 11.969088554382324, 12.323345184326172, 12.677600860595703, 13.03185749053955, 13.386113166809082, 13.74036979675293, 14.094625473022461, 14.448881149291992, 14.803136825561523, 15.157393455505371, 15.511649131774902, 15.86590576171875, 16.22016143798828, 16.574417114257812, 16.928672790527344, 17.282930374145508]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 2.0, 9.0, 11.0, 13.0, 12.0, 14.0, 17.0, 27.0, 18.0, 36.0, 32.0, 30.0, 34.0, 36.0, 37.0, 30.0, 38.0, 43.0, 43.0, 36.0, 54.0, 41.0, 38.0, 30.0, 37.0, 49.0, 19.0, 26.0, 24.0, 20.0, 23.0, 15.0, 18.0, 13.0, 12.0, 8.0, 8.0, 10.0, 5.0, 2.0, 5.0, 7.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1865620613098145, -6.943087577819824, -6.699612617492676, -6.4561381340026855, -6.212663650512695, -5.969188690185547, -5.725714206695557, -5.482239723205566, -5.238764762878418, -4.995290279388428, -4.751815319061279, -4.508340835571289, -4.264866352081299, -4.021391868591309, -3.77791690826416, -3.53444242477417, -3.2909679412841797, -3.0474932193756104, -2.80401873588562, -2.560544013977051, -2.3170695304870605, -2.073594808578491, -1.8301200866699219, -1.586645483970642, -1.3431708812713623, -1.0996962785720825, -0.856221616268158, -0.6127469539642334, -0.3692723512649536, -0.12579774856567383, 0.11767697334289551, 0.3611515760421753, 0.6046266555786133, 0.8481012582778931, 1.0915758609771729, 1.3350505828857422, 1.578525185585022, 1.8219997882843018, 2.065474510192871, 2.3089489936828613, 2.5524237155914307, 2.7958984375, 3.0393729209899902, 3.2828476428985596, 3.526322364807129, 3.769796848297119, 4.013271331787109, 4.256746292114258, 4.500220775604248, 4.743695259094238, 4.987170219421387, 5.230644702911377, 5.474119186401367, 5.717594146728516, 5.961068630218506, 6.204543113708496, 6.4480180740356445, 6.691492557525635, 6.934967517852783, 7.178442001342773, 7.421916484832764, 7.665390968322754, 7.908865928649902, 8.15234088897705, 8.395814895629883]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 6.0, 16.0, 25.0, 28.0, 50.0, 63.0, 115.0, 136.0, 220.0, 354.0, 657.0, 1183.0, 2451.0, 5655.0, 16456.0, 71271.0, 992198.0, 2938674.0, 127088.0, 23582.0, 7538.0, 3099.0, 1465.0, 755.0, 432.0, 262.0, 170.0, 89.0, 61.0, 42.0, 37.0, 32.0, 16.0, 19.0, 8.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.181640625, -3.059967041015625, -2.93829345703125, -2.816619873046875, -2.6949462890625, -2.573272705078125, -2.45159912109375, -2.329925537109375, -2.208251953125, -2.086578369140625, -1.96490478515625, -1.843231201171875, -1.7215576171875, -1.599884033203125, -1.47821044921875, -1.356536865234375, -1.23486328125, -1.113189697265625, -0.99151611328125, -0.869842529296875, -0.7481689453125, -0.626495361328125, -0.50482177734375, -0.383148193359375, -0.261474609375, -0.139801025390625, -0.01812744140625, 0.103546142578125, 0.2252197265625, 0.346893310546875, 0.46856689453125, 0.590240478515625, 0.7119140625, 0.833587646484375, 0.95526123046875, 1.076934814453125, 1.1986083984375, 1.320281982421875, 1.44195556640625, 1.563629150390625, 1.685302734375, 1.806976318359375, 1.92864990234375, 2.050323486328125, 2.1719970703125, 2.293670654296875, 2.41534423828125, 2.537017822265625, 2.65869140625, 2.780364990234375, 2.90203857421875, 3.023712158203125, 3.1453857421875, 3.267059326171875, 3.38873291015625, 3.510406494140625, 3.632080078125, 3.753753662109375, 3.87542724609375, 3.997100830078125, 4.1187744140625, 4.240447998046875, 4.36212158203125, 4.483795166015625, 4.60546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 6.0, 9.0, 13.0, 16.0, 36.0, 28.0, 38.0, 45.0, 59.0, 65.0, 70.0, 77.0, 58.0, 62.0, 82.0, 54.0, 62.0, 49.0, 32.0, 26.0, 22.0, 22.0, 16.0, 11.0, 13.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.802154541015625, -2.71368408203125, -2.625213623046875, -2.5367431640625, -2.448272705078125, -2.35980224609375, -2.271331787109375, -2.182861328125, -2.094390869140625, -2.00592041015625, -1.917449951171875, -1.8289794921875, -1.740509033203125, -1.65203857421875, -1.563568115234375, -1.47509765625, -1.386627197265625, -1.29815673828125, -1.209686279296875, -1.1212158203125, -1.032745361328125, -0.94427490234375, -0.855804443359375, -0.767333984375, -0.678863525390625, -0.59039306640625, -0.501922607421875, -0.4134521484375, -0.324981689453125, -0.23651123046875, -0.148040771484375, -0.0595703125, 0.028900146484375, 0.11737060546875, 0.205841064453125, 0.2943115234375, 0.382781982421875, 0.47125244140625, 0.559722900390625, 0.648193359375, 0.736663818359375, 0.82513427734375, 0.913604736328125, 1.0020751953125, 1.090545654296875, 1.17901611328125, 1.267486572265625, 1.35595703125, 1.444427490234375, 1.53289794921875, 1.621368408203125, 1.7098388671875, 1.798309326171875, 1.88677978515625, 1.975250244140625, 2.063720703125, 2.152191162109375, 2.24066162109375, 2.329132080078125, 2.4176025390625, 2.506072998046875, 2.59454345703125, 2.683013916015625, 2.771484375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 11.0, 7.0, 11.0, 21.0, 30.0, 45.0, 85.0, 127.0, 342.0, 1472.0, 27982.0, 4120721.0, 40904.0, 1743.0, 397.0, 153.0, 70.0, 54.0, 27.0, 28.0, 16.0, 7.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.2430419921875, -13.853271484375, -13.4635009765625, -13.07373046875, -12.6839599609375, -12.294189453125, -11.9044189453125, -11.5146484375, -11.1248779296875, -10.735107421875, -10.3453369140625, -9.95556640625, -9.5657958984375, -9.176025390625, -8.7862548828125, -8.396484375, -8.0067138671875, -7.616943359375, -7.2271728515625, -6.83740234375, -6.4476318359375, -6.057861328125, -5.6680908203125, -5.2783203125, -4.8885498046875, -4.498779296875, -4.1090087890625, -3.71923828125, -3.3294677734375, -2.939697265625, -2.5499267578125, -2.16015625, -1.7703857421875, -1.380615234375, -0.9908447265625, -0.60107421875, -0.2113037109375, 0.178466796875, 0.5682373046875, 0.9580078125, 1.3477783203125, 1.737548828125, 2.1273193359375, 2.51708984375, 2.9068603515625, 3.296630859375, 3.6864013671875, 4.076171875, 4.4659423828125, 4.855712890625, 5.2454833984375, 5.63525390625, 6.0250244140625, 6.414794921875, 6.8045654296875, 7.1943359375, 7.5841064453125, 7.973876953125, 8.3636474609375, 8.75341796875, 9.1431884765625, 9.532958984375, 9.9227294921875, 10.3125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 21.0, 14.0, 17.0, 29.0, 26.0, 43.0, 74.0, 96.0, 166.0, 273.0, 457.0, 1092.0, 755.0, 378.0, 195.0, 122.0, 92.0, 58.0, 48.0, 24.0, 21.0, 16.0, 17.0, 6.0, 8.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0, -0.97039794921875, -0.9407958984375, -0.91119384765625, -0.881591796875, -0.85198974609375, -0.8223876953125, -0.79278564453125, -0.76318359375, -0.73358154296875, -0.7039794921875, -0.67437744140625, -0.644775390625, -0.61517333984375, -0.5855712890625, -0.55596923828125, -0.5263671875, -0.49676513671875, -0.4671630859375, -0.43756103515625, -0.407958984375, -0.37835693359375, -0.3487548828125, -0.31915283203125, -0.28955078125, -0.25994873046875, -0.2303466796875, -0.20074462890625, -0.171142578125, -0.14154052734375, -0.1119384765625, -0.08233642578125, -0.052734375, -0.02313232421875, 0.0064697265625, 0.03607177734375, 0.065673828125, 0.09527587890625, 0.1248779296875, 0.15447998046875, 0.18408203125, 0.21368408203125, 0.2432861328125, 0.27288818359375, 0.302490234375, 0.33209228515625, 0.3616943359375, 0.39129638671875, 0.4208984375, 0.45050048828125, 0.4801025390625, 0.50970458984375, 0.539306640625, 0.56890869140625, 0.5985107421875, 0.62811279296875, 0.65771484375, 0.68731689453125, 0.7169189453125, 0.74652099609375, 0.776123046875, 0.80572509765625, 0.8353271484375, 0.86492919921875, 0.89453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 8.0, 6.0, 9.0, 18.0, 19.0, 27.0, 48.0, 72.0, 73.0, 100.0, 104.0, 111.0, 96.0, 87.0, 52.0, 37.0, 40.0, 17.0, 12.0, 8.0, 8.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.718958854675293, -3.6025497913360596, -3.486140727996826, -3.3697316646575928, -3.2533226013183594, -3.136913537979126, -3.0205044746398926, -2.9040956497192383, -2.787686347961426, -2.6712772846221924, -2.554868221282959, -2.4384591579437256, -2.322050094604492, -2.205641031265259, -2.0892319679260254, -1.9728230237960815, -1.8564140796661377, -1.7400050163269043, -1.623595952987671, -1.5071868896484375, -1.390777826309204, -1.2743687629699707, -1.1579598188400269, -1.0415507555007935, -0.9251416921615601, -0.8087326288223267, -0.6923235654830933, -0.5759145617485046, -0.45950549840927124, -0.34309643507003784, -0.22668743133544922, -0.11027836799621582, 0.0061304569244384766, 0.12253950536251068, 0.23894855380058289, 0.3553575873374939, 0.4717666506767273, 0.5881757140159607, 0.7045847177505493, 0.8209937810897827, 0.9374028444290161, 1.0538119077682495, 1.170220971107483, 1.2866299152374268, 1.4030389785766602, 1.5194480419158936, 1.635857105255127, 1.7522661685943604, 1.8686752319335938, 1.9850842952728271, 2.1014933586120605, 2.217902421951294, 2.3343114852905273, 2.4507205486297607, 2.567129611968994, 2.6835384368896484, 2.799947738647461, 2.9163568019866943, 3.0327658653259277, 3.149174928665161, 3.2655839920043945, 3.381993055343628, 3.4984021186828613, 3.6148109436035156, 3.731220006942749]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 12.0, 17.0, 20.0, 21.0, 33.0, 31.0, 35.0, 38.0, 55.0, 55.0, 64.0, 74.0, 61.0, 51.0, 67.0, 58.0, 60.0, 49.0, 41.0, 32.0, 25.0, 22.0, 15.0, 12.0, 10.0, 11.0, 7.0, 7.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.964372158050537, -2.870063543319702, -2.775754928588867, -2.6814465522766113, -2.5871379375457764, -2.4928293228149414, -2.3985207080841064, -2.3042120933532715, -2.2099037170410156, -2.1155951023101807, -2.0212864875793457, -1.9269779920578003, -1.8326694965362549, -1.73836088180542, -1.644052267074585, -1.54974365234375, -1.455435037612915, -1.36112642288208, -1.2668179273605347, -1.1725093126296997, -1.0782008171081543, -0.9838922023773193, -0.8895835876464844, -0.7952750325202942, -0.700966477394104, -0.6066579222679138, -0.5123493671417236, -0.41804075241088867, -0.3237321972846985, -0.2294236421585083, -0.13511502742767334, -0.040806472301483154, 0.05350208282470703, 0.1478106528520584, 0.2421192228794098, 0.33642780780792236, 0.43073636293411255, 0.5250449180603027, 0.6193535327911377, 0.7136620879173279, 0.8079706430435181, 0.9022791981697083, 0.9965877532958984, 1.0908963680267334, 1.1852049827575684, 1.2795134782791138, 1.3738220930099487, 1.4681305885314941, 1.562439203262329, 1.656747817993164, 1.7510563135147095, 1.8453649282455444, 1.9396734237670898, 2.033982038497925, 2.1282906532287598, 2.2225992679595947, 2.3169078826904297, 2.4112164974212646, 2.5055251121520996, 2.5998334884643555, 2.6941421031951904, 2.7884507179260254, 2.8827593326568604, 2.9770679473876953, 3.071376323699951]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 4.0, 8.0, 10.0, 15.0, 30.0, 42.0, 62.0, 98.0, 208.0, 471.0, 1231.0, 3376.0, 12123.0, 59278.0, 370261.0, 491907.0, 86372.0, 16438.0, 4167.0, 1365.0, 520.0, 245.0, 119.0, 59.0, 46.0, 27.0, 14.0, 18.0, 13.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4714012145996094, -0.45574188232421875, -0.4400825500488281, -0.4244232177734375, -0.4087638854980469, -0.39310455322265625, -0.3774452209472656, -0.361785888671875, -0.3461265563964844, -0.33046722412109375, -0.3148078918457031, -0.2991485595703125, -0.2834892272949219, -0.26782989501953125, -0.2521705627441406, -0.23651123046875, -0.22085189819335938, -0.20519256591796875, -0.18953323364257812, -0.1738739013671875, -0.15821456909179688, -0.14255523681640625, -0.12689590454101562, -0.111236572265625, -0.09557723999023438, -0.07991790771484375, -0.06425857543945312, -0.0485992431640625, -0.032939910888671875, -0.01728057861328125, -0.001621246337890625, 0.0140380859375, 0.029697418212890625, 0.04535675048828125, 0.061016082763671875, 0.0766754150390625, 0.09233474731445312, 0.10799407958984375, 0.12365341186523438, 0.139312744140625, 0.15497207641601562, 0.17063140869140625, 0.18629074096679688, 0.2019500732421875, 0.21760940551757812, 0.23326873779296875, 0.24892807006835938, 0.26458740234375, 0.2802467346191406, 0.29590606689453125, 0.3115653991699219, 0.3272247314453125, 0.3428840637207031, 0.35854339599609375, 0.3742027282714844, 0.389862060546875, 0.4055213928222656, 0.42118072509765625, 0.4368400573730469, 0.4524993896484375, 0.4681587219238281, 0.48381805419921875, 0.4994773864746094, 0.51513671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 12.0, 14.0, 16.0, 17.0, 29.0, 32.0, 45.0, 59.0, 66.0, 82.0, 90.0, 86.0, 70.0, 85.0, 68.0, 58.0, 45.0, 25.0, 24.0, 15.0, 14.0, 7.0, 10.0, 6.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.8203125, -2.74053955078125, -2.6607666015625, -2.58099365234375, -2.501220703125, -2.42144775390625, -2.3416748046875, -2.26190185546875, -2.18212890625, -2.10235595703125, -2.0225830078125, -1.94281005859375, -1.863037109375, -1.78326416015625, -1.7034912109375, -1.62371826171875, -1.5439453125, -1.46417236328125, -1.3843994140625, -1.30462646484375, -1.224853515625, -1.14508056640625, -1.0653076171875, -0.98553466796875, -0.90576171875, -0.82598876953125, -0.7462158203125, -0.66644287109375, -0.586669921875, -0.50689697265625, -0.4271240234375, -0.34735107421875, -0.267578125, -0.18780517578125, -0.1080322265625, -0.02825927734375, 0.051513671875, 0.13128662109375, 0.2110595703125, 0.29083251953125, 0.37060546875, 0.45037841796875, 0.5301513671875, 0.60992431640625, 0.689697265625, 0.76947021484375, 0.8492431640625, 0.92901611328125, 1.0087890625, 1.08856201171875, 1.1683349609375, 1.24810791015625, 1.327880859375, 1.40765380859375, 1.4874267578125, 1.56719970703125, 1.64697265625, 1.72674560546875, 1.8065185546875, 1.88629150390625, 1.966064453125, 2.04583740234375, 2.1256103515625, 2.20538330078125, 2.28515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 7.0, 18.0, 15.0, 23.0, 30.0, 46.0, 67.0, 92.0, 120.0, 181.0, 311.0, 475.0, 948.0, 1865.0, 4090.0, 11101.0, 33998.0, 118573.0, 341070.0, 352817.0, 126051.0, 36329.0, 11511.0, 4487.0, 1886.0, 955.0, 515.0, 310.0, 193.0, 153.0, 93.0, 71.0, 40.0, 34.0, 27.0, 17.0, 14.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2750968933105469, -0.26528167724609375, -0.2554664611816406, -0.2456512451171875, -0.23583602905273438, -0.22602081298828125, -0.21620559692382812, -0.206390380859375, -0.19657516479492188, -0.18675994873046875, -0.17694473266601562, -0.1671295166015625, -0.15731430053710938, -0.14749908447265625, -0.13768386840820312, -0.12786865234375, -0.11805343627929688, -0.10823822021484375, -0.09842300415039062, -0.0886077880859375, -0.07879257202148438, -0.06897735595703125, -0.059162139892578125, -0.049346923828125, -0.039531707763671875, -0.02971649169921875, -0.019901275634765625, -0.0100860595703125, -0.000270843505859375, 0.00954437255859375, 0.019359588623046875, 0.0291748046875, 0.038990020751953125, 0.04880523681640625, 0.058620452880859375, 0.0684356689453125, 0.07825088500976562, 0.08806610107421875, 0.09788131713867188, 0.107696533203125, 0.11751174926757812, 0.12732696533203125, 0.13714218139648438, 0.1469573974609375, 0.15677261352539062, 0.16658782958984375, 0.17640304565429688, 0.18621826171875, 0.19603347778320312, 0.20584869384765625, 0.21566390991210938, 0.2254791259765625, 0.23529434204101562, 0.24510955810546875, 0.2549247741699219, 0.264739990234375, 0.2745552062988281, 0.28437042236328125, 0.2941856384277344, 0.3040008544921875, 0.3138160705566406, 0.32363128662109375, 0.3334465026855469, 0.34326171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 6.0, 5.0, 14.0, 17.0, 18.0, 17.0, 31.0, 32.0, 35.0, 42.0, 52.0, 40.0, 45.0, 49.0, 44.0, 63.0, 65.0, 43.0, 64.0, 45.0, 46.0, 33.0, 33.0, 25.0, 26.0, 24.0, 10.0, 16.0, 8.0, 9.0, 7.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.02734375, -2.92083740234375, -2.8143310546875, -2.70782470703125, -2.601318359375, -2.49481201171875, -2.3883056640625, -2.28179931640625, -2.17529296875, -2.06878662109375, -1.9622802734375, -1.85577392578125, -1.749267578125, -1.64276123046875, -1.5362548828125, -1.42974853515625, -1.3232421875, -1.21673583984375, -1.1102294921875, -1.00372314453125, -0.897216796875, -0.79071044921875, -0.6842041015625, -0.57769775390625, -0.47119140625, -0.36468505859375, -0.2581787109375, -0.15167236328125, -0.045166015625, 0.06134033203125, 0.1678466796875, 0.27435302734375, 0.380859375, 0.48736572265625, 0.5938720703125, 0.70037841796875, 0.806884765625, 0.91339111328125, 1.0198974609375, 1.12640380859375, 1.23291015625, 1.33941650390625, 1.4459228515625, 1.55242919921875, 1.658935546875, 1.76544189453125, 1.8719482421875, 1.97845458984375, 2.0849609375, 2.19146728515625, 2.2979736328125, 2.40447998046875, 2.510986328125, 2.61749267578125, 2.7239990234375, 2.83050537109375, 2.93701171875, 3.04351806640625, 3.1500244140625, 3.25653076171875, 3.363037109375, 3.46954345703125, 3.5760498046875, 3.68255615234375, 3.7890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 4.0, 12.0, 15.0, 29.0, 52.0, 67.0, 137.0, 303.0, 659.0, 1832.0, 7820.0, 101507.0, 886482.0, 42041.0, 5123.0, 1415.0, 540.0, 216.0, 125.0, 65.0, 36.0, 22.0, 15.0, 12.0, 1.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43505859375, -0.42240142822265625, -0.4097442626953125, -0.39708709716796875, -0.384429931640625, -0.37177276611328125, -0.3591156005859375, -0.34645843505859375, -0.33380126953125, -0.32114410400390625, -0.3084869384765625, -0.29582977294921875, -0.283172607421875, -0.27051544189453125, -0.2578582763671875, -0.24520111083984375, -0.2325439453125, -0.21988677978515625, -0.2072296142578125, -0.19457244873046875, -0.181915283203125, -0.16925811767578125, -0.1566009521484375, -0.14394378662109375, -0.13128662109375, -0.11862945556640625, -0.1059722900390625, -0.09331512451171875, -0.080657958984375, -0.06800079345703125, -0.0553436279296875, -0.04268646240234375, -0.030029296875, -0.01737213134765625, -0.0047149658203125, 0.00794219970703125, 0.020599365234375, 0.03325653076171875, 0.0459136962890625, 0.05857086181640625, 0.07122802734375, 0.08388519287109375, 0.0965423583984375, 0.10919952392578125, 0.121856689453125, 0.13451385498046875, 0.1471710205078125, 0.15982818603515625, 0.1724853515625, 0.18514251708984375, 0.1977996826171875, 0.21045684814453125, 0.223114013671875, 0.23577117919921875, 0.2484283447265625, 0.26108551025390625, 0.27374267578125, 0.28639984130859375, 0.2990570068359375, 0.31171417236328125, 0.324371337890625, 0.33702850341796875, 0.3496856689453125, 0.36234283447265625, 0.375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 6.0, 10.0, 14.0, 16.0, 35.0, 52.0, 78.0, 95.0, 94.0, 116.0, 123.0, 87.0, 88.0, 56.0, 33.0, 31.0, 14.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010162591934204102, -9.807851165533066e-05, -9.45311039686203e-05, -9.098369628190994e-05, -8.743628859519958e-05, -8.388888090848923e-05, -8.034147322177887e-05, -7.679406553506851e-05, -7.324665784835815e-05, -6.96992501616478e-05, -6.615184247493744e-05, -6.260443478822708e-05, -5.9057027101516724e-05, -5.5509619414806366e-05, -5.196221172809601e-05, -4.841480404138565e-05, -4.486739635467529e-05, -4.1319988667964935e-05, -3.777258098125458e-05, -3.422517329454422e-05, -3.067776560783386e-05, -2.7130357921123505e-05, -2.3582950234413147e-05, -2.003554254770279e-05, -1.648813486099243e-05, -1.2940727174282074e-05, -9.393319487571716e-06, -5.845911800861359e-06, -2.298504114151001e-06, 1.2489035725593567e-06, 4.796311259269714e-06, 8.343718945980072e-06, 1.189112663269043e-05, 1.5438534319400787e-05, 1.8985942006111145e-05, 2.2533349692821503e-05, 2.608075737953186e-05, 2.9628165066242218e-05, 3.3175572752952576e-05, 3.672298043966293e-05, 4.027038812637329e-05, 4.381779581308365e-05, 4.7365203499794006e-05, 5.0912611186504364e-05, 5.446001887321472e-05, 5.800742655992508e-05, 6.155483424663544e-05, 6.51022419333458e-05, 6.864964962005615e-05, 7.219705730676651e-05, 7.574446499347687e-05, 7.929187268018723e-05, 8.283928036689758e-05, 8.638668805360794e-05, 8.99340957403183e-05, 9.348150342702866e-05, 9.702891111373901e-05, 0.00010057631880044937, 0.00010412372648715973, 0.00010767113417387009, 0.00011121854186058044, 0.0001147659495472908, 0.00011831335723400116, 0.00012186076492071152, 0.00012540817260742188]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 3.0, 8.0, 11.0, 19.0, 25.0, 34.0, 52.0, 69.0, 149.0, 187.0, 368.0, 714.0, 1501.0, 4258.0, 19823.0, 342446.0, 640002.0, 29756.0, 5344.0, 1872.0, 816.0, 439.0, 233.0, 147.0, 98.0, 54.0, 49.0, 30.0, 19.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.383544921875, -0.3734779357910156, -0.36341094970703125, -0.3533439636230469, -0.3432769775390625, -0.3332099914550781, -0.32314300537109375, -0.3130760192871094, -0.303009033203125, -0.2929420471191406, -0.28287506103515625, -0.2728080749511719, -0.2627410888671875, -0.2526741027832031, -0.24260711669921875, -0.23254013061523438, -0.22247314453125, -0.21240615844726562, -0.20233917236328125, -0.19227218627929688, -0.1822052001953125, -0.17213821411132812, -0.16207122802734375, -0.15200424194335938, -0.141937255859375, -0.13187026977539062, -0.12180328369140625, -0.11173629760742188, -0.1016693115234375, -0.09160232543945312, -0.08153533935546875, -0.07146835327148438, -0.0614013671875, -0.051334381103515625, -0.04126739501953125, -0.031200408935546875, -0.0211334228515625, -0.011066436767578125, -0.00099945068359375, 0.009067535400390625, 0.019134521484375, 0.029201507568359375, 0.03926849365234375, 0.049335479736328125, 0.0594024658203125, 0.06946945190429688, 0.07953643798828125, 0.08960342407226562, 0.09967041015625, 0.10973739624023438, 0.11980438232421875, 0.12987136840820312, 0.1399383544921875, 0.15000534057617188, 0.16007232666015625, 0.17013931274414062, 0.180206298828125, 0.19027328491210938, 0.20034027099609375, 0.21040725708007812, 0.2204742431640625, 0.23054122924804688, 0.24060821533203125, 0.2506752014160156, 0.2607421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 13.0, 19.0, 38.0, 53.0, 78.0, 128.0, 181.0, 158.0, 118.0, 73.0, 46.0, 26.0, 8.0, 10.0, 13.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.044464111328125, -0.0427403450012207, -0.041016578674316406, -0.03929281234741211, -0.03756904602050781, -0.035845279693603516, -0.03412151336669922, -0.03239774703979492, -0.030673980712890625, -0.028950214385986328, -0.02722644805908203, -0.025502681732177734, -0.023778915405273438, -0.02205514907836914, -0.020331382751464844, -0.018607616424560547, -0.01688385009765625, -0.015160083770751953, -0.013436317443847656, -0.01171255111694336, -0.009988784790039062, -0.008265018463134766, -0.006541252136230469, -0.004817485809326172, -0.003093719482421875, -0.0013699531555175781, 0.00035381317138671875, 0.0020775794982910156, 0.0038013458251953125, 0.005525112152099609, 0.007248878479003906, 0.008972644805908203, 0.0106964111328125, 0.012420177459716797, 0.014143943786621094, 0.01586771011352539, 0.017591476440429688, 0.019315242767333984, 0.02103900909423828, 0.022762775421142578, 0.024486541748046875, 0.026210308074951172, 0.02793407440185547, 0.029657840728759766, 0.03138160705566406, 0.03310537338256836, 0.034829139709472656, 0.03655290603637695, 0.03827667236328125, 0.04000043869018555, 0.041724205017089844, 0.04344797134399414, 0.04517173767089844, 0.046895503997802734, 0.04861927032470703, 0.05034303665161133, 0.052066802978515625, 0.05379056930541992, 0.05551433563232422, 0.057238101959228516, 0.05896186828613281, 0.06068563461303711, 0.062409400939941406, 0.0641331672668457, 0.06585693359375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 8.0, 10.0, 8.0, 23.0, 23.0, 45.0, 85.0, 118.0, 146.0, 141.0, 140.0, 81.0, 56.0, 36.0, 15.0, 15.0, 10.0, 5.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5170416831970215, -2.4128308296203613, -2.308619737625122, -2.204408884048462, -2.1001977920532227, -1.9959869384765625, -1.8917760848999023, -1.7875651121139526, -1.683354139328003, -1.5791431665420532, -1.4749321937561035, -1.3707213401794434, -1.2665103673934937, -1.162299394607544, -1.0580885410308838, -0.9538775682449341, -0.8496665954589844, -0.7454556226730347, -0.6412447094917297, -0.5370337963104248, -0.4328228235244751, -0.3286118507385254, -0.22440093755722046, -0.12019002437591553, -0.01597905158996582, 0.0882318913936615, 0.19244283437728882, 0.29665377736091614, 0.40086472034454346, 0.5050756931304932, 0.6092866063117981, 0.713497519493103, 0.8177084922790527, 0.9219194650650024, 1.0261304378509521, 1.1303412914276123, 1.234552264213562, 1.3387632369995117, 1.4429740905761719, 1.5471850633621216, 1.6513960361480713, 1.755607008934021, 1.8598179817199707, 1.9640288352966309, 2.068239688873291, 2.1724507808685303, 2.2766616344451904, 2.3808727264404297, 2.48508358001709, 2.58929443359375, 2.6935055255889893, 2.7977163791656494, 2.9019274711608887, 3.006138324737549, 3.110349178314209, 3.214560031890869, 3.3187711238861084, 3.4229819774627686, 3.527193069458008, 3.631403923034668, 3.735614776611328, 3.8398258686065674, 3.9440367221832275, 4.048247814178467, 4.152458667755127]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 2.0, 5.0, 16.0, 13.0, 17.0, 30.0, 32.0, 37.0, 50.0, 58.0, 76.0, 91.0, 79.0, 79.0, 75.0, 77.0, 70.0, 51.0, 34.0, 26.0, 25.0, 10.0, 10.0, 11.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.6410934925079346, -2.565190076828003, -2.489286422729492, -2.4133830070495605, -2.337479591369629, -2.2615761756896973, -2.1856727600097656, -2.109769105911255, -2.0338656902313232, -1.9579622745513916, -1.8820587396621704, -1.8061552047729492, -1.7302517890930176, -1.654348373413086, -1.5784448385238647, -1.5025413036346436, -1.426637887954712, -1.3507344722747803, -1.274830937385559, -1.198927402496338, -1.1230239868164062, -1.0471205711364746, -0.9712170362472534, -0.895313560962677, -0.8194100856781006, -0.7435066103935242, -0.6676031351089478, -0.5916996598243713, -0.5157961845397949, -0.4398927092552185, -0.3639892339706421, -0.2880857586860657, -0.21218228340148926, -0.13627880811691284, -0.060375332832336426, 0.01552814245223999, 0.0914316177368164, 0.16733509302139282, 0.24323856830596924, 0.31914204359054565, 0.39504551887512207, 0.4709489941596985, 0.5468524694442749, 0.6227559447288513, 0.6986594200134277, 0.7745628952980042, 0.8504663705825806, 0.926369845867157, 1.0022733211517334, 1.078176736831665, 1.1540802717208862, 1.2299838066101074, 1.305887222290039, 1.3817906379699707, 1.457694172859192, 1.533597707748413, 1.6095011234283447, 1.6854045391082764, 1.7613080739974976, 1.8372116088867188, 1.9131150245666504, 1.989018440246582, 2.0649218559265137, 2.1408255100250244, 2.216728925704956]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 5.0, 12.0, 5.0, 23.0, 22.0, 20.0, 44.0, 85.0, 242.0, 1084.0, 6908.0, 95837.0, 876674.0, 61129.0, 5227.0, 805.0, 202.0, 75.0, 35.0, 30.0, 14.0, 13.0, 14.0, 11.0, 7.0, 5.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.6015625, -9.36407470703125, -9.1265869140625, -8.88909912109375, -8.651611328125, -8.41412353515625, -8.1766357421875, -7.93914794921875, -7.70166015625, -7.46417236328125, -7.2266845703125, -6.98919677734375, -6.751708984375, -6.51422119140625, -6.2767333984375, -6.03924560546875, -5.8017578125, -5.56427001953125, -5.3267822265625, -5.08929443359375, -4.851806640625, -4.61431884765625, -4.3768310546875, -4.13934326171875, -3.90185546875, -3.66436767578125, -3.4268798828125, -3.18939208984375, -2.951904296875, -2.71441650390625, -2.4769287109375, -2.23944091796875, -2.001953125, -1.76446533203125, -1.5269775390625, -1.28948974609375, -1.052001953125, -0.81451416015625, -0.5770263671875, -0.33953857421875, -0.10205078125, 0.13543701171875, 0.3729248046875, 0.61041259765625, 0.847900390625, 1.08538818359375, 1.3228759765625, 1.56036376953125, 1.7978515625, 2.03533935546875, 2.2728271484375, 2.51031494140625, 2.747802734375, 2.98529052734375, 3.2227783203125, 3.46026611328125, 3.69775390625, 3.93524169921875, 4.1727294921875, 4.41021728515625, 4.647705078125, 4.88519287109375, 5.1226806640625, 5.36016845703125, 5.59765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 11.0, 19.0, 37.0, 52.0, 117.0, 148.0, 176.0, 164.0, 133.0, 62.0, 37.0, 20.0, 11.0, 8.0, 3.0, 5.0, 2.0, 3.0], "bins": [-21.4375, -21.03033447265625, -20.6231689453125, -20.21600341796875, -19.808837890625, -19.40167236328125, -18.9945068359375, -18.58734130859375, -18.18017578125, -17.77301025390625, -17.3658447265625, -16.95867919921875, -16.551513671875, -16.14434814453125, -15.7371826171875, -15.33001708984375, -14.9228515625, -14.51568603515625, -14.1085205078125, -13.70135498046875, -13.294189453125, -12.88702392578125, -12.4798583984375, -12.07269287109375, -11.66552734375, -11.25836181640625, -10.8511962890625, -10.44403076171875, -10.036865234375, -9.62969970703125, -9.2225341796875, -8.81536865234375, -8.408203125, -8.00103759765625, -7.5938720703125, -7.18670654296875, -6.779541015625, -6.37237548828125, -5.9652099609375, -5.55804443359375, -5.15087890625, -4.74371337890625, -4.3365478515625, -3.92938232421875, -3.522216796875, -3.11505126953125, -2.7078857421875, -2.30072021484375, -1.8935546875, -1.48638916015625, -1.0792236328125, -0.67205810546875, -0.264892578125, 0.14227294921875, 0.5494384765625, 0.95660400390625, 1.36376953125, 1.77093505859375, 2.1781005859375, 2.58526611328125, 2.992431640625, 3.39959716796875, 3.8067626953125, 4.21392822265625, 4.62109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 7.0, 4.0, 7.0, 6.0, 16.0, 24.0, 26.0, 25.0, 45.0, 60.0, 61.0, 83.0, 97.0, 148.0, 272.0, 784.0, 3442.0, 33726.0, 846382.0, 152673.0, 8192.0, 1325.0, 407.0, 180.0, 120.0, 88.0, 76.0, 73.0, 45.0, 38.0, 28.0, 19.0, 20.0, 16.0, 10.0, 11.0, 5.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.24609375, -6.04278564453125, -5.8394775390625, -5.63616943359375, -5.432861328125, -5.22955322265625, -5.0262451171875, -4.82293701171875, -4.61962890625, -4.41632080078125, -4.2130126953125, -4.00970458984375, -3.806396484375, -3.60308837890625, -3.3997802734375, -3.19647216796875, -2.9931640625, -2.78985595703125, -2.5865478515625, -2.38323974609375, -2.179931640625, -1.97662353515625, -1.7733154296875, -1.57000732421875, -1.36669921875, -1.16339111328125, -0.9600830078125, -0.75677490234375, -0.553466796875, -0.35015869140625, -0.1468505859375, 0.05645751953125, 0.259765625, 0.46307373046875, 0.6663818359375, 0.86968994140625, 1.072998046875, 1.27630615234375, 1.4796142578125, 1.68292236328125, 1.88623046875, 2.08953857421875, 2.2928466796875, 2.49615478515625, 2.699462890625, 2.90277099609375, 3.1060791015625, 3.30938720703125, 3.5126953125, 3.71600341796875, 3.9193115234375, 4.12261962890625, 4.325927734375, 4.52923583984375, 4.7325439453125, 4.93585205078125, 5.13916015625, 5.34246826171875, 5.5457763671875, 5.74908447265625, 5.952392578125, 6.15570068359375, 6.3590087890625, 6.56231689453125, 6.765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 11.0, 20.0, 12.0, 22.0, 20.0, 33.0, 34.0, 34.0, 38.0, 50.0, 52.0, 51.0, 43.0, 44.0, 48.0, 66.0, 43.0, 47.0, 42.0, 42.0, 40.0, 31.0, 28.0, 31.0, 27.0, 22.0, 18.0, 13.0, 9.0, 4.0, 2.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-6.23828125, -6.07025146484375, -5.9022216796875, -5.73419189453125, -5.566162109375, -5.39813232421875, -5.2301025390625, -5.06207275390625, -4.89404296875, -4.72601318359375, -4.5579833984375, -4.38995361328125, -4.221923828125, -4.05389404296875, -3.8858642578125, -3.71783447265625, -3.5498046875, -3.38177490234375, -3.2137451171875, -3.04571533203125, -2.877685546875, -2.70965576171875, -2.5416259765625, -2.37359619140625, -2.20556640625, -2.03753662109375, -1.8695068359375, -1.70147705078125, -1.533447265625, -1.36541748046875, -1.1973876953125, -1.02935791015625, -0.861328125, -0.69329833984375, -0.5252685546875, -0.35723876953125, -0.189208984375, -0.02117919921875, 0.1468505859375, 0.31488037109375, 0.48291015625, 0.65093994140625, 0.8189697265625, 0.98699951171875, 1.155029296875, 1.32305908203125, 1.4910888671875, 1.65911865234375, 1.8271484375, 1.99517822265625, 2.1632080078125, 2.33123779296875, 2.499267578125, 2.66729736328125, 2.8353271484375, 3.00335693359375, 3.17138671875, 3.33941650390625, 3.5074462890625, 3.67547607421875, 3.843505859375, 4.01153564453125, 4.1795654296875, 4.34759521484375, 4.515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 3.0, 11.0, 4.0, 17.0, 15.0, 21.0, 22.0, 54.0, 67.0, 109.0, 168.0, 292.0, 474.0, 847.0, 1555.0, 3119.0, 6629.0, 16204.0, 44914.0, 164306.0, 514087.0, 208017.0, 54344.0, 18476.0, 7454.0, 3398.0, 1681.0, 945.0, 519.0, 290.0, 181.0, 121.0, 67.0, 50.0, 28.0, 18.0, 16.0, 5.0, 9.0, 3.0, 6.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5119857788085938, -0.4927215576171875, -0.47345733642578125, -0.454193115234375, -0.43492889404296875, -0.4156646728515625, -0.39640045166015625, -0.37713623046875, -0.35787200927734375, -0.3386077880859375, -0.31934356689453125, -0.300079345703125, -0.28081512451171875, -0.2615509033203125, -0.24228668212890625, -0.2230224609375, -0.20375823974609375, -0.1844940185546875, -0.16522979736328125, -0.145965576171875, -0.12670135498046875, -0.1074371337890625, -0.08817291259765625, -0.06890869140625, -0.04964447021484375, -0.0303802490234375, -0.01111602783203125, 0.008148193359375, 0.02741241455078125, 0.0466766357421875, 0.06594085693359375, 0.085205078125, 0.10446929931640625, 0.1237335205078125, 0.14299774169921875, 0.162261962890625, 0.18152618408203125, 0.2007904052734375, 0.22005462646484375, 0.23931884765625, 0.25858306884765625, 0.2778472900390625, 0.29711151123046875, 0.316375732421875, 0.33563995361328125, 0.3549041748046875, 0.37416839599609375, 0.3934326171875, 0.41269683837890625, 0.4319610595703125, 0.45122528076171875, 0.470489501953125, 0.48975372314453125, 0.5090179443359375, 0.5282821655273438, 0.54754638671875, 0.5668106079101562, 0.5860748291015625, 0.6053390502929688, 0.624603271484375, 0.6438674926757812, 0.6631317138671875, 0.6823959350585938, 0.70166015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 1.0, 6.0, 4.0, 17.0, 13.0, 10.0, 19.0, 30.0, 36.0, 45.0, 73.0, 85.0, 77.0, 88.0, 97.0, 94.0, 58.0, 60.0, 47.0, 31.0, 20.0, 15.0, 13.0, 15.0, 12.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00012350082397460938, -0.00011936761438846588, -0.00011523440480232239, -0.0001111011952161789, -0.0001069679856300354, -0.0001028347760438919, -9.870156645774841e-05, -9.456835687160492e-05, -9.043514728546143e-05, -8.630193769931793e-05, -8.216872811317444e-05, -7.803551852703094e-05, -7.390230894088745e-05, -6.976909935474396e-05, -6.563588976860046e-05, -6.150268018245697e-05, -5.7369470596313477e-05, -5.323626101016998e-05, -4.910305142402649e-05, -4.4969841837882996e-05, -4.08366322517395e-05, -3.670342266559601e-05, -3.2570213079452515e-05, -2.843700349330902e-05, -2.4303793907165527e-05, -2.0170584321022034e-05, -1.603737473487854e-05, -1.1904165148735046e-05, -7.770955562591553e-06, -3.637745976448059e-06, 4.954636096954346e-07, 4.628673195838928e-06, 8.761882781982422e-06, 1.2895092368125916e-05, 1.702830195426941e-05, 2.1161511540412903e-05, 2.5294721126556396e-05, 2.942793071269989e-05, 3.3561140298843384e-05, 3.769434988498688e-05, 4.182755947113037e-05, 4.5960769057273865e-05, 5.009397864341736e-05, 5.422718822956085e-05, 5.8360397815704346e-05, 6.249360740184784e-05, 6.662681698799133e-05, 7.076002657413483e-05, 7.489323616027832e-05, 7.902644574642181e-05, 8.315965533256531e-05, 8.72928649187088e-05, 9.14260745048523e-05, 9.555928409099579e-05, 9.969249367713928e-05, 0.00010382570326328278, 0.00010795891284942627, 0.00011209212243556976, 0.00011622533202171326, 0.00012035854160785675, 0.00012449175119400024, 0.00012862496078014374, 0.00013275817036628723, 0.00013689137995243073, 0.00014102458953857422]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 8.0, 8.0, 11.0, 17.0, 20.0, 28.0, 47.0, 86.0, 123.0, 182.0, 339.0, 562.0, 1142.0, 2651.0, 6641.0, 21524.0, 98873.0, 596953.0, 257356.0, 43035.0, 11348.0, 3923.0, 1696.0, 779.0, 447.0, 266.0, 155.0, 89.0, 71.0, 50.0, 38.0, 21.0, 14.0, 6.0, 8.0, 2.0, 7.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.93017578125, -0.9017715454101562, -0.8733673095703125, -0.8449630737304688, -0.816558837890625, -0.7881546020507812, -0.7597503662109375, -0.7313461303710938, -0.70294189453125, -0.6745376586914062, -0.6461334228515625, -0.6177291870117188, -0.589324951171875, -0.5609207153320312, -0.5325164794921875, -0.5041122436523438, -0.4757080078125, -0.44730377197265625, -0.4188995361328125, -0.39049530029296875, -0.362091064453125, -0.33368682861328125, -0.3052825927734375, -0.27687835693359375, -0.24847412109375, -0.22006988525390625, -0.1916656494140625, -0.16326141357421875, -0.134857177734375, -0.10645294189453125, -0.0780487060546875, -0.04964447021484375, -0.021240234375, 0.00716400146484375, 0.0355682373046875, 0.06397247314453125, 0.092376708984375, 0.12078094482421875, 0.1491851806640625, 0.17758941650390625, 0.20599365234375, 0.23439788818359375, 0.2628021240234375, 0.29120635986328125, 0.319610595703125, 0.34801483154296875, 0.3764190673828125, 0.40482330322265625, 0.4332275390625, 0.46163177490234375, 0.4900360107421875, 0.5184402465820312, 0.546844482421875, 0.5752487182617188, 0.6036529541015625, 0.6320571899414062, 0.66046142578125, 0.6888656616210938, 0.7172698974609375, 0.7456741333007812, 0.774078369140625, 0.8024826049804688, 0.8308868408203125, 0.8592910766601562, 0.8876953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 11.0, 13.0, 4.0, 6.0, 9.0, 10.0, 23.0, 18.0, 35.0, 39.0, 57.0, 67.0, 77.0, 104.0, 112.0, 69.0, 62.0, 67.0, 59.0, 33.0, 31.0, 19.0, 14.0, 16.0, 14.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.3756523132324219, -0.36238861083984375, -0.3491249084472656, -0.3358612060546875, -0.3225975036621094, -0.30933380126953125, -0.2960700988769531, -0.282806396484375, -0.2695426940917969, -0.25627899169921875, -0.24301528930664062, -0.2297515869140625, -0.21648788452148438, -0.20322418212890625, -0.18996047973632812, -0.17669677734375, -0.16343307495117188, -0.15016937255859375, -0.13690567016601562, -0.1236419677734375, -0.11037826538085938, -0.09711456298828125, -0.08385086059570312, -0.070587158203125, -0.057323455810546875, -0.04405975341796875, -0.030796051025390625, -0.0175323486328125, -0.004268646240234375, 0.00899505615234375, 0.022258758544921875, 0.0355224609375, 0.048786163330078125, 0.06204986572265625, 0.07531356811523438, 0.0885772705078125, 0.10184097290039062, 0.11510467529296875, 0.12836837768554688, 0.141632080078125, 0.15489578247070312, 0.16815948486328125, 0.18142318725585938, 0.1946868896484375, 0.20795059204101562, 0.22121429443359375, 0.23447799682617188, 0.24774169921875, 0.2610054016113281, 0.27426910400390625, 0.2875328063964844, 0.3007965087890625, 0.3140602111816406, 0.32732391357421875, 0.3405876159667969, 0.353851318359375, 0.3671150207519531, 0.38037872314453125, 0.3936424255371094, 0.4069061279296875, 0.4201698303222656, 0.43343353271484375, 0.4466972351074219, 0.4599609375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 23.0, 106.0, 559.0, 262.0, 41.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.55836868286133, -31.56367301940918, -30.56897735595703, -29.574281692504883, -28.579586029052734, -27.584890365600586, -26.590194702148438, -25.595497131347656, -24.60080337524414, -23.606107711791992, -22.611412048339844, -21.616716384887695, -20.622020721435547, -19.6273250579834, -18.63262939453125, -17.63793182373047, -16.64323616027832, -15.648540496826172, -14.653844833374023, -13.659149169921875, -12.664453506469727, -11.669757843017578, -10.675061225891113, -9.680365562438965, -8.685669898986816, -7.690974235534668, -6.6962785720825195, -5.701582431793213, -4.7068867683410645, -3.712191104888916, -2.7174949645996094, -1.722799301147461, -0.7281036376953125, 0.2665921449661255, 1.2612879276275635, 2.255983829498291, 3.2506794929504395, 4.245375156402588, 5.2400712966918945, 6.234766960144043, 7.229462623596191, 8.22415828704834, 9.218853950500488, 10.213550567626953, 11.208246231079102, 12.20294189453125, 13.197637557983398, 14.192333221435547, 15.187028884887695, 16.181724548339844, 17.176420211791992, 18.17111587524414, 19.16581153869629, 20.160507202148438, 21.15520477294922, 22.149898529052734, 23.144596099853516, 24.139291763305664, 25.133987426757812, 26.12868309020996, 27.12337875366211, 28.118074417114258, 29.112770080566406, 30.107467651367188, 31.102161407470703]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 14.0, 17.0, 20.0, 19.0, 28.0, 30.0, 52.0, 45.0, 59.0, 67.0, 63.0, 76.0, 62.0, 78.0, 66.0, 53.0, 53.0, 40.0, 35.0, 31.0, 22.0, 23.0, 15.0, 11.0, 5.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.181644439697266, -16.769371032714844, -16.357097625732422, -15.944825172424316, -15.532552719116211, -15.120279312133789, -14.708006858825684, -14.295733451843262, -13.883460998535156, -13.471187591552734, -13.058915138244629, -12.646641731262207, -12.234369277954102, -11.82209587097168, -11.409823417663574, -10.997550010681152, -10.585277557373047, -10.173004150390625, -9.76073169708252, -9.348458290100098, -8.936185836791992, -8.52391242980957, -8.111639976501465, -7.699366569519043, -7.287093162536621, -6.874820232391357, -6.462547302246094, -6.05027437210083, -5.638001441955566, -5.2257280349731445, -4.813455581665039, -4.401182174682617, -3.9889097213745117, -3.576636791229248, -3.1643638610839844, -2.7520909309387207, -2.339818000793457, -1.9275448322296143, -1.5152719020843506, -1.102998971939087, -0.6907260417938232, -0.2784530818462372, 0.13381987810134888, 0.5460928678512573, 0.958365797996521, 1.3706388473510742, 1.782911777496338, 2.1951847076416016, 2.6074576377868652, 3.019730567932129, 3.4320034980773926, 3.8442764282226562, 4.25654935836792, 4.668822288513184, 5.0810956954956055, 5.493368148803711, 5.905641555786133, 6.3179144859313965, 6.73018741607666, 7.142460346221924, 7.5547332763671875, 7.967006683349609, 8.379279136657715, 8.791552543640137, 9.203824996948242]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 6.0, 8.0, 9.0, 8.0, 10.0, 20.0, 15.0, 27.0, 24.0, 35.0, 64.0, 70.0, 77.0, 147.0, 175.0, 380.0, 958.0, 2851.0, 12565.0, 137615.0, 3896699.0, 125356.0, 12266.0, 2786.0, 960.0, 430.0, 236.0, 119.0, 112.0, 51.0, 43.0, 28.0, 22.0, 28.0, 18.0, 14.0, 18.0, 7.0, 9.0, 5.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6875, -5.512451171875, -5.33740234375, -5.162353515625, -4.9873046875, -4.812255859375, -4.63720703125, -4.462158203125, -4.287109375, -4.112060546875, -3.93701171875, -3.761962890625, -3.5869140625, -3.411865234375, -3.23681640625, -3.061767578125, -2.88671875, -2.711669921875, -2.53662109375, -2.361572265625, -2.1865234375, -2.011474609375, -1.83642578125, -1.661376953125, -1.486328125, -1.311279296875, -1.13623046875, -0.961181640625, -0.7861328125, -0.611083984375, -0.43603515625, -0.260986328125, -0.0859375, 0.089111328125, 0.26416015625, 0.439208984375, 0.6142578125, 0.789306640625, 0.96435546875, 1.139404296875, 1.314453125, 1.489501953125, 1.66455078125, 1.839599609375, 2.0146484375, 2.189697265625, 2.36474609375, 2.539794921875, 2.71484375, 2.889892578125, 3.06494140625, 3.239990234375, 3.4150390625, 3.590087890625, 3.76513671875, 3.940185546875, 4.115234375, 4.290283203125, 4.46533203125, 4.640380859375, 4.8154296875, 4.990478515625, 5.16552734375, 5.340576171875, 5.515625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 4.0, 9.0, 7.0, 15.0, 22.0, 27.0, 22.0, 39.0, 41.0, 48.0, 70.0, 68.0, 71.0, 63.0, 74.0, 62.0, 66.0, 48.0, 44.0, 30.0, 31.0, 31.0, 15.0, 18.0, 13.0, 14.0, 6.0, 7.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.62890625, -2.548675537109375, -2.46844482421875, -2.388214111328125, -2.3079833984375, -2.227752685546875, -2.14752197265625, -2.067291259765625, -1.987060546875, -1.906829833984375, -1.82659912109375, -1.746368408203125, -1.6661376953125, -1.585906982421875, -1.50567626953125, -1.425445556640625, -1.34521484375, -1.264984130859375, -1.18475341796875, -1.104522705078125, -1.0242919921875, -0.944061279296875, -0.86383056640625, -0.783599853515625, -0.703369140625, -0.623138427734375, -0.54290771484375, -0.462677001953125, -0.3824462890625, -0.302215576171875, -0.22198486328125, -0.141754150390625, -0.0615234375, 0.018707275390625, 0.09893798828125, 0.179168701171875, 0.2593994140625, 0.339630126953125, 0.41986083984375, 0.500091552734375, 0.580322265625, 0.660552978515625, 0.74078369140625, 0.821014404296875, 0.9012451171875, 0.981475830078125, 1.06170654296875, 1.141937255859375, 1.22216796875, 1.302398681640625, 1.38262939453125, 1.462860107421875, 1.5430908203125, 1.623321533203125, 1.70355224609375, 1.783782958984375, 1.864013671875, 1.944244384765625, 2.02447509765625, 2.104705810546875, 2.1849365234375, 2.265167236328125, 2.34539794921875, 2.425628662109375, 2.505859375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 2.0, 4.0, 5.0, 13.0, 10.0, 34.0, 23.0, 41.0, 76.0, 135.0, 248.0, 795.0, 4284.0, 99885.0, 4060329.0, 25237.0, 2206.0, 484.0, 179.0, 91.0, 59.0, 24.0, 22.0, 16.0, 21.0, 8.0, 4.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.29833984375, -9.0107421875, -8.72314453125, -8.435546875, -8.14794921875, -7.8603515625, -7.57275390625, -7.28515625, -6.99755859375, -6.7099609375, -6.42236328125, -6.134765625, -5.84716796875, -5.5595703125, -5.27197265625, -4.984375, -4.69677734375, -4.4091796875, -4.12158203125, -3.833984375, -3.54638671875, -3.2587890625, -2.97119140625, -2.68359375, -2.39599609375, -2.1083984375, -1.82080078125, -1.533203125, -1.24560546875, -0.9580078125, -0.67041015625, -0.3828125, -0.09521484375, 0.1923828125, 0.47998046875, 0.767578125, 1.05517578125, 1.3427734375, 1.63037109375, 1.91796875, 2.20556640625, 2.4931640625, 2.78076171875, 3.068359375, 3.35595703125, 3.6435546875, 3.93115234375, 4.21875, 4.50634765625, 4.7939453125, 5.08154296875, 5.369140625, 5.65673828125, 5.9443359375, 6.23193359375, 6.51953125, 6.80712890625, 7.0947265625, 7.38232421875, 7.669921875, 7.95751953125, 8.2451171875, 8.53271484375, 8.8203125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 13.0, 12.0, 11.0, 34.0, 16.0, 55.0, 87.0, 136.0, 239.0, 584.0, 1632.0, 598.0, 262.0, 134.0, 76.0, 55.0, 29.0, 25.0, 23.0, 12.0, 10.0, 6.0, 3.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.9434814453125, -0.910400390625, -0.8773193359375, -0.84423828125, -0.8111572265625, -0.778076171875, -0.7449951171875, -0.7119140625, -0.6788330078125, -0.645751953125, -0.6126708984375, -0.57958984375, -0.5465087890625, -0.513427734375, -0.4803466796875, -0.447265625, -0.4141845703125, -0.381103515625, -0.3480224609375, -0.31494140625, -0.2818603515625, -0.248779296875, -0.2156982421875, -0.1826171875, -0.1495361328125, -0.116455078125, -0.0833740234375, -0.05029296875, -0.0172119140625, 0.015869140625, 0.0489501953125, 0.08203125, 0.1151123046875, 0.148193359375, 0.1812744140625, 0.21435546875, 0.2474365234375, 0.280517578125, 0.3135986328125, 0.3466796875, 0.3797607421875, 0.412841796875, 0.4459228515625, 0.47900390625, 0.5120849609375, 0.545166015625, 0.5782470703125, 0.611328125, 0.6444091796875, 0.677490234375, 0.7105712890625, 0.74365234375, 0.7767333984375, 0.809814453125, 0.8428955078125, 0.8759765625, 0.9090576171875, 0.942138671875, 0.9752197265625, 1.00830078125, 1.0413818359375, 1.074462890625, 1.1075439453125, 1.140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 10.0, 2.0, 6.0, 2.0, 7.0, 3.0, 10.0, 9.0, 9.0, 16.0, 21.0, 21.0, 33.0, 57.0, 78.0, 77.0, 107.0, 104.0, 99.0, 73.0, 60.0, 43.0, 24.0, 32.0, 30.0, 15.0, 12.0, 8.0, 7.0, 2.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.676827907562256, -2.5784897804260254, -2.480151653289795, -2.3818135261535645, -2.283475160598755, -2.1851370334625244, -2.086798906326294, -1.9884607791900635, -1.8901225328445435, -1.791784405708313, -1.693446159362793, -1.5951080322265625, -1.496769905090332, -1.398431658744812, -1.3000935316085815, -1.2017552852630615, -1.103417158126831, -1.0050790309906006, -0.9067407846450806, -0.8084026575088501, -0.7100644707679749, -0.6117262840270996, -0.5133881568908691, -0.4150499701499939, -0.31671178340911865, -0.2183736115694046, -0.12003543972969055, -0.021697282791137695, 0.07664090394973755, 0.1749790906906128, 0.27331721782684326, 0.3716554045677185, 0.46999359130859375, 0.568331778049469, 0.6666699647903442, 0.7650080919265747, 0.86334627866745, 0.9616844654083252, 1.0600225925445557, 1.1583607196807861, 1.2566989660263062, 1.3550370931625366, 1.4533753395080566, 1.551713466644287, 1.6500515937805176, 1.7483898401260376, 1.846727967262268, 1.945066213607788, 2.0434043407440186, 2.141742467880249, 2.2400805950164795, 2.338418960571289, 2.4367570877075195, 2.53509521484375, 2.6334333419799805, 2.731771469116211, 2.8301095962524414, 2.928447723388672, 3.0267858505249023, 3.125123977661133, 3.2234623432159424, 3.321800470352173, 3.4201385974884033, 3.518476724624634, 3.6168150901794434]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 10.0, 5.0, 13.0, 9.0, 15.0, 15.0, 29.0, 25.0, 37.0, 39.0, 51.0, 60.0, 51.0, 60.0, 61.0, 52.0, 55.0, 49.0, 51.0, 46.0, 43.0, 28.0, 32.0, 26.0, 25.0, 27.0, 15.0, 14.0, 12.0, 10.0, 4.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.384866952896118, -2.3088696002960205, -2.232872486114502, -2.1568751335144043, -2.0808777809143066, -2.004880666732788, -1.9288833141326904, -1.8528860807418823, -1.7768888473510742, -1.7008916139602661, -1.624894380569458, -1.5488970279693604, -1.4728997945785522, -1.3969025611877441, -1.3209052085876465, -1.2449079751968384, -1.1689107418060303, -1.0929135084152222, -1.016916275024414, -0.9409189224243164, -0.8649216890335083, -0.7889244556427002, -0.7129271626472473, -0.6369298696517944, -0.5609326362609863, -0.48493537306785583, -0.40893810987472534, -0.33294084668159485, -0.25694358348846436, -0.18094632029533386, -0.10494905710220337, -0.02895176410675049, 0.047045230865478516, 0.12304249405860901, 0.1990397572517395, 0.27503702044487, 0.3510342836380005, 0.427031546831131, 0.5030288100242615, 0.5790261030197144, 0.6550233364105225, 0.7310205698013306, 0.8070178627967834, 0.8830151557922363, 0.9590123891830444, 1.0350096225738525, 1.1110069751739502, 1.1870042085647583, 1.2630014419555664, 1.3389986753463745, 1.4149959087371826, 1.4909932613372803, 1.5669904947280884, 1.6429877281188965, 1.7189850807189941, 1.7949823141098022, 1.8709795475006104, 1.9469767808914185, 2.0229740142822266, 2.098971366882324, 2.174968719482422, 2.2509658336639404, 2.326963186264038, 2.4029603004455566, 2.4789576530456543]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 2.0, 7.0, 14.0, 7.0, 30.0, 53.0, 68.0, 86.0, 125.0, 265.0, 421.0, 779.0, 1354.0, 2672.0, 5580.0, 12198.0, 29630.0, 80675.0, 221649.0, 368276.0, 202828.0, 72691.0, 27167.0, 11463.0, 5150.0, 2448.0, 1237.0, 660.0, 395.0, 235.0, 124.0, 88.0, 54.0, 43.0, 26.0, 9.0, 12.0, 7.0, 12.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2457275390625, -0.23815536499023438, -0.23058319091796875, -0.22301101684570312, -0.2154388427734375, -0.20786666870117188, -0.20029449462890625, -0.19272232055664062, -0.185150146484375, -0.17757797241210938, -0.17000579833984375, -0.16243362426757812, -0.1548614501953125, -0.14728927612304688, -0.13971710205078125, -0.13214492797851562, -0.12457275390625, -0.11700057983398438, -0.10942840576171875, -0.10185623168945312, -0.0942840576171875, -0.08671188354492188, -0.07913970947265625, -0.07156753540039062, -0.063995361328125, -0.056423187255859375, -0.04885101318359375, -0.041278839111328125, -0.0337066650390625, -0.026134490966796875, -0.01856231689453125, -0.010990142822265625, -0.00341796875, 0.004154205322265625, 0.01172637939453125, 0.019298553466796875, 0.0268707275390625, 0.034442901611328125, 0.04201507568359375, 0.049587249755859375, 0.057159423828125, 0.06473159790039062, 0.07230377197265625, 0.07987594604492188, 0.0874481201171875, 0.09502029418945312, 0.10259246826171875, 0.11016464233398438, 0.11773681640625, 0.12530899047851562, 0.13288116455078125, 0.14045333862304688, 0.1480255126953125, 0.15559768676757812, 0.16316986083984375, 0.17074203491210938, 0.178314208984375, 0.18588638305664062, 0.19345855712890625, 0.20103073120117188, 0.2086029052734375, 0.21617507934570312, 0.22374725341796875, 0.23131942749023438, 0.2388916015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 5.0, 5.0, 10.0, 17.0, 11.0, 17.0, 37.0, 53.0, 52.0, 64.0, 74.0, 101.0, 88.0, 82.0, 65.0, 70.0, 46.0, 43.0, 40.0, 22.0, 20.0, 27.0, 12.0, 10.0, 9.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.90234375, -2.82733154296875, -2.7523193359375, -2.67730712890625, -2.602294921875, -2.52728271484375, -2.4522705078125, -2.37725830078125, -2.30224609375, -2.22723388671875, -2.1522216796875, -2.07720947265625, -2.002197265625, -1.92718505859375, -1.8521728515625, -1.77716064453125, -1.7021484375, -1.62713623046875, -1.5521240234375, -1.47711181640625, -1.402099609375, -1.32708740234375, -1.2520751953125, -1.17706298828125, -1.10205078125, -1.02703857421875, -0.9520263671875, -0.87701416015625, -0.802001953125, -0.72698974609375, -0.6519775390625, -0.57696533203125, -0.501953125, -0.42694091796875, -0.3519287109375, -0.27691650390625, -0.201904296875, -0.12689208984375, -0.0518798828125, 0.02313232421875, 0.09814453125, 0.17315673828125, 0.2481689453125, 0.32318115234375, 0.398193359375, 0.47320556640625, 0.5482177734375, 0.62322998046875, 0.6982421875, 0.77325439453125, 0.8482666015625, 0.92327880859375, 0.998291015625, 1.07330322265625, 1.1483154296875, 1.22332763671875, 1.29833984375, 1.37335205078125, 1.4483642578125, 1.52337646484375, 1.598388671875, 1.67340087890625, 1.7484130859375, 1.82342529296875, 1.8984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 6.0, 7.0, 8.0, 1.0, 21.0, 17.0, 27.0, 46.0, 45.0, 88.0, 105.0, 120.0, 197.0, 358.0, 535.0, 875.0, 1592.0, 3433.0, 8473.0, 24553.0, 79099.0, 239742.0, 388488.0, 203819.0, 63299.0, 19939.0, 7246.0, 2949.0, 1384.0, 746.0, 418.0, 265.0, 187.0, 126.0, 94.0, 64.0, 54.0, 36.0, 31.0, 19.0, 10.0, 9.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2359619140625, -0.2276592254638672, -0.21935653686523438, -0.21105384826660156, -0.20275115966796875, -0.19444847106933594, -0.18614578247070312, -0.1778430938720703, -0.1695404052734375, -0.1612377166748047, -0.15293502807617188, -0.14463233947753906, -0.13632965087890625, -0.12802696228027344, -0.11972427368164062, -0.11142158508300781, -0.103118896484375, -0.09481620788574219, -0.08651351928710938, -0.07821083068847656, -0.06990814208984375, -0.06160545349121094, -0.053302764892578125, -0.04500007629394531, -0.0366973876953125, -0.028394699096679688, -0.020092010498046875, -0.011789321899414062, -0.00348663330078125, 0.0048160552978515625, 0.013118743896484375, 0.021421432495117188, 0.02972412109375, 0.03802680969238281, 0.046329498291015625, 0.05463218688964844, 0.06293487548828125, 0.07123756408691406, 0.07954025268554688, 0.08784294128417969, 0.0961456298828125, 0.10444831848144531, 0.11275100708007812, 0.12105369567871094, 0.12935638427734375, 0.13765907287597656, 0.14596176147460938, 0.1542644500732422, 0.162567138671875, 0.1708698272705078, 0.17917251586914062, 0.18747520446777344, 0.19577789306640625, 0.20408058166503906, 0.21238327026367188, 0.2206859588623047, 0.2289886474609375, 0.2372913360595703, 0.24559402465820312, 0.25389671325683594, 0.26219940185546875, 0.27050209045410156, 0.2788047790527344, 0.2871074676513672, 0.29541015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 13.0, 8.0, 7.0, 14.0, 27.0, 16.0, 22.0, 21.0, 36.0, 45.0, 39.0, 44.0, 48.0, 44.0, 51.0, 53.0, 52.0, 50.0, 52.0, 51.0, 35.0, 55.0, 38.0, 39.0, 30.0, 27.0, 8.0, 13.0, 17.0, 7.0, 5.0, 6.0, 6.0, 1.0, 4.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.794921875, -3.69329833984375, -3.5916748046875, -3.49005126953125, -3.388427734375, -3.28680419921875, -3.1851806640625, -3.08355712890625, -2.98193359375, -2.88031005859375, -2.7786865234375, -2.67706298828125, -2.575439453125, -2.47381591796875, -2.3721923828125, -2.27056884765625, -2.1689453125, -2.06732177734375, -1.9656982421875, -1.86407470703125, -1.762451171875, -1.66082763671875, -1.5592041015625, -1.45758056640625, -1.35595703125, -1.25433349609375, -1.1527099609375, -1.05108642578125, -0.949462890625, -0.84783935546875, -0.7462158203125, -0.64459228515625, -0.54296875, -0.44134521484375, -0.3397216796875, -0.23809814453125, -0.136474609375, -0.03485107421875, 0.0667724609375, 0.16839599609375, 0.27001953125, 0.37164306640625, 0.4732666015625, 0.57489013671875, 0.676513671875, 0.77813720703125, 0.8797607421875, 0.98138427734375, 1.0830078125, 1.18463134765625, 1.2862548828125, 1.38787841796875, 1.489501953125, 1.59112548828125, 1.6927490234375, 1.79437255859375, 1.89599609375, 1.99761962890625, 2.0992431640625, 2.20086669921875, 2.302490234375, 2.40411376953125, 2.5057373046875, 2.60736083984375, 2.708984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 5.0, 16.0, 19.0, 26.0, 39.0, 60.0, 66.0, 103.0, 186.0, 321.0, 494.0, 958.0, 2044.0, 5114.0, 16498.0, 74225.0, 383241.0, 445559.0, 89533.0, 19422.0, 5887.0, 2233.0, 1075.0, 505.0, 309.0, 205.0, 110.0, 89.0, 49.0, 32.0, 30.0, 24.0, 20.0, 7.0, 7.0, 2.0, 5.0, 3.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.123046875, -0.11881256103515625, -0.1145782470703125, -0.11034393310546875, -0.106109619140625, -0.10187530517578125, -0.0976409912109375, -0.09340667724609375, -0.08917236328125, -0.08493804931640625, -0.0807037353515625, -0.07646942138671875, -0.072235107421875, -0.06800079345703125, -0.0637664794921875, -0.05953216552734375, -0.0552978515625, -0.05106353759765625, -0.0468292236328125, -0.04259490966796875, -0.038360595703125, -0.03412628173828125, -0.0298919677734375, -0.02565765380859375, -0.02142333984375, -0.01718902587890625, -0.0129547119140625, -0.00872039794921875, -0.004486083984375, -0.00025177001953125, 0.0039825439453125, 0.00821685791015625, 0.012451171875, 0.01668548583984375, 0.0209197998046875, 0.02515411376953125, 0.029388427734375, 0.03362274169921875, 0.0378570556640625, 0.04209136962890625, 0.04632568359375, 0.05055999755859375, 0.0547943115234375, 0.05902862548828125, 0.063262939453125, 0.06749725341796875, 0.0717315673828125, 0.07596588134765625, 0.0802001953125, 0.08443450927734375, 0.0886688232421875, 0.09290313720703125, 0.097137451171875, 0.10137176513671875, 0.1056060791015625, 0.10984039306640625, 0.11407470703125, 0.11830902099609375, 0.1225433349609375, 0.12677764892578125, 0.131011962890625, 0.13524627685546875, 0.1394805908203125, 0.14371490478515625, 0.14794921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 6.0, 6.0, 11.0, 15.0, 14.0, 34.0, 47.0, 54.0, 81.0, 85.0, 108.0, 115.0, 100.0, 86.0, 64.0, 45.0, 32.0, 27.0, 20.0, 17.0, 15.0, 2.0, 8.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001232624053955078, -0.00012029241770505905, -0.00011732243001461029, -0.00011435244232416153, -0.00011138245463371277, -0.00010841246694326401, -0.00010544247925281525, -0.00010247249156236649, -9.950250387191772e-05, -9.653251618146896e-05, -9.35625284910202e-05, -9.059254080057144e-05, -8.762255311012268e-05, -8.465256541967392e-05, -8.168257772922516e-05, -7.87125900387764e-05, -7.574260234832764e-05, -7.277261465787888e-05, -6.980262696743011e-05, -6.683263927698135e-05, -6.386265158653259e-05, -6.089266389608383e-05, -5.792267620563507e-05, -5.495268851518631e-05, -5.198270082473755e-05, -4.901271313428879e-05, -4.604272544384003e-05, -4.3072737753391266e-05, -4.0102750062942505e-05, -3.7132762372493744e-05, -3.416277468204498e-05, -3.119278699159622e-05, -2.822279930114746e-05, -2.52528116106987e-05, -2.228282392024994e-05, -1.9312836229801178e-05, -1.6342848539352417e-05, -1.3372860848903656e-05, -1.0402873158454895e-05, -7.432885468006134e-06, -4.462897777557373e-06, -1.492910087108612e-06, 1.477077603340149e-06, 4.44706529378891e-06, 7.417052984237671e-06, 1.0387040674686432e-05, 1.3357028365135193e-05, 1.6327016055583954e-05, 1.9297003746032715e-05, 2.2266991436481476e-05, 2.5236979126930237e-05, 2.8206966817378998e-05, 3.117695450782776e-05, 3.414694219827652e-05, 3.711692988872528e-05, 4.008691757917404e-05, 4.30569052696228e-05, 4.6026892960071564e-05, 4.8996880650520325e-05, 5.1966868340969086e-05, 5.493685603141785e-05, 5.790684372186661e-05, 6.087683141231537e-05, 6.384681910276413e-05, 6.681680679321289e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 9.0, 19.0, 28.0, 37.0, 55.0, 97.0, 249.0, 640.0, 2083.0, 9092.0, 71176.0, 704578.0, 234217.0, 20740.0, 3763.0, 1044.0, 341.0, 153.0, 93.0, 36.0, 34.0, 20.0, 17.0, 4.0, 11.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1907958984375, -0.18437767028808594, -0.17795944213867188, -0.1715412139892578, -0.16512298583984375, -0.1587047576904297, -0.15228652954101562, -0.14586830139160156, -0.1394500732421875, -0.13303184509277344, -0.12661361694335938, -0.12019538879394531, -0.11377716064453125, -0.10735893249511719, -0.10094070434570312, -0.09452247619628906, -0.088104248046875, -0.08168601989746094, -0.07526779174804688, -0.06884956359863281, -0.06243133544921875, -0.05601310729980469, -0.049594879150390625, -0.04317665100097656, -0.0367584228515625, -0.030340194702148438, -0.023921966552734375, -0.017503738403320312, -0.01108551025390625, -0.0046672821044921875, 0.001750946044921875, 0.008169174194335938, 0.01458740234375, 0.021005630493164062, 0.027423858642578125, 0.03384208679199219, 0.04026031494140625, 0.04667854309082031, 0.053096771240234375, 0.05951499938964844, 0.0659332275390625, 0.07235145568847656, 0.07876968383789062, 0.08518791198730469, 0.09160614013671875, 0.09802436828613281, 0.10444259643554688, 0.11086082458496094, 0.117279052734375, 0.12369728088378906, 0.13011550903320312, 0.1365337371826172, 0.14295196533203125, 0.1493701934814453, 0.15578842163085938, 0.16220664978027344, 0.1686248779296875, 0.17504310607910156, 0.18146133422851562, 0.1878795623779297, 0.19429779052734375, 0.2007160186767578, 0.20713424682617188, 0.21355247497558594, 0.219970703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 9.0, 6.0, 11.0, 12.0, 17.0, 22.0, 28.0, 44.0, 50.0, 50.0, 64.0, 89.0, 99.0, 82.0, 74.0, 70.0, 62.0, 35.0, 43.0, 30.0, 28.0, 15.0, 14.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0281829833984375, -0.02735733985900879, -0.026531696319580078, -0.025706052780151367, -0.024880409240722656, -0.024054765701293945, -0.023229122161865234, -0.022403478622436523, -0.021577835083007812, -0.0207521915435791, -0.01992654800415039, -0.01910090446472168, -0.01827526092529297, -0.017449617385864258, -0.016623973846435547, -0.015798330307006836, -0.014972686767578125, -0.014147043228149414, -0.013321399688720703, -0.012495756149291992, -0.011670112609863281, -0.01084446907043457, -0.01001882553100586, -0.009193181991577148, -0.008367538452148438, -0.0075418949127197266, -0.006716251373291016, -0.005890607833862305, -0.005064964294433594, -0.004239320755004883, -0.003413677215576172, -0.002588033676147461, -0.00176239013671875, -0.0009367465972900391, -0.00011110305786132812, 0.0007145404815673828, 0.0015401840209960938, 0.0023658275604248047, 0.0031914710998535156, 0.0040171146392822266, 0.0048427581787109375, 0.0056684017181396484, 0.006494045257568359, 0.00731968879699707, 0.008145332336425781, 0.008970975875854492, 0.009796619415283203, 0.010622262954711914, 0.011447906494140625, 0.012273550033569336, 0.013099193572998047, 0.013924837112426758, 0.014750480651855469, 0.01557612419128418, 0.01640176773071289, 0.0172274112701416, 0.018053054809570312, 0.018878698348999023, 0.019704341888427734, 0.020529985427856445, 0.021355628967285156, 0.022181272506713867, 0.023006916046142578, 0.02383255958557129, 0.024658203125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 3.0, 13.0, 8.0, 11.0, 10.0, 24.0, 31.0, 44.0, 89.0, 133.0, 150.0, 155.0, 101.0, 62.0, 53.0, 28.0, 25.0, 10.0, 12.0, 1.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9297759532928467, -1.8323655128479004, -1.734955072402954, -1.6375447511672974, -1.540134310722351, -1.4427238702774048, -1.345313549041748, -1.2479031085968018, -1.1504926681518555, -1.0530822277069092, -0.9556718468666077, -0.8582614660263062, -0.7608510255813599, -0.6634405851364136, -0.5660302042961121, -0.46861982345581055, -0.37120938301086426, -0.27379897236824036, -0.17638856172561646, -0.07897815108299255, 0.018432259559631348, 0.11584267020225525, 0.21325308084487915, 0.31066346168518066, 0.40807390213012695, 0.5054843425750732, 0.6028947234153748, 0.7003051042556763, 0.7977155447006226, 0.8951259851455688, 0.9925363659858704, 1.0899467468261719, 1.1873574256896973, 1.2847678661346436, 1.3821783065795898, 1.4795886278152466, 1.5769990682601929, 1.6744095087051392, 1.771819829940796, 1.8692302703857422, 1.9666407108306885, 2.0640511512756348, 2.161461591720581, 2.2588720321655273, 2.3562822341918945, 2.453692674636841, 2.551103115081787, 2.6485135555267334, 2.7459239959716797, 2.843334436416626, 2.9407448768615723, 3.0381553173065186, 3.135565757751465, 3.232975959777832, 3.3303864002227783, 3.4277968406677246, 3.525207281112671, 3.622617721557617, 3.7200281620025635, 3.8174386024475098, 3.914848804473877, 4.012259483337402, 4.1096696853637695, 4.207079887390137, 4.304490566253662]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 9.0, 5.0, 4.0, 11.0, 14.0, 21.0, 16.0, 38.0, 51.0, 59.0, 78.0, 85.0, 90.0, 89.0, 84.0, 65.0, 66.0, 42.0, 44.0, 32.0, 31.0, 21.0, 14.0, 13.0, 5.0, 7.0, 2.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.9620790481567383, -2.8868136405944824, -2.8115482330322266, -2.7362828254699707, -2.661017417907715, -2.585752010345459, -2.510486602783203, -2.435220956802368, -2.3599555492401123, -2.2846901416778564, -2.2094247341156006, -2.1341593265533447, -2.058893918991089, -1.9836283922195435, -1.9083629846572876, -1.8330974578857422, -1.7578321695327759, -1.68256676197052, -1.6073013544082642, -1.5320358276367188, -1.456770420074463, -1.381505012512207, -1.3062396049499512, -1.2309741973876953, -1.1557087898254395, -1.0804433822631836, -1.0051779747009277, -0.9299125075340271, -0.8546470403671265, -0.7793816328048706, -0.7041162252426147, -0.6288507580757141, -0.5535851716995239, -0.4783197343349457, -0.40305429697036743, -0.3277888894081116, -0.2525234520435333, -0.17725801467895508, -0.10199260711669922, -0.026727139949798584, 0.048538267612457275, 0.12380369752645493, 0.19906912744045258, 0.27433454990386963, 0.3495999872684479, 0.4248654246330261, 0.500130832195282, 0.5753962993621826, 0.6506617069244385, 0.7259271144866943, 0.801192581653595, 0.8764579892158508, 0.9517234563827515, 1.0269888639450073, 1.1022542715072632, 1.1775197982788086, 1.2527852058410645, 1.3280506134033203, 1.4033160209655762, 1.478581428527832, 1.5538469552993774, 1.6291123628616333, 1.7043777704238892, 1.7796432971954346, 1.8549085855484009]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 5.0, 15.0, 22.0, 18.0, 57.0, 83.0, 180.0, 453.0, 1308.0, 4412.0, 20735.0, 177501.0, 756125.0, 71941.0, 11362.0, 2756.0, 843.0, 364.0, 151.0, 81.0, 32.0, 27.0, 15.0, 9.0, 12.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55859375, -3.44122314453125, -3.3238525390625, -3.20648193359375, -3.089111328125, -2.97174072265625, -2.8543701171875, -2.73699951171875, -2.61962890625, -2.50225830078125, -2.3848876953125, -2.26751708984375, -2.150146484375, -2.03277587890625, -1.9154052734375, -1.79803466796875, -1.6806640625, -1.56329345703125, -1.4459228515625, -1.32855224609375, -1.211181640625, -1.09381103515625, -0.9764404296875, -0.85906982421875, -0.74169921875, -0.62432861328125, -0.5069580078125, -0.38958740234375, -0.272216796875, -0.15484619140625, -0.0374755859375, 0.07989501953125, 0.197265625, 0.31463623046875, 0.4320068359375, 0.54937744140625, 0.666748046875, 0.78411865234375, 0.9014892578125, 1.01885986328125, 1.13623046875, 1.25360107421875, 1.3709716796875, 1.48834228515625, 1.605712890625, 1.72308349609375, 1.8404541015625, 1.95782470703125, 2.0751953125, 2.19256591796875, 2.3099365234375, 2.42730712890625, 2.544677734375, 2.66204833984375, 2.7794189453125, 2.89678955078125, 3.01416015625, 3.13153076171875, 3.2489013671875, 3.36627197265625, 3.483642578125, 3.60101318359375, 3.7183837890625, 3.83575439453125, 3.953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 9.0, 20.0, 33.0, 78.0, 142.0, 176.0, 184.0, 151.0, 89.0, 57.0, 35.0, 19.0, 8.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-20.765625, -20.36798095703125, -19.9703369140625, -19.57269287109375, -19.175048828125, -18.77740478515625, -18.3797607421875, -17.98211669921875, -17.58447265625, -17.18682861328125, -16.7891845703125, -16.39154052734375, -15.993896484375, -15.59625244140625, -15.1986083984375, -14.80096435546875, -14.4033203125, -14.00567626953125, -13.6080322265625, -13.21038818359375, -12.812744140625, -12.41510009765625, -12.0174560546875, -11.61981201171875, -11.22216796875, -10.82452392578125, -10.4268798828125, -10.02923583984375, -9.631591796875, -9.23394775390625, -8.8363037109375, -8.43865966796875, -8.041015625, -7.64337158203125, -7.2457275390625, -6.84808349609375, -6.450439453125, -6.05279541015625, -5.6551513671875, -5.25750732421875, -4.85986328125, -4.46221923828125, -4.0645751953125, -3.66693115234375, -3.269287109375, -2.87164306640625, -2.4739990234375, -2.07635498046875, -1.6787109375, -1.28106689453125, -0.8834228515625, -0.48577880859375, -0.088134765625, 0.30950927734375, 0.7071533203125, 1.10479736328125, 1.50244140625, 1.90008544921875, 2.2977294921875, 2.69537353515625, 3.093017578125, 3.49066162109375, 3.8883056640625, 4.28594970703125, 4.68359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 7.0, 10.0, 7.0, 11.0, 22.0, 36.0, 51.0, 75.0, 113.0, 214.0, 350.0, 771.0, 1997.0, 7234.0, 47887.0, 756436.0, 208986.0, 18030.0, 3902.0, 1215.0, 510.0, 278.0, 159.0, 61.0, 56.0, 38.0, 38.0, 23.0, 10.0, 12.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.916015625, -2.82122802734375, -2.7264404296875, -2.63165283203125, -2.536865234375, -2.44207763671875, -2.3472900390625, -2.25250244140625, -2.15771484375, -2.06292724609375, -1.9681396484375, -1.87335205078125, -1.778564453125, -1.68377685546875, -1.5889892578125, -1.49420166015625, -1.3994140625, -1.30462646484375, -1.2098388671875, -1.11505126953125, -1.020263671875, -0.92547607421875, -0.8306884765625, -0.73590087890625, -0.64111328125, -0.54632568359375, -0.4515380859375, -0.35675048828125, -0.261962890625, -0.16717529296875, -0.0723876953125, 0.02239990234375, 0.1171875, 0.21197509765625, 0.3067626953125, 0.40155029296875, 0.496337890625, 0.59112548828125, 0.6859130859375, 0.78070068359375, 0.87548828125, 0.97027587890625, 1.0650634765625, 1.15985107421875, 1.254638671875, 1.34942626953125, 1.4442138671875, 1.53900146484375, 1.6337890625, 1.72857666015625, 1.8233642578125, 1.91815185546875, 2.012939453125, 2.10772705078125, 2.2025146484375, 2.29730224609375, 2.39208984375, 2.48687744140625, 2.5816650390625, 2.67645263671875, 2.771240234375, 2.86602783203125, 2.9608154296875, 3.05560302734375, 3.150390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 7.0, 10.0, 12.0, 17.0, 13.0, 17.0, 26.0, 30.0, 26.0, 26.0, 39.0, 38.0, 38.0, 31.0, 41.0, 38.0, 41.0, 37.0, 44.0, 45.0, 45.0, 38.0, 39.0, 36.0, 41.0, 32.0, 19.0, 26.0, 20.0, 18.0, 10.0, 11.0, 8.0, 13.0, 7.0, 8.0, 12.0, 5.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.1112060546875, -3.976318359375, -3.8414306640625, -3.70654296875, -3.5716552734375, -3.436767578125, -3.3018798828125, -3.1669921875, -3.0321044921875, -2.897216796875, -2.7623291015625, -2.62744140625, -2.4925537109375, -2.357666015625, -2.2227783203125, -2.087890625, -1.9530029296875, -1.818115234375, -1.6832275390625, -1.54833984375, -1.4134521484375, -1.278564453125, -1.1436767578125, -1.0087890625, -0.8739013671875, -0.739013671875, -0.6041259765625, -0.46923828125, -0.3343505859375, -0.199462890625, -0.0645751953125, 0.0703125, 0.2052001953125, 0.340087890625, 0.4749755859375, 0.60986328125, 0.7447509765625, 0.879638671875, 1.0145263671875, 1.1494140625, 1.2843017578125, 1.419189453125, 1.5540771484375, 1.68896484375, 1.8238525390625, 1.958740234375, 2.0936279296875, 2.228515625, 2.3634033203125, 2.498291015625, 2.6331787109375, 2.76806640625, 2.9029541015625, 3.037841796875, 3.1727294921875, 3.3076171875, 3.4425048828125, 3.577392578125, 3.7122802734375, 3.84716796875, 3.9820556640625, 4.116943359375, 4.2518310546875, 4.38671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 6.0, 4.0, 3.0, 4.0, 10.0, 14.0, 13.0, 14.0, 30.0, 34.0, 39.0, 74.0, 69.0, 108.0, 188.0, 244.0, 420.0, 611.0, 1065.0, 1843.0, 3390.0, 6355.0, 13637.0, 32414.0, 92517.0, 356980.0, 377154.0, 97465.0, 34458.0, 14420.0, 6752.0, 3328.0, 1849.0, 1075.0, 678.0, 430.0, 293.0, 175.0, 112.0, 83.0, 59.0, 49.0, 25.0, 19.0, 9.0, 14.0, 10.0, 7.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.427490234375, -0.4132499694824219, -0.39900970458984375, -0.3847694396972656, -0.3705291748046875, -0.3562889099121094, -0.34204864501953125, -0.3278083801269531, -0.313568115234375, -0.2993278503417969, -0.28508758544921875, -0.2708473205566406, -0.2566070556640625, -0.24236679077148438, -0.22812652587890625, -0.21388626098632812, -0.19964599609375, -0.18540573120117188, -0.17116546630859375, -0.15692520141601562, -0.1426849365234375, -0.12844467163085938, -0.11420440673828125, -0.09996414184570312, -0.085723876953125, -0.07148361206054688, -0.05724334716796875, -0.043003082275390625, -0.0287628173828125, -0.014522552490234375, -0.00028228759765625, 0.013957977294921875, 0.0281982421875, 0.042438507080078125, 0.05667877197265625, 0.07091903686523438, 0.0851593017578125, 0.09939956665039062, 0.11363983154296875, 0.12788009643554688, 0.142120361328125, 0.15636062622070312, 0.17060089111328125, 0.18484115600585938, 0.1990814208984375, 0.21332168579101562, 0.22756195068359375, 0.24180221557617188, 0.25604248046875, 0.2702827453613281, 0.28452301025390625, 0.2987632751464844, 0.3130035400390625, 0.3272438049316406, 0.34148406982421875, 0.3557243347167969, 0.369964599609375, 0.3842048645019531, 0.39844512939453125, 0.4126853942871094, 0.4269256591796875, 0.4411659240722656, 0.45540618896484375, 0.4696464538574219, 0.48388671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 3.0, 7.0, 3.0, 4.0, 9.0, 10.0, 17.0, 26.0, 29.0, 27.0, 34.0, 49.0, 58.0, 104.0, 105.0, 125.0, 97.0, 63.0, 48.0, 40.0, 31.0, 20.0, 14.0, 12.0, 13.0, 9.0, 10.0, 2.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00012373924255371094, -0.00011987611651420593, -0.00011601299047470093, -0.00011214986443519592, -0.00010828673839569092, -0.00010442361235618591, -0.00010056048631668091, -9.66973602771759e-05, -9.28342342376709e-05, -8.89711081981659e-05, -8.510798215866089e-05, -8.124485611915588e-05, -7.738173007965088e-05, -7.351860404014587e-05, -6.965547800064087e-05, -6.579235196113586e-05, -6.192922592163086e-05, -5.8066099882125854e-05, -5.420297384262085e-05, -5.0339847803115845e-05, -4.647672176361084e-05, -4.2613595724105835e-05, -3.875046968460083e-05, -3.4887343645095825e-05, -3.102421760559082e-05, -2.7161091566085815e-05, -2.329796552658081e-05, -1.9434839487075806e-05, -1.55717134475708e-05, -1.1708587408065796e-05, -7.845461368560791e-06, -3.982335329055786e-06, -1.1920928955078125e-07, 3.7439167499542236e-06, 7.6070427894592285e-06, 1.1470168828964233e-05, 1.5333294868469238e-05, 1.9196420907974243e-05, 2.3059546947479248e-05, 2.6922672986984253e-05, 3.078579902648926e-05, 3.464892506599426e-05, 3.851205110549927e-05, 4.237517714500427e-05, 4.623830318450928e-05, 5.010142922401428e-05, 5.396455526351929e-05, 5.782768130302429e-05, 6.16908073425293e-05, 6.55539333820343e-05, 6.94170594215393e-05, 7.328018546104431e-05, 7.714331150054932e-05, 8.100643754005432e-05, 8.486956357955933e-05, 8.873268961906433e-05, 9.259581565856934e-05, 9.645894169807434e-05, 0.00010032206773757935, 0.00010418519377708435, 0.00010804831981658936, 0.00011191144585609436, 0.00011577457189559937, 0.00011963769793510437, 0.00012350082397460938]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 2.0, 7.0, 14.0, 23.0, 22.0, 24.0, 60.0, 71.0, 117.0, 170.0, 273.0, 550.0, 888.0, 1853.0, 4104.0, 10722.0, 36693.0, 205627.0, 650645.0, 100163.0, 22547.0, 7681.0, 3059.0, 1374.0, 679.0, 427.0, 231.0, 170.0, 89.0, 66.0, 60.0, 25.0, 22.0, 29.0, 15.0, 10.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.70751953125, -0.6833877563476562, -0.6592559814453125, -0.6351242065429688, -0.610992431640625, -0.5868606567382812, -0.5627288818359375, -0.5385971069335938, -0.51446533203125, -0.49033355712890625, -0.4662017822265625, -0.44207000732421875, -0.417938232421875, -0.39380645751953125, -0.3696746826171875, -0.34554290771484375, -0.3214111328125, -0.29727935791015625, -0.2731475830078125, -0.24901580810546875, -0.224884033203125, -0.20075225830078125, -0.1766204833984375, -0.15248870849609375, -0.12835693359375, -0.10422515869140625, -0.0800933837890625, -0.05596160888671875, -0.031829833984375, -0.00769805908203125, 0.0164337158203125, 0.04056549072265625, 0.064697265625, 0.08882904052734375, 0.1129608154296875, 0.13709259033203125, 0.161224365234375, 0.18535614013671875, 0.2094879150390625, 0.23361968994140625, 0.25775146484375, 0.28188323974609375, 0.3060150146484375, 0.33014678955078125, 0.354278564453125, 0.37841033935546875, 0.4025421142578125, 0.42667388916015625, 0.4508056640625, 0.47493743896484375, 0.4990692138671875, 0.5232009887695312, 0.547332763671875, 0.5714645385742188, 0.5955963134765625, 0.6197280883789062, 0.64385986328125, 0.6679916381835938, 0.6921234130859375, 0.7162551879882812, 0.740386962890625, 0.7645187377929688, 0.7886505126953125, 0.8127822875976562, 0.8369140625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 6.0, 10.0, 11.0, 21.0, 17.0, 18.0, 25.0, 32.0, 35.0, 47.0, 63.0, 72.0, 101.0, 98.0, 82.0, 72.0, 49.0, 44.0, 40.0, 25.0, 17.0, 14.0, 14.0, 11.0, 15.0, 10.0, 9.0, 4.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36669921875, -0.3563041687011719, -0.34590911865234375, -0.3355140686035156, -0.3251190185546875, -0.3147239685058594, -0.30432891845703125, -0.2939338684082031, -0.283538818359375, -0.2731437683105469, -0.26274871826171875, -0.2523536682128906, -0.2419586181640625, -0.23156356811523438, -0.22116851806640625, -0.21077346801757812, -0.20037841796875, -0.18998336791992188, -0.17958831787109375, -0.16919326782226562, -0.1587982177734375, -0.14840316772460938, -0.13800811767578125, -0.12761306762695312, -0.117218017578125, -0.10682296752929688, -0.09642791748046875, -0.08603286743164062, -0.0756378173828125, -0.06524276733398438, -0.05484771728515625, -0.044452667236328125, -0.0340576171875, -0.023662567138671875, -0.01326751708984375, -0.002872467041015625, 0.0075225830078125, 0.017917633056640625, 0.02831268310546875, 0.038707733154296875, 0.049102783203125, 0.059497833251953125, 0.06989288330078125, 0.08028793334960938, 0.0906829833984375, 0.10107803344726562, 0.11147308349609375, 0.12186813354492188, 0.13226318359375, 0.14265823364257812, 0.15305328369140625, 0.16344833374023438, 0.1738433837890625, 0.18423843383789062, 0.19463348388671875, 0.20502853393554688, 0.215423583984375, 0.22581863403320312, 0.23621368408203125, 0.24660873413085938, 0.2570037841796875, 0.2673988342285156, 0.27779388427734375, 0.2881889343261719, 0.298583984375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 8.0, 12.0, 28.0, 94.0, 333.0, 365.0, 103.0, 33.0, 14.0, 5.0, 9.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.957146644592285, -10.350625991821289, -9.74410629272461, -9.137585639953613, -8.531065940856934, -7.9245452880859375, -7.3180251121521, -6.711504936218262, -6.104984760284424, -5.498464584350586, -4.891944408416748, -4.28542423248291, -3.678903818130493, -3.0723836421966553, -2.4658632278442383, -1.8593430519104004, -1.2528228759765625, -0.6463026404380798, -0.03978240489959717, 0.5667378902435303, 1.1732580661773682, 1.779778242111206, 2.386298656463623, 2.992818832397461, 3.599339008331299, 4.205859184265137, 4.812379360198975, 5.4188995361328125, 6.025420188903809, 6.631939888000488, 7.238460540771484, 7.844980716705322, 8.451499938964844, 9.05802059173584, 9.66454029083252, 10.271060943603516, 10.877580642700195, 11.484101295471191, 12.090621948242188, 12.697141647338867, 13.303661346435547, 13.910181999206543, 14.516701698303223, 15.123222351074219, 15.729742050170898, 16.336261749267578, 16.94278335571289, 17.54930305480957, 18.15582275390625, 18.76234245300293, 19.368864059448242, 19.975383758544922, 20.5819034576416, 21.18842315673828, 21.794944763183594, 22.401464462280273, 23.007986068725586, 23.614505767822266, 24.221027374267578, 24.827547073364258, 25.434066772460938, 26.040586471557617, 26.64710807800293, 27.25362777709961, 27.86014747619629]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 7.0, 13.0, 13.0, 18.0, 27.0, 30.0, 44.0, 45.0, 56.0, 59.0, 56.0, 71.0, 58.0, 71.0, 69.0, 52.0, 68.0, 38.0, 41.0, 43.0, 32.0, 23.0, 13.0, 12.0, 13.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.36768341064453, -17.93861198425293, -17.509538650512695, -17.080467224121094, -16.651395797729492, -16.222322463989258, -15.793251037597656, -15.364178657531738, -14.93510627746582, -14.506033897399902, -14.0769624710083, -13.647890090942383, -13.218817710876465, -12.789745330810547, -12.360673904418945, -11.931601524353027, -11.502530097961426, -11.073457717895508, -10.644386291503906, -10.215313911437988, -9.78624153137207, -9.357170104980469, -8.92809772491455, -8.499025344848633, -8.069953918457031, -7.6408820152282715, -7.2118096351623535, -6.782737731933594, -6.353665351867676, -5.924593448638916, -5.495521545410156, -5.066449165344238, -4.63737678527832, -4.2083048820495605, -3.7792325019836426, -3.350160598754883, -2.921088457107544, -2.492016315460205, -2.0629444122314453, -1.6338722705841064, -1.2048001289367676, -0.7757280468940735, -0.3466559648513794, 0.08241605758666992, 0.5114881992340088, 0.9405603408813477, 1.3696322441101074, 1.7987043857574463, 2.227776527404785, 2.656848669052124, 3.085920810699463, 3.5149927139282227, 3.9440648555755615, 4.3731369972229, 4.80220890045166, 5.231281280517578, 5.660353183746338, 6.089425086975098, 6.518497467041016, 6.947569370269775, 7.376641273498535, 7.805713653564453, 8.234785079956055, 8.663857460021973, 9.09292984008789]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 9.0, 16.0, 15.0, 25.0, 34.0, 53.0, 102.0, 135.0, 206.0, 376.0, 580.0, 1054.0, 2029.0, 4658.0, 12200.0, 48435.0, 549766.0, 3395785.0, 140877.0, 23619.0, 7532.0, 3136.0, 1537.0, 845.0, 455.0, 276.0, 186.0, 103.0, 75.0, 38.0, 59.0, 17.0, 17.0, 13.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.412109375, -3.303009033203125, -3.19390869140625, -3.084808349609375, -2.9757080078125, -2.866607666015625, -2.75750732421875, -2.648406982421875, -2.539306640625, -2.430206298828125, -2.32110595703125, -2.212005615234375, -2.1029052734375, -1.993804931640625, -1.88470458984375, -1.775604248046875, -1.66650390625, -1.557403564453125, -1.44830322265625, -1.339202880859375, -1.2301025390625, -1.121002197265625, -1.01190185546875, -0.902801513671875, -0.793701171875, -0.684600830078125, -0.57550048828125, -0.466400146484375, -0.3572998046875, -0.248199462890625, -0.13909912109375, -0.029998779296875, 0.0791015625, 0.188201904296875, 0.29730224609375, 0.406402587890625, 0.5155029296875, 0.624603271484375, 0.73370361328125, 0.842803955078125, 0.951904296875, 1.061004638671875, 1.17010498046875, 1.279205322265625, 1.3883056640625, 1.497406005859375, 1.60650634765625, 1.715606689453125, 1.82470703125, 1.933807373046875, 2.04290771484375, 2.152008056640625, 2.2611083984375, 2.370208740234375, 2.47930908203125, 2.588409423828125, 2.697509765625, 2.806610107421875, 2.91571044921875, 3.024810791015625, 3.1339111328125, 3.243011474609375, 3.35211181640625, 3.461212158203125, 3.5703125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 8.0, 7.0, 19.0, 12.0, 14.0, 15.0, 25.0, 39.0, 52.0, 66.0, 68.0, 81.0, 69.0, 75.0, 78.0, 61.0, 47.0, 35.0, 45.0, 33.0, 24.0, 25.0, 12.0, 9.0, 15.0, 19.0, 9.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02734375, -1.958282470703125, -1.88922119140625, -1.820159912109375, -1.7510986328125, -1.682037353515625, -1.61297607421875, -1.543914794921875, -1.474853515625, -1.405792236328125, -1.33673095703125, -1.267669677734375, -1.1986083984375, -1.129547119140625, -1.06048583984375, -0.991424560546875, -0.92236328125, -0.853302001953125, -0.78424072265625, -0.715179443359375, -0.6461181640625, -0.577056884765625, -0.50799560546875, -0.438934326171875, -0.369873046875, -0.300811767578125, -0.23175048828125, -0.162689208984375, -0.0936279296875, -0.024566650390625, 0.04449462890625, 0.113555908203125, 0.1826171875, 0.251678466796875, 0.32073974609375, 0.389801025390625, 0.4588623046875, 0.527923583984375, 0.59698486328125, 0.666046142578125, 0.735107421875, 0.804168701171875, 0.87322998046875, 0.942291259765625, 1.0113525390625, 1.080413818359375, 1.14947509765625, 1.218536376953125, 1.28759765625, 1.356658935546875, 1.42572021484375, 1.494781494140625, 1.5638427734375, 1.632904052734375, 1.70196533203125, 1.771026611328125, 1.840087890625, 1.909149169921875, 1.97821044921875, 2.047271728515625, 2.1163330078125, 2.185394287109375, 2.25445556640625, 2.323516845703125, 2.392578125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 14.0, 16.0, 31.0, 35.0, 45.0, 81.0, 149.0, 239.0, 421.0, 971.0, 2608.0, 9637.0, 64408.0, 3642105.0, 439564.0, 25731.0, 5095.0, 1579.0, 669.0, 348.0, 180.0, 105.0, 66.0, 45.0, 33.0, 24.0, 11.0, 13.0, 7.0, 7.0, 8.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.08551025390625, -3.9483642578125, -3.81121826171875, -3.674072265625, -3.53692626953125, -3.3997802734375, -3.26263427734375, -3.12548828125, -2.98834228515625, -2.8511962890625, -2.71405029296875, -2.576904296875, -2.43975830078125, -2.3026123046875, -2.16546630859375, -2.0283203125, -1.89117431640625, -1.7540283203125, -1.61688232421875, -1.479736328125, -1.34259033203125, -1.2054443359375, -1.06829833984375, -0.93115234375, -0.79400634765625, -0.6568603515625, -0.51971435546875, -0.382568359375, -0.24542236328125, -0.1082763671875, 0.02886962890625, 0.166015625, 0.30316162109375, 0.4403076171875, 0.57745361328125, 0.714599609375, 0.85174560546875, 0.9888916015625, 1.12603759765625, 1.26318359375, 1.40032958984375, 1.5374755859375, 1.67462158203125, 1.811767578125, 1.94891357421875, 2.0860595703125, 2.22320556640625, 2.3603515625, 2.49749755859375, 2.6346435546875, 2.77178955078125, 2.908935546875, 3.04608154296875, 3.1832275390625, 3.32037353515625, 3.45751953125, 3.59466552734375, 3.7318115234375, 3.86895751953125, 4.006103515625, 4.14324951171875, 4.2803955078125, 4.41754150390625, 4.5546875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 6.0, 10.0, 14.0, 11.0, 31.0, 20.0, 46.0, 55.0, 74.0, 88.0, 173.0, 283.0, 595.0, 1046.0, 653.0, 327.0, 184.0, 113.0, 82.0, 66.0, 47.0, 30.0, 30.0, 16.0, 13.0, 12.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66064453125, -0.6375045776367188, -0.6143646240234375, -0.5912246704101562, -0.568084716796875, -0.5449447631835938, -0.5218048095703125, -0.49866485595703125, -0.47552490234375, -0.45238494873046875, -0.4292449951171875, -0.40610504150390625, -0.382965087890625, -0.35982513427734375, -0.3366851806640625, -0.31354522705078125, -0.2904052734375, -0.26726531982421875, -0.2441253662109375, -0.22098541259765625, -0.197845458984375, -0.17470550537109375, -0.1515655517578125, -0.12842559814453125, -0.10528564453125, -0.08214569091796875, -0.0590057373046875, -0.03586578369140625, -0.012725830078125, 0.01041412353515625, 0.0335540771484375, 0.05669403076171875, 0.079833984375, 0.10297393798828125, 0.1261138916015625, 0.14925384521484375, 0.172393798828125, 0.19553375244140625, 0.2186737060546875, 0.24181365966796875, 0.26495361328125, 0.28809356689453125, 0.3112335205078125, 0.33437347412109375, 0.357513427734375, 0.38065338134765625, 0.4037933349609375, 0.42693328857421875, 0.4500732421875, 0.47321319580078125, 0.4963531494140625, 0.5194931030273438, 0.542633056640625, 0.5657730102539062, 0.5889129638671875, 0.6120529174804688, 0.63519287109375, 0.6583328247070312, 0.6814727783203125, 0.7046127319335938, 0.727752685546875, 0.7508926391601562, 0.7740325927734375, 0.7971725463867188, 0.8203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 8.0, 17.0, 24.0, 56.0, 84.0, 139.0, 190.0, 139.0, 104.0, 70.0, 37.0, 37.0, 15.0, 12.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.906198978424072, -4.765286922454834, -4.624375343322754, -4.483463287353516, -4.342551231384277, -4.201639652252197, -4.060727596282959, -3.9198157787323, -3.7789039611816406, -3.6379921436309814, -3.497080087661743, -3.356168270111084, -3.215256452560425, -3.0743446350097656, -2.9334325790405273, -2.792520761489868, -2.65160870552063, -2.5106968879699707, -2.3697848320007324, -2.2288730144500732, -2.087961196899414, -1.9470492601394653, -1.8061373233795166, -1.6652255058288574, -1.5243135690689087, -1.38340163230896, -1.2424898147583008, -1.101577877998352, -0.9606660008430481, -0.8197541236877441, -0.6788421869277954, -0.5379303097724915, -0.3970184326171875, -0.25610655546188354, -0.1151946485042572, 0.02571725845336914, 0.1666291356086731, 0.30754101276397705, 0.4484529495239258, 0.5893648266792297, 0.7302767038345337, 0.8711885809898376, 1.0121004581451416, 1.1530123949050903, 1.293924331665039, 1.4348361492156982, 1.575748085975647, 1.7166600227355957, 1.8575718402862549, 1.9984837770462036, 2.1393957138061523, 2.2803075313568115, 2.4212193489074707, 2.562131404876709, 2.703043222427368, 2.8439550399780273, 2.9848670959472656, 3.125778913497925, 3.266690969467163, 3.4076027870178223, 3.5485146045684814, 3.6894264221191406, 3.830338478088379, 3.971250295639038, 4.112162113189697]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 5.0, 7.0, 13.0, 20.0, 18.0, 14.0, 17.0, 37.0, 40.0, 27.0, 45.0, 40.0, 53.0, 53.0, 61.0, 65.0, 61.0, 41.0, 51.0, 49.0, 43.0, 24.0, 31.0, 36.0, 23.0, 15.0, 15.0, 18.0, 13.0, 9.0, 9.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7863608598709106, -1.7207067012786865, -1.6550525426864624, -1.5893983840942383, -1.5237441062927246, -1.4580899477005005, -1.3924357891082764, -1.3267816305160522, -1.2611274719238281, -1.195473313331604, -1.1298191547393799, -1.0641648769378662, -0.9985107183456421, -0.932856559753418, -0.8672024011611938, -0.8015482425689697, -0.735893964767456, -0.6702398061752319, -0.604585587978363, -0.5389314293861389, -0.4732772409915924, -0.4076230525970459, -0.3419688940048218, -0.27631470561027527, -0.21066051721572876, -0.14500632882118225, -0.07935215532779694, -0.013697981834411621, 0.05195620656013489, 0.1176103949546814, 0.18326455354690552, 0.24891874194145203, 0.3145730495452881, 0.3802272379398346, 0.4458814263343811, 0.5115355849266052, 0.5771898031234741, 0.6428439617156982, 0.7084981203079224, 0.7741522789001465, 0.8398064970970154, 0.9054606556892395, 0.9711148738861084, 1.0367690324783325, 1.1024231910705566, 1.1680774688720703, 1.2337315082550049, 1.2993857860565186, 1.3650399446487427, 1.4306941032409668, 1.496348261833191, 1.562002420425415, 1.6276566982269287, 1.6933108568191528, 1.758965015411377, 1.824619174003601, 1.8902733325958252, 1.9559274911880493, 2.0215816497802734, 2.087235927581787, 2.1528899669647217, 2.2185442447662354, 2.28419828414917, 2.3498525619506836, 2.4155068397521973]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 5.0, 13.0, 17.0, 28.0, 38.0, 57.0, 84.0, 137.0, 249.0, 431.0, 719.0, 1341.0, 2669.0, 5740.0, 13176.0, 33859.0, 98176.0, 284134.0, 369496.0, 152609.0, 50918.0, 19028.0, 7936.0, 3647.0, 1834.0, 959.0, 499.0, 288.0, 193.0, 122.0, 65.0, 32.0, 11.0, 16.0, 11.0, 11.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2335205078125, -0.22669219970703125, -0.2198638916015625, -0.21303558349609375, -0.206207275390625, -0.19937896728515625, -0.1925506591796875, -0.18572235107421875, -0.17889404296875, -0.17206573486328125, -0.1652374267578125, -0.15840911865234375, -0.151580810546875, -0.14475250244140625, -0.1379241943359375, -0.13109588623046875, -0.124267578125, -0.11743927001953125, -0.1106109619140625, -0.10378265380859375, -0.096954345703125, -0.09012603759765625, -0.0832977294921875, -0.07646942138671875, -0.06964111328125, -0.06281280517578125, -0.0559844970703125, -0.04915618896484375, -0.042327880859375, -0.03549957275390625, -0.0286712646484375, -0.02184295654296875, -0.0150146484375, -0.00818634033203125, -0.0013580322265625, 0.00547027587890625, 0.012298583984375, 0.01912689208984375, 0.0259552001953125, 0.03278350830078125, 0.03961181640625, 0.04644012451171875, 0.0532684326171875, 0.06009674072265625, 0.066925048828125, 0.07375335693359375, 0.0805816650390625, 0.08740997314453125, 0.09423828125, 0.10106658935546875, 0.1078948974609375, 0.11472320556640625, 0.121551513671875, 0.12837982177734375, 0.1352081298828125, 0.14203643798828125, 0.14886474609375, 0.15569305419921875, 0.1625213623046875, 0.16934967041015625, 0.176177978515625, 0.18300628662109375, 0.1898345947265625, 0.19666290283203125, 0.2034912109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 10.0, 6.0, 16.0, 21.0, 17.0, 26.0, 30.0, 42.0, 43.0, 64.0, 66.0, 76.0, 83.0, 55.0, 66.0, 53.0, 61.0, 46.0, 35.0, 29.0, 32.0, 25.0, 22.0, 10.0, 9.0, 13.0, 13.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.5955963134765625, -1.540802001953125, -1.4860076904296875, -1.43121337890625, -1.3764190673828125, -1.321624755859375, -1.2668304443359375, -1.2120361328125, -1.1572418212890625, -1.102447509765625, -1.0476531982421875, -0.99285888671875, -0.9380645751953125, -0.883270263671875, -0.8284759521484375, -0.773681640625, -0.7188873291015625, -0.664093017578125, -0.6092987060546875, -0.55450439453125, -0.4997100830078125, -0.444915771484375, -0.3901214599609375, -0.3353271484375, -0.2805328369140625, -0.225738525390625, -0.1709442138671875, -0.11614990234375, -0.0613555908203125, -0.006561279296875, 0.0482330322265625, 0.10302734375, 0.1578216552734375, 0.212615966796875, 0.2674102783203125, 0.32220458984375, 0.3769989013671875, 0.431793212890625, 0.4865875244140625, 0.5413818359375, 0.5961761474609375, 0.650970458984375, 0.7057647705078125, 0.76055908203125, 0.8153533935546875, 0.870147705078125, 0.9249420166015625, 0.979736328125, 1.0345306396484375, 1.089324951171875, 1.1441192626953125, 1.19891357421875, 1.2537078857421875, 1.308502197265625, 1.3632965087890625, 1.4180908203125, 1.4728851318359375, 1.527679443359375, 1.5824737548828125, 1.63726806640625, 1.6920623779296875, 1.746856689453125, 1.8016510009765625, 1.8564453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 13.0, 9.0, 19.0, 24.0, 38.0, 40.0, 63.0, 98.0, 154.0, 180.0, 310.0, 530.0, 1021.0, 2294.0, 5874.0, 18895.0, 73060.0, 270229.0, 432472.0, 176810.0, 45570.0, 12695.0, 4209.0, 1778.0, 824.0, 468.0, 253.0, 177.0, 131.0, 75.0, 78.0, 36.0, 31.0, 27.0, 17.0, 13.0, 7.0, 4.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.261962890625, -0.2541027069091797, -0.24624252319335938, -0.23838233947753906, -0.23052215576171875, -0.22266197204589844, -0.21480178833007812, -0.2069416046142578, -0.1990814208984375, -0.1912212371826172, -0.18336105346679688, -0.17550086975097656, -0.16764068603515625, -0.15978050231933594, -0.15192031860351562, -0.1440601348876953, -0.136199951171875, -0.1283397674560547, -0.12047958374023438, -0.11261940002441406, -0.10475921630859375, -0.09689903259277344, -0.08903884887695312, -0.08117866516113281, -0.0733184814453125, -0.06545829772949219, -0.057598114013671875, -0.04973793029785156, -0.04187774658203125, -0.03401756286621094, -0.026157379150390625, -0.018297195434570312, -0.01043701171875, -0.0025768280029296875, 0.005283355712890625, 0.013143539428710938, 0.02100372314453125, 0.028863906860351562, 0.036724090576171875, 0.04458427429199219, 0.0524444580078125, 0.06030464172363281, 0.06816482543945312, 0.07602500915527344, 0.08388519287109375, 0.09174537658691406, 0.09960556030273438, 0.10746574401855469, 0.115325927734375, 0.12318611145019531, 0.13104629516601562, 0.13890647888183594, 0.14676666259765625, 0.15462684631347656, 0.16248703002929688, 0.1703472137451172, 0.1782073974609375, 0.1860675811767578, 0.19392776489257812, 0.20178794860839844, 0.20964813232421875, 0.21750831604003906, 0.22536849975585938, 0.2332286834716797, 0.2410888671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 4.0, 3.0, 5.0, 10.0, 4.0, 10.0, 16.0, 20.0, 13.0, 20.0, 24.0, 32.0, 26.0, 39.0, 46.0, 54.0, 54.0, 51.0, 64.0, 60.0, 58.0, 38.0, 39.0, 44.0, 45.0, 30.0, 28.0, 31.0, 33.0, 18.0, 18.0, 11.0, 10.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.181640625, -3.088714599609375, -2.99578857421875, -2.902862548828125, -2.8099365234375, -2.717010498046875, -2.62408447265625, -2.531158447265625, -2.438232421875, -2.345306396484375, -2.25238037109375, -2.159454345703125, -2.0665283203125, -1.973602294921875, -1.88067626953125, -1.787750244140625, -1.69482421875, -1.601898193359375, -1.50897216796875, -1.416046142578125, -1.3231201171875, -1.230194091796875, -1.13726806640625, -1.044342041015625, -0.951416015625, -0.858489990234375, -0.76556396484375, -0.672637939453125, -0.5797119140625, -0.486785888671875, -0.39385986328125, -0.300933837890625, -0.2080078125, -0.115081787109375, -0.02215576171875, 0.070770263671875, 0.1636962890625, 0.256622314453125, 0.34954833984375, 0.442474365234375, 0.535400390625, 0.628326416015625, 0.72125244140625, 0.814178466796875, 0.9071044921875, 1.000030517578125, 1.09295654296875, 1.185882568359375, 1.27880859375, 1.371734619140625, 1.46466064453125, 1.557586669921875, 1.6505126953125, 1.743438720703125, 1.83636474609375, 1.929290771484375, 2.022216796875, 2.115142822265625, 2.20806884765625, 2.300994873046875, 2.3939208984375, 2.486846923828125, 2.57977294921875, 2.672698974609375, 2.765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 13.0, 29.0, 34.0, 33.0, 92.0, 117.0, 190.0, 394.0, 656.0, 1373.0, 3350.0, 10500.0, 74894.0, 775706.0, 157590.0, 15696.0, 4314.0, 1695.0, 822.0, 422.0, 220.0, 131.0, 78.0, 59.0, 42.0, 16.0, 17.0, 14.0, 10.0, 4.0, 7.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.167236328125, -0.1615924835205078, -0.15594863891601562, -0.15030479431152344, -0.14466094970703125, -0.13901710510253906, -0.13337326049804688, -0.1277294158935547, -0.1220855712890625, -0.11644172668457031, -0.11079788208007812, -0.10515403747558594, -0.09951019287109375, -0.09386634826660156, -0.08822250366210938, -0.08257865905761719, -0.076934814453125, -0.07129096984863281, -0.06564712524414062, -0.06000328063964844, -0.05435943603515625, -0.04871559143066406, -0.043071746826171875, -0.03742790222167969, -0.0317840576171875, -0.026140213012695312, -0.020496368408203125, -0.014852523803710938, -0.00920867919921875, -0.0035648345947265625, 0.002079010009765625, 0.0077228546142578125, 0.01336669921875, 0.019010543823242188, 0.024654388427734375, 0.030298233032226562, 0.03594207763671875, 0.04158592224121094, 0.047229766845703125, 0.05287361145019531, 0.0585174560546875, 0.06416130065917969, 0.06980514526367188, 0.07544898986816406, 0.08109283447265625, 0.08673667907714844, 0.09238052368164062, 0.09802436828613281, 0.103668212890625, 0.10931205749511719, 0.11495590209960938, 0.12059974670410156, 0.12624359130859375, 0.13188743591308594, 0.13753128051757812, 0.1431751251220703, 0.1488189697265625, 0.1544628143310547, 0.16010665893554688, 0.16575050354003906, 0.17139434814453125, 0.17703819274902344, 0.18268203735351562, 0.1883258819580078, 0.1939697265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 10.0, 2.0, 15.0, 18.0, 28.0, 55.0, 103.0, 212.0, 252.0, 164.0, 77.0, 30.0, 14.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001590251922607422, -0.00015451014041900635, -0.0001499950885772705, -0.00014548003673553467, -0.00014096498489379883, -0.000136449933052063, -0.00013193488121032715, -0.0001274198293685913, -0.00012290477752685547, -0.00011838972568511963, -0.00011387467384338379, -0.00010935962200164795, -0.00010484457015991211, -0.00010032951831817627, -9.581446647644043e-05, -9.129941463470459e-05, -8.678436279296875e-05, -8.226931095123291e-05, -7.775425910949707e-05, -7.323920726776123e-05, -6.872415542602539e-05, -6.420910358428955e-05, -5.969405174255371e-05, -5.517899990081787e-05, -5.066394805908203e-05, -4.614889621734619e-05, -4.163384437561035e-05, -3.711879253387451e-05, -3.260374069213867e-05, -2.8088688850402832e-05, -2.3573637008666992e-05, -1.9058585166931152e-05, -1.4543533325195312e-05, -1.0028481483459473e-05, -5.513429641723633e-06, -9.98377799987793e-07, 3.516674041748047e-06, 8.031725883483887e-06, 1.2546777725219727e-05, 1.7061829566955566e-05, 2.1576881408691406e-05, 2.6091933250427246e-05, 3.0606985092163086e-05, 3.5122036933898926e-05, 3.9637088775634766e-05, 4.4152140617370605e-05, 4.8667192459106445e-05, 5.3182244300842285e-05, 5.7697296142578125e-05, 6.221234798431396e-05, 6.67273998260498e-05, 7.124245166778564e-05, 7.575750350952148e-05, 8.027255535125732e-05, 8.478760719299316e-05, 8.9302659034729e-05, 9.381771087646484e-05, 9.833276271820068e-05, 0.00010284781455993652, 0.00010736286640167236, 0.0001118779182434082, 0.00011639297008514404, 0.00012090802192687988, 0.00012542307376861572, 0.00012993812561035156]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 12.0, 11.0, 23.0, 23.0, 29.0, 45.0, 67.0, 101.0, 120.0, 207.0, 336.0, 599.0, 1248.0, 3188.0, 9822.0, 58798.0, 736624.0, 208219.0, 20139.0, 5098.0, 1832.0, 839.0, 390.0, 268.0, 135.0, 113.0, 71.0, 52.0, 31.0, 28.0, 23.0, 16.0, 8.0, 10.0, 6.0, 5.0, 8.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.209228515625, -0.20337295532226562, -0.19751739501953125, -0.19166183471679688, -0.1858062744140625, -0.17995071411132812, -0.17409515380859375, -0.16823959350585938, -0.162384033203125, -0.15652847290039062, -0.15067291259765625, -0.14481735229492188, -0.1389617919921875, -0.13310623168945312, -0.12725067138671875, -0.12139511108398438, -0.11553955078125, -0.10968399047851562, -0.10382843017578125, -0.09797286987304688, -0.0921173095703125, -0.08626174926757812, -0.08040618896484375, -0.07455062866210938, -0.068695068359375, -0.06283950805664062, -0.05698394775390625, -0.051128387451171875, -0.0452728271484375, -0.039417266845703125, -0.03356170654296875, -0.027706146240234375, -0.0218505859375, -0.015995025634765625, -0.01013946533203125, -0.004283905029296875, 0.0015716552734375, 0.007427215576171875, 0.01328277587890625, 0.019138336181640625, 0.024993896484375, 0.030849456787109375, 0.03670501708984375, 0.042560577392578125, 0.0484161376953125, 0.054271697998046875, 0.06012725830078125, 0.06598281860351562, 0.07183837890625, 0.07769393920898438, 0.08354949951171875, 0.08940505981445312, 0.0952606201171875, 0.10111618041992188, 0.10697174072265625, 0.11282730102539062, 0.118682861328125, 0.12453842163085938, 0.13039398193359375, 0.13624954223632812, 0.1421051025390625, 0.14796066284179688, 0.15381622314453125, 0.15967178344726562, 0.16552734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 5.0, 14.0, 12.0, 22.0, 24.0, 43.0, 40.0, 72.0, 101.0, 112.0, 120.0, 94.0, 84.0, 52.0, 48.0, 32.0, 33.0, 12.0, 14.0, 16.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03656005859375, -0.03555583953857422, -0.03455162048339844, -0.033547401428222656, -0.032543182373046875, -0.031538963317871094, -0.030534744262695312, -0.02953052520751953, -0.02852630615234375, -0.02752208709716797, -0.026517868041992188, -0.025513648986816406, -0.024509429931640625, -0.023505210876464844, -0.022500991821289062, -0.02149677276611328, -0.0204925537109375, -0.01948833465576172, -0.018484115600585938, -0.017479896545410156, -0.016475677490234375, -0.015471458435058594, -0.014467239379882812, -0.013463020324707031, -0.01245880126953125, -0.011454582214355469, -0.010450363159179688, -0.009446144104003906, -0.008441925048828125, -0.007437705993652344, -0.0064334869384765625, -0.005429267883300781, -0.004425048828125, -0.0034208297729492188, -0.0024166107177734375, -0.0014123916625976562, -0.000408172607421875, 0.0005960464477539062, 0.0016002655029296875, 0.0026044845581054688, 0.00360870361328125, 0.004612922668457031, 0.0056171417236328125, 0.006621360778808594, 0.007625579833984375, 0.008629798889160156, 0.009634017944335938, 0.010638236999511719, 0.0116424560546875, 0.012646675109863281, 0.013650894165039062, 0.014655113220214844, 0.015659332275390625, 0.016663551330566406, 0.017667770385742188, 0.01867198944091797, 0.01967620849609375, 0.02068042755126953, 0.021684646606445312, 0.022688865661621094, 0.023693084716796875, 0.024697303771972656, 0.025701522827148438, 0.02670574188232422, 0.0277099609375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 10.0, 13.0, 24.0, 32.0, 115.0, 266.0, 285.0, 128.0, 58.0, 27.0, 13.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.100545883178711, -3.9370317459106445, -3.773517608642578, -3.6100034713745117, -3.4464893341064453, -3.282975196838379, -3.1194610595703125, -2.955946922302246, -2.7924327850341797, -2.6289186477661133, -2.465404510498047, -2.3018903732299805, -2.138376235961914, -1.9748620986938477, -1.8113479614257812, -1.6478338241577148, -1.4843196868896484, -1.320805549621582, -1.1572914123535156, -0.9937772750854492, -0.8302631378173828, -0.6667490005493164, -0.50323486328125, -0.3397207260131836, -0.1762065887451172, -0.012692451477050781, 0.15082168579101562, 0.31433582305908203, 0.47784996032714844, 0.6413640975952148, 0.8048782348632812, 0.9683923721313477, 1.1319069862365723, 1.2954211235046387, 1.458935260772705, 1.6224493980407715, 1.785963535308838, 1.9494776725769043, 2.1129918098449707, 2.276505947113037, 2.4400200843811035, 2.60353422164917, 2.7670483589172363, 2.9305624961853027, 3.094076633453369, 3.2575907707214355, 3.421104907989502, 3.5846190452575684, 3.7481331825256348, 3.911647319793701, 4.075161457061768, 4.238675594329834, 4.4021897315979, 4.565703868865967, 4.729218006134033, 4.8927321434021, 5.056246280670166, 5.219760417938232, 5.383274555206299, 5.546788692474365, 5.710302829742432, 5.873816967010498, 6.0373311042785645, 6.200845241546631, 6.364359378814697]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 12.0, 17.0, 16.0, 28.0, 29.0, 35.0, 50.0, 60.0, 54.0, 67.0, 82.0, 86.0, 72.0, 73.0, 60.0, 38.0, 34.0, 40.0, 30.0, 23.0, 10.0, 11.0, 13.0, 9.0, 6.0, 10.0, 6.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6169227361679077, -1.5615910291671753, -1.5062594413757324, -1.450927734375, -1.3955961465835571, -1.3402644395828247, -1.2849328517913818, -1.2296011447906494, -1.174269437789917, -1.1189377307891846, -1.0636061429977417, -1.0082744359970093, -0.9529428482055664, -0.897611141204834, -0.8422794938087463, -0.7869478464126587, -0.7316162586212158, -0.6762846112251282, -0.6209529638290405, -0.5656212568283081, -0.5102896690368652, -0.4549579918384552, -0.39962631464004517, -0.3442946672439575, -0.2889630198478699, -0.23363137245178223, -0.1782997101545334, -0.12296804785728455, -0.0676364004611969, -0.012304753065109253, 0.04302692413330078, 0.09835857152938843, 0.15369033813476562, 0.20902198553085327, 0.2643536329269409, 0.31968531012535095, 0.3750169575214386, 0.43034860491752625, 0.4856802821159363, 0.5410119295120239, 0.5963435769081116, 0.6516752243041992, 0.7070068717002869, 0.7623385190963745, 0.8176702260971069, 0.8730018138885498, 0.9283335208892822, 0.9836651682853699, 1.0389968156814575, 1.09432852268219, 1.1496601104736328, 1.2049918174743652, 1.260323405265808, 1.3156551122665405, 1.3709867000579834, 1.4263184070587158, 1.4816501140594482, 1.5369818210601807, 1.5923134088516235, 1.647645115852356, 1.7029767036437988, 1.7583084106445312, 1.8136401176452637, 1.8689717054367065, 1.9243032932281494]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 11.0, 19.0, 13.0, 25.0, 35.0, 51.0, 83.0, 100.0, 143.0, 235.0, 359.0, 565.0, 835.0, 1442.0, 2433.0, 4662.0, 9154.0, 20178.0, 53350.0, 194108.0, 528481.0, 151479.0, 44947.0, 17543.0, 8204.0, 4141.0, 2195.0, 1354.0, 849.0, 505.0, 349.0, 200.0, 145.0, 100.0, 88.0, 49.0, 34.0, 22.0, 14.0, 11.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1552734375, -1.1172943115234375, -1.079315185546875, -1.0413360595703125, -1.00335693359375, -0.9653778076171875, -0.927398681640625, -0.8894195556640625, -0.8514404296875, -0.8134613037109375, -0.775482177734375, -0.7375030517578125, -0.69952392578125, -0.6615447998046875, -0.623565673828125, -0.5855865478515625, -0.547607421875, -0.5096282958984375, -0.471649169921875, -0.4336700439453125, -0.39569091796875, -0.3577117919921875, -0.319732666015625, -0.2817535400390625, -0.2437744140625, -0.2057952880859375, -0.167816162109375, -0.1298370361328125, -0.09185791015625, -0.0538787841796875, -0.015899658203125, 0.0220794677734375, 0.06005859375, 0.0980377197265625, 0.136016845703125, 0.1739959716796875, 0.21197509765625, 0.2499542236328125, 0.287933349609375, 0.3259124755859375, 0.3638916015625, 0.4018707275390625, 0.439849853515625, 0.4778289794921875, 0.51580810546875, 0.5537872314453125, 0.591766357421875, 0.6297454833984375, 0.667724609375, 0.7057037353515625, 0.743682861328125, 0.7816619873046875, 0.81964111328125, 0.8576202392578125, 0.895599365234375, 0.9335784912109375, 0.9715576171875, 1.0095367431640625, 1.047515869140625, 1.0854949951171875, 1.12347412109375, 1.1614532470703125, 1.199432373046875, 1.2374114990234375, 1.275390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 7.0, 2.0, 10.0, 10.0, 22.0, 24.0, 28.0, 38.0, 35.0, 40.0, 56.0, 63.0, 68.0, 85.0, 80.0, 71.0, 54.0, 57.0, 53.0, 33.0, 32.0, 25.0, 24.0, 17.0, 14.0, 9.0, 6.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.817901611328125, -3.67681884765625, -3.535736083984375, -3.3946533203125, -3.253570556640625, -3.11248779296875, -2.971405029296875, -2.830322265625, -2.689239501953125, -2.54815673828125, -2.407073974609375, -2.2659912109375, -2.124908447265625, -1.98382568359375, -1.842742919921875, -1.70166015625, -1.560577392578125, -1.41949462890625, -1.278411865234375, -1.1373291015625, -0.996246337890625, -0.85516357421875, -0.714080810546875, -0.572998046875, -0.431915283203125, -0.29083251953125, -0.149749755859375, -0.0086669921875, 0.132415771484375, 0.27349853515625, 0.414581298828125, 0.5556640625, 0.696746826171875, 0.83782958984375, 0.978912353515625, 1.1199951171875, 1.261077880859375, 1.40216064453125, 1.543243408203125, 1.684326171875, 1.825408935546875, 1.96649169921875, 2.107574462890625, 2.2486572265625, 2.389739990234375, 2.53082275390625, 2.671905517578125, 2.81298828125, 2.954071044921875, 3.09515380859375, 3.236236572265625, 3.3773193359375, 3.518402099609375, 3.65948486328125, 3.800567626953125, 3.941650390625, 4.082733154296875, 4.22381591796875, 4.364898681640625, 4.5059814453125, 4.647064208984375, 4.78814697265625, 4.929229736328125, 5.0703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 12.0, 21.0, 26.0, 40.0, 51.0, 71.0, 109.0, 193.0, 346.0, 580.0, 1158.0, 2592.0, 6358.0, 20128.0, 94393.0, 662087.0, 210294.0, 33664.0, 9460.0, 3561.0, 1540.0, 747.0, 409.0, 210.0, 157.0, 94.0, 65.0, 40.0, 29.0, 23.0, 16.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.26171875, -1.217742919921875, -1.17376708984375, -1.129791259765625, -1.0858154296875, -1.041839599609375, -0.99786376953125, -0.953887939453125, -0.909912109375, -0.865936279296875, -0.82196044921875, -0.777984619140625, -0.7340087890625, -0.690032958984375, -0.64605712890625, -0.602081298828125, -0.55810546875, -0.514129638671875, -0.47015380859375, -0.426177978515625, -0.3822021484375, -0.338226318359375, -0.29425048828125, -0.250274658203125, -0.206298828125, -0.162322998046875, -0.11834716796875, -0.074371337890625, -0.0303955078125, 0.013580322265625, 0.05755615234375, 0.101531982421875, 0.1455078125, 0.189483642578125, 0.23345947265625, 0.277435302734375, 0.3214111328125, 0.365386962890625, 0.40936279296875, 0.453338623046875, 0.497314453125, 0.541290283203125, 0.58526611328125, 0.629241943359375, 0.6732177734375, 0.717193603515625, 0.76116943359375, 0.805145263671875, 0.84912109375, 0.893096923828125, 0.93707275390625, 0.981048583984375, 1.0250244140625, 1.069000244140625, 1.11297607421875, 1.156951904296875, 1.200927734375, 1.244903564453125, 1.28887939453125, 1.332855224609375, 1.3768310546875, 1.420806884765625, 1.46478271484375, 1.508758544921875, 1.552734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 7.0, 12.0, 6.0, 11.0, 11.0, 10.0, 15.0, 19.0, 19.0, 28.0, 36.0, 29.0, 36.0, 48.0, 43.0, 37.0, 50.0, 42.0, 42.0, 45.0, 47.0, 41.0, 39.0, 41.0, 34.0, 31.0, 40.0, 33.0, 30.0, 19.0, 16.0, 17.0, 11.0, 8.0, 13.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.1729736328125, -4.041259765625, -3.9095458984375, -3.77783203125, -3.6461181640625, -3.514404296875, -3.3826904296875, -3.2509765625, -3.1192626953125, -2.987548828125, -2.8558349609375, -2.72412109375, -2.5924072265625, -2.460693359375, -2.3289794921875, -2.197265625, -2.0655517578125, -1.933837890625, -1.8021240234375, -1.67041015625, -1.5386962890625, -1.406982421875, -1.2752685546875, -1.1435546875, -1.0118408203125, -0.880126953125, -0.7484130859375, -0.61669921875, -0.4849853515625, -0.353271484375, -0.2215576171875, -0.08984375, 0.0418701171875, 0.173583984375, 0.3052978515625, 0.43701171875, 0.5687255859375, 0.700439453125, 0.8321533203125, 0.9638671875, 1.0955810546875, 1.227294921875, 1.3590087890625, 1.49072265625, 1.6224365234375, 1.754150390625, 1.8858642578125, 2.017578125, 2.1492919921875, 2.281005859375, 2.4127197265625, 2.54443359375, 2.6761474609375, 2.807861328125, 2.9395751953125, 3.0712890625, 3.2030029296875, 3.334716796875, 3.4664306640625, 3.59814453125, 3.7298583984375, 3.861572265625, 3.9932861328125, 4.125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 11.0, 18.0, 39.0, 44.0, 125.0, 308.0, 1245.0, 9409.0, 481812.0, 543592.0, 10184.0, 1223.0, 330.0, 107.0, 52.0, 17.0, 15.0, 9.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.583984375, -1.5443954467773438, -1.5048065185546875, -1.4652175903320312, -1.425628662109375, -1.3860397338867188, -1.3464508056640625, -1.3068618774414062, -1.26727294921875, -1.2276840209960938, -1.1880950927734375, -1.1485061645507812, -1.108917236328125, -1.0693283081054688, -1.0297393798828125, -0.9901504516601562, -0.9505615234375, -0.9109725952148438, -0.8713836669921875, -0.8317947387695312, -0.792205810546875, -0.7526168823242188, -0.7130279541015625, -0.6734390258789062, -0.63385009765625, -0.5942611694335938, -0.5546722412109375, -0.5150833129882812, -0.475494384765625, -0.43590545654296875, -0.3963165283203125, -0.35672760009765625, -0.317138671875, -0.27754974365234375, -0.2379608154296875, -0.19837188720703125, -0.158782958984375, -0.11919403076171875, -0.0796051025390625, -0.04001617431640625, -0.00042724609375, 0.03916168212890625, 0.0787506103515625, 0.11833953857421875, 0.157928466796875, 0.19751739501953125, 0.2371063232421875, 0.27669525146484375, 0.3162841796875, 0.35587310791015625, 0.3954620361328125, 0.43505096435546875, 0.474639892578125, 0.5142288208007812, 0.5538177490234375, 0.5934066772460938, 0.63299560546875, 0.6725845336914062, 0.7121734619140625, 0.7517623901367188, 0.791351318359375, 0.8309402465820312, 0.8705291748046875, 0.9101181030273438, 0.94970703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 13.0, 28.0, 66.0, 110.0, 228.0, 232.0, 116.0, 78.0, 38.0, 28.0, 18.0, 14.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001556873321533203, -0.00015014410018920898, -0.00014460086822509766, -0.00013905763626098633, -0.000133514404296875, -0.00012797117233276367, -0.00012242794036865234, -0.00011688470840454102, -0.00011134147644042969, -0.00010579824447631836, -0.00010025501251220703, -9.47117805480957e-05, -8.916854858398438e-05, -8.362531661987305e-05, -7.808208465576172e-05, -7.253885269165039e-05, -6.699562072753906e-05, -6.145238876342773e-05, -5.5909156799316406e-05, -5.036592483520508e-05, -4.482269287109375e-05, -3.927946090698242e-05, -3.3736228942871094e-05, -2.8192996978759766e-05, -2.2649765014648438e-05, -1.710653305053711e-05, -1.1563301086425781e-05, -6.020069122314453e-06, -4.76837158203125e-07, 5.066394805908203e-06, 1.0609626770019531e-05, 1.615285873413086e-05, 2.1696090698242188e-05, 2.7239322662353516e-05, 3.2782554626464844e-05, 3.832578659057617e-05, 4.38690185546875e-05, 4.941225051879883e-05, 5.4955482482910156e-05, 6.0498714447021484e-05, 6.604194641113281e-05, 7.158517837524414e-05, 7.712841033935547e-05, 8.26716423034668e-05, 8.821487426757812e-05, 9.375810623168945e-05, 9.930133819580078e-05, 0.00010484457015991211, 0.00011038780212402344, 0.00011593103408813477, 0.0001214742660522461, 0.00012701749801635742, 0.00013256072998046875, 0.00013810396194458008, 0.0001436471939086914, 0.00014919042587280273, 0.00015473365783691406, 0.0001602768898010254, 0.00016582012176513672, 0.00017136335372924805, 0.00017690658569335938, 0.0001824498176574707, 0.00018799304962158203, 0.00019353628158569336, 0.0001990795135498047]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 10.0, 15.0, 22.0, 47.0, 99.0, 252.0, 675.0, 2571.0, 15849.0, 491806.0, 517155.0, 16229.0, 2602.0, 775.0, 226.0, 93.0, 55.0, 25.0, 16.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92529296875, -0.8910293579101562, -0.8567657470703125, -0.8225021362304688, -0.788238525390625, -0.7539749145507812, -0.7197113037109375, -0.6854476928710938, -0.65118408203125, -0.6169204711914062, -0.5826568603515625, -0.5483932495117188, -0.514129638671875, -0.47986602783203125, -0.4456024169921875, -0.41133880615234375, -0.3770751953125, -0.34281158447265625, -0.3085479736328125, -0.27428436279296875, -0.240020751953125, -0.20575714111328125, -0.1714935302734375, -0.13722991943359375, -0.10296630859375, -0.06870269775390625, -0.0344390869140625, -0.00017547607421875, 0.034088134765625, 0.06835174560546875, 0.1026153564453125, 0.13687896728515625, 0.171142578125, 0.20540618896484375, 0.2396697998046875, 0.27393341064453125, 0.308197021484375, 0.34246063232421875, 0.3767242431640625, 0.41098785400390625, 0.44525146484375, 0.47951507568359375, 0.5137786865234375, 0.5480422973632812, 0.582305908203125, 0.6165695190429688, 0.6508331298828125, 0.6850967407226562, 0.7193603515625, 0.7536239624023438, 0.7878875732421875, 0.8221511840820312, 0.856414794921875, 0.8906784057617188, 0.9249420166015625, 0.9592056274414062, 0.99346923828125, 1.0277328491210938, 1.0619964599609375, 1.0962600708007812, 1.130523681640625, 1.1647872924804688, 1.1990509033203125, 1.2333145141601562, 1.267578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 4.0, 6.0, 15.0, 13.0, 32.0, 60.0, 90.0, 162.0, 224.0, 163.0, 103.0, 51.0, 29.0, 23.0, 16.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6420707702636719, -0.6239852905273438, -0.6058998107910156, -0.5878143310546875, -0.5697288513183594, -0.5516433715820312, -0.5335578918457031, -0.515472412109375, -0.4973869323730469, -0.47930145263671875, -0.4612159729003906, -0.4431304931640625, -0.4250450134277344, -0.40695953369140625, -0.3888740539550781, -0.37078857421875, -0.3527030944824219, -0.33461761474609375, -0.3165321350097656, -0.2984466552734375, -0.2803611755371094, -0.26227569580078125, -0.24419021606445312, -0.226104736328125, -0.20801925659179688, -0.18993377685546875, -0.17184829711914062, -0.1537628173828125, -0.13567733764648438, -0.11759185791015625, -0.09950637817382812, -0.0814208984375, -0.06333541870117188, -0.04524993896484375, -0.027164459228515625, -0.0090789794921875, 0.009006500244140625, 0.02709197998046875, 0.045177459716796875, 0.063262939453125, 0.08134841918945312, 0.09943389892578125, 0.11751937866210938, 0.1356048583984375, 0.15369033813476562, 0.17177581787109375, 0.18986129760742188, 0.20794677734375, 0.22603225708007812, 0.24411773681640625, 0.2622032165527344, 0.2802886962890625, 0.2983741760253906, 0.31645965576171875, 0.3345451354980469, 0.352630615234375, 0.3707160949707031, 0.38880157470703125, 0.4068870544433594, 0.4249725341796875, 0.4430580139160156, 0.46114349365234375, 0.4792289733886719, 0.497314453125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 14.0, 28.0, 221.0, 639.0, 87.0, 18.0, 4.0, 3.0, 1.0], "bins": [-57.02280807495117, -56.044891357421875, -55.06697082519531, -54.089054107666016, -53.11113739013672, -52.133216857910156, -51.15530014038086, -50.17738342285156, -49.199462890625, -48.2215461730957, -47.24362564086914, -46.265708923339844, -45.28779220581055, -44.309871673583984, -43.33195495605469, -42.354034423828125, -41.37611770629883, -40.39820098876953, -39.42028045654297, -38.44236373901367, -37.464447021484375, -36.48652648925781, -35.508609771728516, -34.53069305419922, -33.552772521972656, -32.57485580444336, -31.59693717956543, -30.6190185546875, -29.64109992980957, -28.66318130493164, -27.685264587402344, -26.707345962524414, -25.729429244995117, -24.751510620117188, -23.77359390258789, -22.79567527770996, -21.81775665283203, -20.839839935302734, -19.861921310424805, -18.884002685546875, -17.906084060668945, -16.928165435791016, -15.950247764587402, -14.972330093383789, -13.99441146850586, -13.016493797302246, -12.038576126098633, -11.060657501220703, -10.082738876342773, -9.10482120513916, -8.12690258026123, -7.148984909057617, -6.1710662841796875, -5.193148612976074, -4.215230464935303, -3.2373123168945312, -2.259394645690918, -1.2814764976501465, -0.30355846881866455, 0.6743595600128174, 1.6522777080535889, 2.6301956176757812, 3.6081137657165527, 4.586031913757324, 5.563950061798096]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 5.0, 7.0, 10.0, 16.0, 12.0, 17.0, 17.0, 27.0, 25.0, 22.0, 25.0, 29.0, 42.0, 34.0, 41.0, 49.0, 32.0, 33.0, 39.0, 47.0, 37.0, 41.0, 31.0, 34.0, 43.0, 19.0, 26.0, 25.0, 23.0, 21.0, 15.0, 19.0, 21.0, 20.0, 18.0, 13.0, 6.0, 9.0, 9.0, 5.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.727214336395264, -6.497513294219971, -6.2678117752075195, -6.038110733032227, -5.808409690856934, -5.578708648681641, -5.349007606506348, -5.1193060874938965, -4.8896050453186035, -4.6599040031433105, -4.430202484130859, -4.200501441955566, -3.9708003997802734, -3.7410993576049805, -3.5113980770111084, -3.2816967964172363, -3.0519957542419434, -2.8222947120666504, -2.5925934314727783, -2.3628921508789062, -2.1331911087036133, -1.9034899473190308, -1.6737887859344482, -1.4440876245498657, -1.2143864631652832, -0.9846853017807007, -0.7549841403961182, -0.5252829790115356, -0.2955818176269531, -0.0658806562423706, 0.16382050514221191, 0.39352166652679443, 0.6232233047485352, 0.8529244661331177, 1.0826256275177002, 1.3123267889022827, 1.5420279502868652, 1.7717291116714478, 2.0014302730560303, 2.2311315536499023, 2.4608325958251953, 2.6905336380004883, 2.9202349185943604, 3.1499361991882324, 3.3796372413635254, 3.6093382835388184, 3.8390395641326904, 4.0687408447265625, 4.2984418869018555, 4.528142929077148, 4.757843971252441, 4.987545490264893, 5.2172465324401855, 5.4469475746154785, 5.67664909362793, 5.906350135803223, 6.136051177978516, 6.365752220153809, 6.595453262329102, 6.825154781341553, 7.054855823516846, 7.284556865692139, 7.51425838470459, 7.743959426879883, 7.973660469055176]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 8.0, 17.0, 16.0, 23.0, 34.0, 42.0, 66.0, 92.0, 139.0, 193.0, 321.0, 496.0, 777.0, 1330.0, 2385.0, 4661.0, 10608.0, 31128.0, 141712.0, 2584516.0, 1272444.0, 100071.0, 24427.0, 9067.0, 4097.0, 2132.0, 1255.0, 763.0, 484.0, 341.0, 220.0, 134.0, 87.0, 53.0, 42.0, 40.0, 19.0, 13.0, 8.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.033203125, -1.965240478515625, -1.89727783203125, -1.829315185546875, -1.7613525390625, -1.693389892578125, -1.62542724609375, -1.557464599609375, -1.489501953125, -1.421539306640625, -1.35357666015625, -1.285614013671875, -1.2176513671875, -1.149688720703125, -1.08172607421875, -1.013763427734375, -0.94580078125, -0.877838134765625, -0.80987548828125, -0.741912841796875, -0.6739501953125, -0.605987548828125, -0.53802490234375, -0.470062255859375, -0.402099609375, -0.334136962890625, -0.26617431640625, -0.198211669921875, -0.1302490234375, -0.062286376953125, 0.00567626953125, 0.073638916015625, 0.1416015625, 0.209564208984375, 0.27752685546875, 0.345489501953125, 0.4134521484375, 0.481414794921875, 0.54937744140625, 0.617340087890625, 0.685302734375, 0.753265380859375, 0.82122802734375, 0.889190673828125, 0.9571533203125, 1.025115966796875, 1.09307861328125, 1.161041259765625, 1.22900390625, 1.296966552734375, 1.36492919921875, 1.432891845703125, 1.5008544921875, 1.568817138671875, 1.63677978515625, 1.704742431640625, 1.772705078125, 1.840667724609375, 1.90863037109375, 1.976593017578125, 2.0445556640625, 2.112518310546875, 2.18048095703125, 2.248443603515625, 2.31640625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 6.0, 7.0, 10.0, 8.0, 15.0, 22.0, 40.0, 37.0, 49.0, 58.0, 78.0, 77.0, 87.0, 67.0, 83.0, 65.0, 54.0, 56.0, 31.0, 25.0, 25.0, 18.0, 15.0, 12.0, 11.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.095703125, -2.0281982421875, -1.960693359375, -1.8931884765625, -1.82568359375, -1.7581787109375, -1.690673828125, -1.6231689453125, -1.5556640625, -1.4881591796875, -1.420654296875, -1.3531494140625, -1.28564453125, -1.2181396484375, -1.150634765625, -1.0831298828125, -1.015625, -0.9481201171875, -0.880615234375, -0.8131103515625, -0.74560546875, -0.6781005859375, -0.610595703125, -0.5430908203125, -0.4755859375, -0.4080810546875, -0.340576171875, -0.2730712890625, -0.20556640625, -0.1380615234375, -0.070556640625, -0.0030517578125, 0.064453125, 0.1319580078125, 0.199462890625, 0.2669677734375, 0.33447265625, 0.4019775390625, 0.469482421875, 0.5369873046875, 0.6044921875, 0.6719970703125, 0.739501953125, 0.8070068359375, 0.87451171875, 0.9420166015625, 1.009521484375, 1.0770263671875, 1.14453125, 1.2120361328125, 1.279541015625, 1.3470458984375, 1.41455078125, 1.4820556640625, 1.549560546875, 1.6170654296875, 1.6845703125, 1.7520751953125, 1.819580078125, 1.8870849609375, 1.95458984375, 2.0220947265625, 2.089599609375, 2.1571044921875, 2.224609375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 9.0, 9.0, 14.0, 31.0, 30.0, 69.0, 133.0, 223.0, 596.0, 2024.0, 10606.0, 188176.0, 3933832.0, 51001.0, 5348.0, 1280.0, 442.0, 211.0, 106.0, 49.0, 27.0, 12.0, 23.0, 11.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.3787841796875, -4.218505859375, -4.0582275390625, -3.89794921875, -3.7376708984375, -3.577392578125, -3.4171142578125, -3.2568359375, -3.0965576171875, -2.936279296875, -2.7760009765625, -2.61572265625, -2.4554443359375, -2.295166015625, -2.1348876953125, -1.974609375, -1.8143310546875, -1.654052734375, -1.4937744140625, -1.33349609375, -1.1732177734375, -1.012939453125, -0.8526611328125, -0.6923828125, -0.5321044921875, -0.371826171875, -0.2115478515625, -0.05126953125, 0.1090087890625, 0.269287109375, 0.4295654296875, 0.58984375, 0.7501220703125, 0.910400390625, 1.0706787109375, 1.23095703125, 1.3912353515625, 1.551513671875, 1.7117919921875, 1.8720703125, 2.0323486328125, 2.192626953125, 2.3529052734375, 2.51318359375, 2.6734619140625, 2.833740234375, 2.9940185546875, 3.154296875, 3.3145751953125, 3.474853515625, 3.6351318359375, 3.79541015625, 3.9556884765625, 4.115966796875, 4.2762451171875, 4.4365234375, 4.5968017578125, 4.757080078125, 4.9173583984375, 5.07763671875, 5.2379150390625, 5.398193359375, 5.5584716796875, 5.71875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 9.0, 11.0, 12.0, 27.0, 33.0, 58.0, 69.0, 132.0, 264.0, 505.0, 1435.0, 716.0, 359.0, 177.0, 76.0, 67.0, 32.0, 27.0, 16.0, 10.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.93212890625, -0.9052200317382812, -0.8783111572265625, -0.8514022827148438, -0.824493408203125, -0.7975845336914062, -0.7706756591796875, -0.7437667846679688, -0.71685791015625, -0.6899490356445312, -0.6630401611328125, -0.6361312866210938, -0.609222412109375, -0.5823135375976562, -0.5554046630859375, -0.5284957885742188, -0.5015869140625, -0.47467803955078125, -0.4477691650390625, -0.42086029052734375, -0.393951416015625, -0.36704254150390625, -0.3401336669921875, -0.31322479248046875, -0.28631591796875, -0.25940704345703125, -0.2324981689453125, -0.20558929443359375, -0.178680419921875, -0.15177154541015625, -0.1248626708984375, -0.09795379638671875, -0.071044921875, -0.04413604736328125, -0.0172271728515625, 0.00968170166015625, 0.036590576171875, 0.06349945068359375, 0.0904083251953125, 0.11731719970703125, 0.14422607421875, 0.17113494873046875, 0.1980438232421875, 0.22495269775390625, 0.251861572265625, 0.27877044677734375, 0.3056793212890625, 0.33258819580078125, 0.3594970703125, 0.38640594482421875, 0.4133148193359375, 0.44022369384765625, 0.467132568359375, 0.49404144287109375, 0.5209503173828125, 0.5478591918945312, 0.57476806640625, 0.6016769409179688, 0.6285858154296875, 0.6554946899414062, 0.682403564453125, 0.7093124389648438, 0.7362213134765625, 0.7631301879882812, 0.7900390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 8.0, 8.0, 12.0, 11.0, 19.0, 29.0, 51.0, 77.0, 158.0, 204.0, 166.0, 96.0, 57.0, 36.0, 17.0, 15.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.210004806518555, -5.067798137664795, -4.925590991973877, -4.783384323120117, -4.641177177429199, -4.4989705085754395, -4.35676383972168, -4.214556694030762, -4.072350025177002, -3.930143117904663, -3.787936210632324, -3.6457295417785645, -3.5035226345062256, -3.3613157272338867, -3.219109058380127, -3.076902151107788, -2.934695243835449, -2.7924883365631104, -2.6502814292907715, -2.5080747604370117, -2.365867853164673, -2.223660945892334, -2.081454277038574, -1.9392473697662354, -1.7970404624938965, -1.6548335552215576, -1.5126267671585083, -1.370419979095459, -1.2282130718231201, -1.0860061645507812, -0.9437993764877319, -0.8015925288200378, -0.6593859195709229, -0.5171790719032288, -0.37497222423553467, -0.23276537656784058, -0.09055852890014648, 0.05164831876754761, 0.1938551664352417, 0.3360620141029358, 0.4782688617706299, 0.620475709438324, 0.7626825571060181, 0.9048894047737122, 1.0470962524414062, 1.1893031597137451, 1.3315099477767944, 1.4737167358398438, 1.6159236431121826, 1.7581305503845215, 1.9003373384475708, 2.04254412651062, 2.184751033782959, 2.326957941055298, 2.4691648483276367, 2.6113715171813965, 2.7535784244537354, 2.895785331726074, 3.037992000579834, 3.180198907852173, 3.3224058151245117, 3.4646127223968506, 3.6068196296691895, 3.749026298522949, 3.891233205795288]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 3.0, 1.0, 5.0, 7.0, 2.0, 9.0, 3.0, 12.0, 12.0, 18.0, 25.0, 30.0, 35.0, 45.0, 46.0, 61.0, 71.0, 76.0, 64.0, 55.0, 55.0, 50.0, 55.0, 41.0, 34.0, 34.0, 30.0, 28.0, 15.0, 20.0, 14.0, 8.0, 8.0, 12.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9250521659851074, -1.8598415851593018, -1.794631004333496, -1.7294204235076904, -1.6642097234725952, -1.5989991426467896, -1.5337885618209839, -1.4685779809951782, -1.403367280960083, -1.3381567001342773, -1.2729461193084717, -1.207735538482666, -1.1425248384475708, -1.0773142576217651, -1.0121036767959595, -0.9468930959701538, -0.8816825151443481, -0.8164719343185425, -0.751261293888092, -0.6860507130622864, -0.6208400726318359, -0.5556294918060303, -0.4904189109802246, -0.42520830035209656, -0.3599976897239685, -0.29478707909584045, -0.2295764833688736, -0.16436588764190674, -0.09915527701377869, -0.033944666385650635, 0.03126591444015503, 0.09647652506828308, 0.16168713569641113, 0.22689774632453918, 0.29210835695266724, 0.3573189377784729, 0.42252954840660095, 0.487740159034729, 0.5529507398605347, 0.6181613206863403, 0.6833719611167908, 0.7485825419425964, 0.8137931823730469, 0.8790037631988525, 0.9442143440246582, 1.0094249248504639, 1.0746355056762695, 1.1398462057113647, 1.2050567865371704, 1.270267367362976, 1.3354779481887817, 1.400688648223877, 1.4658992290496826, 1.5311098098754883, 1.596320390701294, 1.6615309715270996, 1.7267415523529053, 1.791952133178711, 1.8571627140045166, 1.9223732948303223, 1.9875839948654175, 2.0527944564819336, 2.1180052757263184, 2.183215856552124, 2.2484264373779297]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 5.0, 6.0, 6.0, 10.0, 11.0, 24.0, 29.0, 71.0, 78.0, 190.0, 317.0, 576.0, 1265.0, 2916.0, 7994.0, 24983.0, 97619.0, 413008.0, 378325.0, 86668.0, 21956.0, 7273.0, 2760.0, 1181.0, 539.0, 261.0, 197.0, 90.0, 59.0, 39.0, 29.0, 19.0, 14.0, 10.0, 7.0, 3.0, 4.0, 0.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273193359375, -0.2649040222167969, -0.25661468505859375, -0.24832534790039062, -0.2400360107421875, -0.23174667358398438, -0.22345733642578125, -0.21516799926757812, -0.206878662109375, -0.19858932495117188, -0.19029998779296875, -0.18201065063476562, -0.1737213134765625, -0.16543197631835938, -0.15714263916015625, -0.14885330200195312, -0.14056396484375, -0.13227462768554688, -0.12398529052734375, -0.11569595336914062, -0.1074066162109375, -0.09911727905273438, -0.09082794189453125, -0.08253860473632812, -0.074249267578125, -0.06595993041992188, -0.05767059326171875, -0.049381256103515625, -0.0410919189453125, -0.032802581787109375, -0.02451324462890625, -0.016223907470703125, -0.0079345703125, 0.000354766845703125, 0.00864410400390625, 0.016933441162109375, 0.0252227783203125, 0.033512115478515625, 0.04180145263671875, 0.050090789794921875, 0.058380126953125, 0.06666946411132812, 0.07495880126953125, 0.08324813842773438, 0.0915374755859375, 0.09982681274414062, 0.10811614990234375, 0.11640548706054688, 0.12469482421875, 0.13298416137695312, 0.14127349853515625, 0.14956283569335938, 0.1578521728515625, 0.16614151000976562, 0.17443084716796875, 0.18272018432617188, 0.191009521484375, 0.19929885864257812, 0.20758819580078125, 0.21587753295898438, 0.2241668701171875, 0.23245620727539062, 0.24074554443359375, 0.24903488159179688, 0.25732421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 3.0, 4.0, 8.0, 11.0, 17.0, 14.0, 20.0, 30.0, 35.0, 55.0, 47.0, 85.0, 81.0, 60.0, 81.0, 62.0, 71.0, 49.0, 47.0, 35.0, 23.0, 31.0, 26.0, 27.0, 18.0, 5.0, 12.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5751953125, -1.52313232421875, -1.4710693359375, -1.41900634765625, -1.366943359375, -1.31488037109375, -1.2628173828125, -1.21075439453125, -1.15869140625, -1.10662841796875, -1.0545654296875, -1.00250244140625, -0.950439453125, -0.89837646484375, -0.8463134765625, -0.79425048828125, -0.7421875, -0.69012451171875, -0.6380615234375, -0.58599853515625, -0.533935546875, -0.48187255859375, -0.4298095703125, -0.37774658203125, -0.32568359375, -0.27362060546875, -0.2215576171875, -0.16949462890625, -0.117431640625, -0.06536865234375, -0.0133056640625, 0.03875732421875, 0.0908203125, 0.14288330078125, 0.1949462890625, 0.24700927734375, 0.299072265625, 0.35113525390625, 0.4031982421875, 0.45526123046875, 0.50732421875, 0.55938720703125, 0.6114501953125, 0.66351318359375, 0.715576171875, 0.76763916015625, 0.8197021484375, 0.87176513671875, 0.923828125, 0.97589111328125, 1.0279541015625, 1.08001708984375, 1.132080078125, 1.18414306640625, 1.2362060546875, 1.28826904296875, 1.34033203125, 1.39239501953125, 1.4444580078125, 1.49652099609375, 1.548583984375, 1.60064697265625, 1.6527099609375, 1.70477294921875, 1.7568359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 8.0, 15.0, 14.0, 18.0, 25.0, 45.0, 63.0, 71.0, 127.0, 153.0, 215.0, 293.0, 462.0, 761.0, 1476.0, 3586.0, 9540.0, 33069.0, 124339.0, 359523.0, 348481.0, 118261.0, 31639.0, 9302.0, 3321.0, 1495.0, 754.0, 473.0, 258.0, 219.0, 158.0, 100.0, 77.0, 59.0, 32.0, 37.0, 24.0, 22.0, 8.0, 6.0, 12.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1920166015625, -0.18581771850585938, -0.17961883544921875, -0.17341995239257812, -0.1672210693359375, -0.16102218627929688, -0.15482330322265625, -0.14862442016601562, -0.142425537109375, -0.13622665405273438, -0.13002777099609375, -0.12382888793945312, -0.1176300048828125, -0.11143112182617188, -0.10523223876953125, -0.09903335571289062, -0.09283447265625, -0.08663558959960938, -0.08043670654296875, -0.07423782348632812, -0.0680389404296875, -0.061840057373046875, -0.05564117431640625, -0.049442291259765625, -0.043243408203125, -0.037044525146484375, -0.03084564208984375, -0.024646759033203125, -0.0184478759765625, -0.012248992919921875, -0.00605010986328125, 0.000148773193359375, 0.00634765625, 0.012546539306640625, 0.01874542236328125, 0.024944305419921875, 0.0311431884765625, 0.037342071533203125, 0.04354095458984375, 0.049739837646484375, 0.055938720703125, 0.062137603759765625, 0.06833648681640625, 0.07453536987304688, 0.0807342529296875, 0.08693313598632812, 0.09313201904296875, 0.09933090209960938, 0.10552978515625, 0.11172866821289062, 0.11792755126953125, 0.12412643432617188, 0.1303253173828125, 0.13652420043945312, 0.14272308349609375, 0.14892196655273438, 0.155120849609375, 0.16131973266601562, 0.16751861572265625, 0.17371749877929688, 0.1799163818359375, 0.18611526489257812, 0.19231414794921875, 0.19851303100585938, 0.2047119140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 10.0, 6.0, 9.0, 13.0, 17.0, 20.0, 23.0, 19.0, 20.0, 24.0, 32.0, 47.0, 28.0, 39.0, 34.0, 50.0, 49.0, 45.0, 43.0, 41.0, 45.0, 39.0, 35.0, 39.0, 37.0, 34.0, 28.0, 23.0, 21.0, 20.0, 18.0, 12.0, 13.0, 11.0, 8.0, 4.0, 10.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.31640625, -2.24383544921875, -2.1712646484375, -2.09869384765625, -2.026123046875, -1.95355224609375, -1.8809814453125, -1.80841064453125, -1.73583984375, -1.66326904296875, -1.5906982421875, -1.51812744140625, -1.445556640625, -1.37298583984375, -1.3004150390625, -1.22784423828125, -1.1552734375, -1.08270263671875, -1.0101318359375, -0.93756103515625, -0.864990234375, -0.79241943359375, -0.7198486328125, -0.64727783203125, -0.57470703125, -0.50213623046875, -0.4295654296875, -0.35699462890625, -0.284423828125, -0.21185302734375, -0.1392822265625, -0.06671142578125, 0.005859375, 0.07843017578125, 0.1510009765625, 0.22357177734375, 0.296142578125, 0.36871337890625, 0.4412841796875, 0.51385498046875, 0.58642578125, 0.65899658203125, 0.7315673828125, 0.80413818359375, 0.876708984375, 0.94927978515625, 1.0218505859375, 1.09442138671875, 1.1669921875, 1.23956298828125, 1.3121337890625, 1.38470458984375, 1.457275390625, 1.52984619140625, 1.6024169921875, 1.67498779296875, 1.74755859375, 1.82012939453125, 1.8927001953125, 1.96527099609375, 2.037841796875, 2.11041259765625, 2.1829833984375, 2.25555419921875, 2.328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 9.0, 18.0, 20.0, 47.0, 97.0, 217.0, 630.0, 2024.0, 11669.0, 195606.0, 790763.0, 41070.0, 4705.0, 993.0, 323.0, 152.0, 75.0, 52.0, 32.0, 11.0, 11.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2197265625, -0.21452713012695312, -0.20932769775390625, -0.20412826538085938, -0.1989288330078125, -0.19372940063476562, -0.18852996826171875, -0.18333053588867188, -0.178131103515625, -0.17293167114257812, -0.16773223876953125, -0.16253280639648438, -0.1573333740234375, -0.15213394165039062, -0.14693450927734375, -0.14173507690429688, -0.13653564453125, -0.13133621215820312, -0.12613677978515625, -0.12093734741210938, -0.1157379150390625, -0.11053848266601562, -0.10533905029296875, -0.10013961791992188, -0.094940185546875, -0.08974075317382812, -0.08454132080078125, -0.07934188842773438, -0.0741424560546875, -0.06894302368164062, -0.06374359130859375, -0.058544158935546875, -0.0533447265625, -0.048145294189453125, -0.04294586181640625, -0.037746429443359375, -0.0325469970703125, -0.027347564697265625, -0.02214813232421875, -0.016948699951171875, -0.011749267578125, -0.006549835205078125, -0.00135040283203125, 0.003849029541015625, 0.0090484619140625, 0.014247894287109375, 0.01944732666015625, 0.024646759033203125, 0.02984619140625, 0.035045623779296875, 0.04024505615234375, 0.045444488525390625, 0.0506439208984375, 0.055843353271484375, 0.06104278564453125, 0.06624221801757812, 0.071441650390625, 0.07664108276367188, 0.08184051513671875, 0.08703994750976562, 0.0922393798828125, 0.09743881225585938, 0.10263824462890625, 0.10783767700195312, 0.113037109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 8.0, 27.0, 34.0, 41.0, 108.0, 129.0, 142.0, 149.0, 135.0, 90.0, 49.0, 30.0, 15.0, 20.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00011348724365234375, -0.00011090654879808426, -0.00010832585394382477, -0.00010574515908956528, -0.00010316446423530579, -0.0001005837693810463, -9.80030745267868e-05, -9.542237967252731e-05, -9.284168481826782e-05, -9.026098996400833e-05, -8.768029510974884e-05, -8.509960025548935e-05, -8.251890540122986e-05, -7.993821054697037e-05, -7.735751569271088e-05, -7.477682083845139e-05, -7.21961259841919e-05, -6.96154311299324e-05, -6.703473627567291e-05, -6.445404142141342e-05, -6.187334656715393e-05, -5.929265171289444e-05, -5.671195685863495e-05, -5.413126200437546e-05, -5.155056715011597e-05, -4.8969872295856476e-05, -4.6389177441596985e-05, -4.3808482587337494e-05, -4.1227787733078e-05, -3.864709287881851e-05, -3.606639802455902e-05, -3.348570317029953e-05, -3.090500831604004e-05, -2.8324313461780548e-05, -2.5743618607521057e-05, -2.3162923753261566e-05, -2.0582228899002075e-05, -1.8001534044742584e-05, -1.5420839190483093e-05, -1.2840144336223602e-05, -1.0259449481964111e-05, -7.67875462770462e-06, -5.098059773445129e-06, -2.5173649191856384e-06, 6.332993507385254e-08, 2.6440247893333435e-06, 5.2247196435928345e-06, 7.805414497852325e-06, 1.0386109352111816e-05, 1.2966804206371307e-05, 1.55474990606308e-05, 1.812819391489029e-05, 2.070888876914978e-05, 2.328958362340927e-05, 2.5870278477668762e-05, 2.8450973331928253e-05, 3.1031668186187744e-05, 3.3612363040447235e-05, 3.6193057894706726e-05, 3.877375274896622e-05, 4.135444760322571e-05, 4.39351424574852e-05, 4.651583731174469e-05, 4.909653216600418e-05, 5.167722702026367e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 7.0, 12.0, 9.0, 17.0, 15.0, 46.0, 87.0, 179.0, 442.0, 1507.0, 10669.0, 430810.0, 589175.0, 13101.0, 1634.0, 472.0, 165.0, 84.0, 47.0, 32.0, 15.0, 9.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.28076171875, -0.27392005920410156, -0.2670783996582031, -0.2602367401123047, -0.25339508056640625, -0.2465534210205078, -0.23971176147460938, -0.23287010192871094, -0.2260284423828125, -0.21918678283691406, -0.21234512329101562, -0.2055034637451172, -0.19866180419921875, -0.1918201446533203, -0.18497848510742188, -0.17813682556152344, -0.171295166015625, -0.16445350646972656, -0.15761184692382812, -0.1507701873779297, -0.14392852783203125, -0.1370868682861328, -0.13024520874023438, -0.12340354919433594, -0.1165618896484375, -0.10972023010253906, -0.10287857055664062, -0.09603691101074219, -0.08919525146484375, -0.08235359191894531, -0.07551193237304688, -0.06867027282714844, -0.06182861328125, -0.05498695373535156, -0.048145294189453125, -0.04130363464355469, -0.03446197509765625, -0.027620315551757812, -0.020778656005859375, -0.013936996459960938, -0.0070953369140625, -0.0002536773681640625, 0.006587982177734375, 0.013429641723632812, 0.02027130126953125, 0.027112960815429688, 0.033954620361328125, 0.04079627990722656, 0.047637939453125, 0.05447959899902344, 0.061321258544921875, 0.06816291809082031, 0.07500457763671875, 0.08184623718261719, 0.08868789672851562, 0.09552955627441406, 0.1023712158203125, 0.10921287536621094, 0.11605453491210938, 0.12289619445800781, 0.12973785400390625, 0.1365795135498047, 0.14342117309570312, 0.15026283264160156, 0.1571044921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 19.0, 24.0, 77.0, 149.0, 262.0, 234.0, 113.0, 51.0, 30.0, 13.0, 8.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036895751953125, -0.0352787971496582, -0.033661842346191406, -0.03204488754272461, -0.030427932739257812, -0.028810977935791016, -0.02719402313232422, -0.025577068328857422, -0.023960113525390625, -0.022343158721923828, -0.02072620391845703, -0.019109249114990234, -0.017492294311523438, -0.01587533950805664, -0.014258384704589844, -0.012641429901123047, -0.01102447509765625, -0.009407520294189453, -0.007790565490722656, -0.006173610687255859, -0.0045566558837890625, -0.0029397010803222656, -0.0013227462768554688, 0.0002942085266113281, 0.001911163330078125, 0.003528118133544922, 0.005145072937011719, 0.006762027740478516, 0.008378982543945312, 0.00999593734741211, 0.011612892150878906, 0.013229846954345703, 0.0148468017578125, 0.016463756561279297, 0.018080711364746094, 0.01969766616821289, 0.021314620971679688, 0.022931575775146484, 0.02454853057861328, 0.026165485382080078, 0.027782440185546875, 0.029399394989013672, 0.03101634979248047, 0.032633304595947266, 0.03425025939941406, 0.03586721420288086, 0.037484169006347656, 0.03910112380981445, 0.04071807861328125, 0.04233503341674805, 0.043951988220214844, 0.04556894302368164, 0.04718589782714844, 0.048802852630615234, 0.05041980743408203, 0.05203676223754883, 0.053653717041015625, 0.05527067184448242, 0.05688762664794922, 0.058504581451416016, 0.06012153625488281, 0.06173849105834961, 0.0633554458618164, 0.0649724006652832, 0.06658935546875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 4.0, 10.0, 12.0, 11.0, 21.0, 32.0, 59.0, 129.0, 224.0, 213.0, 107.0, 66.0, 29.0, 30.0, 17.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4636218547821045, -3.3551101684570312, -3.246598482131958, -3.1380867958068848, -3.0295751094818115, -2.9210634231567383, -2.812551736831665, -2.704040050506592, -2.5955283641815186, -2.4870166778564453, -2.378504991531372, -2.269993305206299, -2.1614816188812256, -2.0529699325561523, -1.944458246231079, -1.8359465599060059, -1.7274348735809326, -1.6189231872558594, -1.5104115009307861, -1.401899814605713, -1.2933881282806396, -1.1848764419555664, -1.0763647556304932, -0.9678530693054199, -0.8593413829803467, -0.7508296966552734, -0.6423180103302002, -0.533806324005127, -0.4252946376800537, -0.31678295135498047, -0.20827126502990723, -0.09975957870483398, 0.008751869201660156, 0.1172635555267334, 0.22577524185180664, 0.3342869281768799, 0.4427986145019531, 0.5513103008270264, 0.6598219871520996, 0.7683336734771729, 0.8768453598022461, 0.9853570461273193, 1.0938687324523926, 1.2023804187774658, 1.310892105102539, 1.4194037914276123, 1.5279154777526855, 1.6364271640777588, 1.744938850402832, 1.8534505367279053, 1.9619622230529785, 2.0704739093780518, 2.178985595703125, 2.2874972820281982, 2.3960089683532715, 2.5045206546783447, 2.613032341003418, 2.721544027328491, 2.8300557136535645, 2.9385673999786377, 3.047079086303711, 3.155590772628784, 3.2641024589538574, 3.3726141452789307, 3.481125831604004]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 9.0, 1.0, 5.0, 5.0, 10.0, 9.0, 14.0, 25.0, 29.0, 28.0, 45.0, 50.0, 64.0, 84.0, 74.0, 73.0, 58.0, 61.0, 63.0, 47.0, 44.0, 40.0, 25.0, 32.0, 20.0, 16.0, 13.0, 11.0, 6.0, 11.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5008580684661865, -1.452011227607727, -1.4031645059585571, -1.3543176651000977, -1.3054708242416382, -1.2566239833831787, -1.2077772617340088, -1.1589304208755493, -1.1100835800170898, -1.0612367391586304, -1.0123900175094604, -0.963543176651001, -0.9146963357925415, -0.8658495545387268, -0.8170027732849121, -0.7681559324264526, -0.7193092107772827, -0.670462429523468, -0.6216155886650085, -0.5727688074111938, -0.5239219665527344, -0.4750751852989197, -0.426228404045105, -0.3773815929889679, -0.3285347819328308, -0.2796879708766937, -0.23084117472171783, -0.18199437856674194, -0.13314756751060486, -0.08430075645446777, -0.035453975200653076, 0.013392835855484009, 0.06223952770233154, 0.11108633130788803, 0.15993313491344452, 0.2087799310684204, 0.2576267421245575, 0.3064735531806946, 0.3553203344345093, 0.40416714549064636, 0.45301395654678345, 0.5018607378005981, 0.5507075786590576, 0.5995543599128723, 0.648401141166687, 0.6972479820251465, 0.7460947632789612, 0.7949415445327759, 0.8437883853912354, 0.89263516664505, 0.9414820075035095, 0.9903287887573242, 1.0391756296157837, 1.0880224704742432, 1.136869192123413, 1.1857160329818726, 1.234562873840332, 1.2834097146987915, 1.3322564363479614, 1.381103277206421, 1.4299501180648804, 1.4787969589233398, 1.5276436805725098, 1.5764905214309692, 1.6253372430801392]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 3.0, 8.0, 8.0, 23.0, 25.0, 26.0, 33.0, 56.0, 73.0, 93.0, 141.0, 188.0, 285.0, 402.0, 672.0, 1062.0, 1910.0, 3350.0, 6794.0, 16386.0, 55945.0, 543165.0, 344691.0, 44998.0, 14403.0, 6180.0, 2945.0, 1724.0, 990.0, 647.0, 419.0, 256.0, 148.0, 126.0, 108.0, 64.0, 49.0, 35.0, 32.0, 14.0, 20.0, 12.0, 7.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.7451171875, -1.6936798095703125, -1.642242431640625, -1.5908050537109375, -1.53936767578125, -1.4879302978515625, -1.436492919921875, -1.3850555419921875, -1.3336181640625, -1.2821807861328125, -1.230743408203125, -1.1793060302734375, -1.12786865234375, -1.0764312744140625, -1.024993896484375, -0.9735565185546875, -0.922119140625, -0.8706817626953125, -0.819244384765625, -0.7678070068359375, -0.71636962890625, -0.6649322509765625, -0.613494873046875, -0.5620574951171875, -0.5106201171875, -0.4591827392578125, -0.407745361328125, -0.3563079833984375, -0.30487060546875, -0.2534332275390625, -0.201995849609375, -0.1505584716796875, -0.09912109375, -0.0476837158203125, 0.003753662109375, 0.0551910400390625, 0.10662841796875, 0.1580657958984375, 0.209503173828125, 0.2609405517578125, 0.3123779296875, 0.3638153076171875, 0.415252685546875, 0.4666900634765625, 0.51812744140625, 0.5695648193359375, 0.621002197265625, 0.6724395751953125, 0.723876953125, 0.7753143310546875, 0.826751708984375, 0.8781890869140625, 0.92962646484375, 0.9810638427734375, 1.032501220703125, 1.0839385986328125, 1.1353759765625, 1.1868133544921875, 1.238250732421875, 1.2896881103515625, 1.34112548828125, 1.3925628662109375, 1.444000244140625, 1.4954376220703125, 1.546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 6.0, 2.0, 8.0, 4.0, 7.0, 5.0, 9.0, 18.0, 21.0, 23.0, 45.0, 55.0, 66.0, 95.0, 99.0, 79.0, 63.0, 72.0, 62.0, 53.0, 45.0, 38.0, 36.0, 21.0, 13.0, 15.0, 8.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.9921875, -3.86663818359375, -3.7410888671875, -3.61553955078125, -3.489990234375, -3.36444091796875, -3.2388916015625, -3.11334228515625, -2.98779296875, -2.86224365234375, -2.7366943359375, -2.61114501953125, -2.485595703125, -2.36004638671875, -2.2344970703125, -2.10894775390625, -1.9833984375, -1.85784912109375, -1.7322998046875, -1.60675048828125, -1.481201171875, -1.35565185546875, -1.2301025390625, -1.10455322265625, -0.97900390625, -0.85345458984375, -0.7279052734375, -0.60235595703125, -0.476806640625, -0.35125732421875, -0.2257080078125, -0.10015869140625, 0.025390625, 0.15093994140625, 0.2764892578125, 0.40203857421875, 0.527587890625, 0.65313720703125, 0.7786865234375, 0.90423583984375, 1.02978515625, 1.15533447265625, 1.2808837890625, 1.40643310546875, 1.531982421875, 1.65753173828125, 1.7830810546875, 1.90863037109375, 2.0341796875, 2.15972900390625, 2.2852783203125, 2.41082763671875, 2.536376953125, 2.66192626953125, 2.7874755859375, 2.91302490234375, 3.03857421875, 3.16412353515625, 3.2896728515625, 3.41522216796875, 3.540771484375, 3.66632080078125, 3.7918701171875, 3.91741943359375, 4.04296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 10.0, 9.0, 12.0, 17.0, 39.0, 65.0, 83.0, 165.0, 265.0, 552.0, 1031.0, 2395.0, 6653.0, 25597.0, 329164.0, 635779.0, 33327.0, 7960.0, 2800.0, 1224.0, 596.0, 295.0, 185.0, 112.0, 60.0, 43.0, 33.0, 19.0, 14.0, 8.0, 5.0, 9.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.587890625, -1.527008056640625, -1.46612548828125, -1.405242919921875, -1.3443603515625, -1.283477783203125, -1.22259521484375, -1.161712646484375, -1.100830078125, -1.039947509765625, -0.97906494140625, -0.918182373046875, -0.8572998046875, -0.796417236328125, -0.73553466796875, -0.674652099609375, -0.61376953125, -0.552886962890625, -0.49200439453125, -0.431121826171875, -0.3702392578125, -0.309356689453125, -0.24847412109375, -0.187591552734375, -0.126708984375, -0.065826416015625, -0.00494384765625, 0.055938720703125, 0.1168212890625, 0.177703857421875, 0.23858642578125, 0.299468994140625, 0.3603515625, 0.421234130859375, 0.48211669921875, 0.542999267578125, 0.6038818359375, 0.664764404296875, 0.72564697265625, 0.786529541015625, 0.847412109375, 0.908294677734375, 0.96917724609375, 1.030059814453125, 1.0909423828125, 1.151824951171875, 1.21270751953125, 1.273590087890625, 1.33447265625, 1.395355224609375, 1.45623779296875, 1.517120361328125, 1.5780029296875, 1.638885498046875, 1.69976806640625, 1.760650634765625, 1.821533203125, 1.882415771484375, 1.94329833984375, 2.004180908203125, 2.0650634765625, 2.125946044921875, 2.18682861328125, 2.247711181640625, 2.30859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 0.0, 3.0, 7.0, 6.0, 5.0, 5.0, 10.0, 12.0, 11.0, 11.0, 17.0, 22.0, 27.0, 25.0, 29.0, 26.0, 40.0, 39.0, 44.0, 42.0, 43.0, 48.0, 48.0, 34.0, 34.0, 45.0, 37.0, 44.0, 32.0, 32.0, 22.0, 28.0, 26.0, 23.0, 20.0, 15.0, 20.0, 17.0, 9.0, 9.0, 5.0, 8.0, 7.0, 1.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.16015625, -3.055450439453125, -2.95074462890625, -2.846038818359375, -2.7413330078125, -2.636627197265625, -2.53192138671875, -2.427215576171875, -2.322509765625, -2.217803955078125, -2.11309814453125, -2.008392333984375, -1.9036865234375, -1.798980712890625, -1.69427490234375, -1.589569091796875, -1.48486328125, -1.380157470703125, -1.27545166015625, -1.170745849609375, -1.0660400390625, -0.961334228515625, -0.85662841796875, -0.751922607421875, -0.647216796875, -0.542510986328125, -0.43780517578125, -0.333099365234375, -0.2283935546875, -0.123687744140625, -0.01898193359375, 0.085723876953125, 0.1904296875, 0.295135498046875, 0.39984130859375, 0.504547119140625, 0.6092529296875, 0.713958740234375, 0.81866455078125, 0.923370361328125, 1.028076171875, 1.132781982421875, 1.23748779296875, 1.342193603515625, 1.4468994140625, 1.551605224609375, 1.65631103515625, 1.761016845703125, 1.86572265625, 1.970428466796875, 2.07513427734375, 2.179840087890625, 2.2845458984375, 2.389251708984375, 2.49395751953125, 2.598663330078125, 2.703369140625, 2.808074951171875, 2.91278076171875, 3.017486572265625, 3.1221923828125, 3.226898193359375, 3.33160400390625, 3.436309814453125, 3.541015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 12.0, 8.0, 8.0, 15.0, 21.0, 38.0, 58.0, 111.0, 189.0, 372.0, 719.0, 2169.0, 6543.0, 29291.0, 682685.0, 295464.0, 22057.0, 5466.0, 1802.0, 696.0, 332.0, 197.0, 105.0, 60.0, 41.0, 25.0, 24.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0224609375, -0.9904327392578125, -0.958404541015625, -0.9263763427734375, -0.89434814453125, -0.8623199462890625, -0.830291748046875, -0.7982635498046875, -0.7662353515625, -0.7342071533203125, -0.702178955078125, -0.6701507568359375, -0.63812255859375, -0.6060943603515625, -0.574066162109375, -0.5420379638671875, -0.510009765625, -0.4779815673828125, -0.445953369140625, -0.4139251708984375, -0.38189697265625, -0.3498687744140625, -0.317840576171875, -0.2858123779296875, -0.2537841796875, -0.2217559814453125, -0.189727783203125, -0.1576995849609375, -0.12567138671875, -0.0936431884765625, -0.061614990234375, -0.0295867919921875, 0.00244140625, 0.0344696044921875, 0.066497802734375, 0.0985260009765625, 0.13055419921875, 0.1625823974609375, 0.194610595703125, 0.2266387939453125, 0.2586669921875, 0.2906951904296875, 0.322723388671875, 0.3547515869140625, 0.38677978515625, 0.4188079833984375, 0.450836181640625, 0.4828643798828125, 0.514892578125, 0.5469207763671875, 0.578948974609375, 0.6109771728515625, 0.64300537109375, 0.6750335693359375, 0.707061767578125, 0.7390899658203125, 0.7711181640625, 0.8031463623046875, 0.835174560546875, 0.8672027587890625, 0.89923095703125, 0.9312591552734375, 0.963287353515625, 0.9953155517578125, 1.02734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 2.0, 8.0, 10.0, 9.0, 19.0, 17.0, 38.0, 77.0, 150.0, 390.0, 112.0, 61.0, 34.0, 16.0, 22.0, 8.0, 5.0, 4.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022530555725097656, -0.0002191103994846344, -0.00021291524171829224, -0.00020672008395195007, -0.0002005249261856079, -0.00019432976841926575, -0.00018813461065292358, -0.00018193945288658142, -0.00017574429512023926, -0.0001695491373538971, -0.00016335397958755493, -0.00015715882182121277, -0.0001509636640548706, -0.00014476850628852844, -0.00013857334852218628, -0.00013237819075584412, -0.00012618303298950195, -0.00011998787522315979, -0.00011379271745681763, -0.00010759755969047546, -0.0001014024019241333, -9.520724415779114e-05, -8.901208639144897e-05, -8.281692862510681e-05, -7.662177085876465e-05, -7.042661309242249e-05, -6.423145532608032e-05, -5.803629755973816e-05, -5.1841139793395996e-05, -4.564598202705383e-05, -3.945082426071167e-05, -3.325566649436951e-05, -2.7060508728027344e-05, -2.086535096168518e-05, -1.4670193195343018e-05, -8.475035429000854e-06, -2.2798776626586914e-06, 3.915280103683472e-06, 1.0110437870025635e-05, 1.6305595636367798e-05, 2.250075340270996e-05, 2.8695911169052124e-05, 3.489106893539429e-05, 4.108622670173645e-05, 4.728138446807861e-05, 5.3476542234420776e-05, 5.967170000076294e-05, 6.58668577671051e-05, 7.206201553344727e-05, 7.825717329978943e-05, 8.445233106613159e-05, 9.064748883247375e-05, 9.684264659881592e-05, 0.00010303780436515808, 0.00010923296213150024, 0.00011542811989784241, 0.00012162327766418457, 0.00012781843543052673, 0.0001340135931968689, 0.00014020875096321106, 0.00014640390872955322, 0.00015259906649589539, 0.00015879422426223755, 0.0001649893820285797, 0.00017118453979492188]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 11.0, 16.0, 18.0, 25.0, 23.0, 31.0, 42.0, 65.0, 75.0, 109.0, 181.0, 264.0, 538.0, 983.0, 2062.0, 4775.0, 13587.0, 63189.0, 773865.0, 152679.0, 22947.0, 7044.0, 2895.0, 1276.0, 705.0, 386.0, 231.0, 149.0, 111.0, 73.0, 53.0, 25.0, 21.0, 27.0, 10.0, 16.0, 14.0, 8.0, 2.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.794921875, -0.771331787109375, -0.74774169921875, -0.724151611328125, -0.7005615234375, -0.676971435546875, -0.65338134765625, -0.629791259765625, -0.606201171875, -0.582611083984375, -0.55902099609375, -0.535430908203125, -0.5118408203125, -0.488250732421875, -0.46466064453125, -0.441070556640625, -0.41748046875, -0.393890380859375, -0.37030029296875, -0.346710205078125, -0.3231201171875, -0.299530029296875, -0.27593994140625, -0.252349853515625, -0.228759765625, -0.205169677734375, -0.18157958984375, -0.157989501953125, -0.1343994140625, -0.110809326171875, -0.08721923828125, -0.063629150390625, -0.0400390625, -0.016448974609375, 0.00714111328125, 0.030731201171875, 0.0543212890625, 0.077911376953125, 0.10150146484375, 0.125091552734375, 0.148681640625, 0.172271728515625, 0.19586181640625, 0.219451904296875, 0.2430419921875, 0.266632080078125, 0.29022216796875, 0.313812255859375, 0.33740234375, 0.360992431640625, 0.38458251953125, 0.408172607421875, 0.4317626953125, 0.455352783203125, 0.47894287109375, 0.502532958984375, 0.526123046875, 0.549713134765625, 0.57330322265625, 0.596893310546875, 0.6204833984375, 0.644073486328125, 0.66766357421875, 0.691253662109375, 0.71484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 8.0, 13.0, 10.0, 15.0, 12.0, 30.0, 39.0, 30.0, 61.0, 112.0, 232.0, 139.0, 61.0, 51.0, 37.0, 21.0, 23.0, 14.0, 14.0, 9.0, 7.0, 2.0, 2.0, 7.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3388671875, -0.3288421630859375, -0.318817138671875, -0.3087921142578125, -0.29876708984375, -0.2887420654296875, -0.278717041015625, -0.2686920166015625, -0.2586669921875, -0.2486419677734375, -0.238616943359375, -0.2285919189453125, -0.21856689453125, -0.2085418701171875, -0.198516845703125, -0.1884918212890625, -0.178466796875, -0.1684417724609375, -0.158416748046875, -0.1483917236328125, -0.13836669921875, -0.1283416748046875, -0.118316650390625, -0.1082916259765625, -0.0982666015625, -0.0882415771484375, -0.078216552734375, -0.0681915283203125, -0.05816650390625, -0.0481414794921875, -0.038116455078125, -0.0280914306640625, -0.01806640625, -0.0080413818359375, 0.001983642578125, 0.0120086669921875, 0.02203369140625, 0.0320587158203125, 0.042083740234375, 0.0521087646484375, 0.0621337890625, 0.0721588134765625, 0.082183837890625, 0.0922088623046875, 0.10223388671875, 0.1122589111328125, 0.122283935546875, 0.1323089599609375, 0.142333984375, 0.1523590087890625, 0.162384033203125, 0.1724090576171875, 0.18243408203125, 0.1924591064453125, 0.202484130859375, 0.2125091552734375, 0.2225341796875, 0.2325592041015625, 0.242584228515625, 0.2526092529296875, 0.26263427734375, 0.2726593017578125, 0.282684326171875, 0.2927093505859375, 0.302734375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 11.0, 18.0, 30.0, 82.0, 229.0, 366.0, 162.0, 57.0, 23.0, 7.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.68994665145874, -4.275148391723633, -3.8603501319885254, -3.445551872253418, -3.0307536125183105, -2.6159555912017822, -2.201157331466675, -1.7863590717315674, -1.37156081199646, -0.9567625522613525, -0.5419643521308899, -0.12716615200042725, 0.2876321077346802, 0.702430248260498, 1.1172285079956055, 1.532026767730713, 1.9468250274658203, 2.3616232872009277, 2.776421546936035, 3.1912198066711426, 3.60601806640625, 4.020815849304199, 4.435614585876465, 4.850412368774414, 5.26521110534668, 5.680009365081787, 6.0948076248168945, 6.509605884552002, 6.924404144287109, 7.339201927185059, 7.754000663757324, 8.168798446655273, 8.583596229553223, 8.998394012451172, 9.413192749023438, 9.827990531921387, 10.242789268493652, 10.657587051391602, 11.072385787963867, 11.487183570861816, 11.901982307434082, 12.316780090332031, 12.731578826904297, 13.146376609802246, 13.561175346374512, 13.975973129272461, 14.390771865844727, 14.805569648742676, 15.220367431640625, 15.635165214538574, 16.049962997436523, 16.46476173400879, 16.879560470581055, 17.29435920715332, 17.709156036376953, 18.12395477294922, 18.538753509521484, 18.95355224609375, 19.368349075317383, 19.78314781188965, 20.197946548461914, 20.61274528503418, 21.027542114257812, 21.442340850830078, 21.857139587402344]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 11.0, 18.0, 15.0, 25.0, 28.0, 20.0, 14.0, 34.0, 30.0, 30.0, 34.0, 36.0, 31.0, 41.0, 41.0, 32.0, 38.0, 27.0, 38.0, 46.0, 31.0, 30.0, 37.0, 36.0, 31.0, 19.0, 30.0, 28.0, 5.0, 17.0, 18.0, 12.0, 16.0, 16.0, 4.0, 2.0, 9.0, 5.0, 4.0, 2.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.528428554534912, -5.359193801879883, -5.189959526062012, -5.020724773406982, -4.851490020751953, -4.682255744934082, -4.513020992279053, -4.343786239624023, -4.174551963806152, -4.005317211151123, -3.836082696914673, -3.6668481826782227, -3.4976136684417725, -3.3283791542053223, -3.159144401550293, -2.9899098873138428, -2.8206751346588135, -2.6514406204223633, -2.482205867767334, -2.312971353530884, -2.1437368392944336, -1.9745022058486938, -1.805267572402954, -1.636033058166504, -1.4667984247207642, -1.2975637912750244, -1.1283292770385742, -0.9590946435928345, -0.7898600697517395, -0.6206254959106445, -0.4513908624649048, -0.2821563482284546, -0.11292171478271484, 0.05631287395954132, 0.22554746270179749, 0.39478206634521484, 0.5640166401863098, 0.7332512140274048, 0.9024858474731445, 1.0717203617095947, 1.2409549951553345, 1.4101896286010742, 1.5794241428375244, 1.7486587762832642, 1.917893409729004, 2.087127923965454, 2.2563624382019043, 2.4255971908569336, 2.594831705093384, 2.764066219329834, 2.9333009719848633, 3.1025354862213135, 3.2717700004577637, 3.441004753112793, 3.610239267349243, 3.7794737815856934, 3.9487085342407227, 4.117943286895752, 4.287177562713623, 4.456412315368652, 4.625647068023682, 4.794881343841553, 4.964116096496582, 5.133350372314453, 5.302585124969482]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 10.0, 11.0, 14.0, 18.0, 30.0, 49.0, 65.0, 102.0, 149.0, 267.0, 417.0, 800.0, 1568.0, 3382.0, 9402.0, 36615.0, 365435.0, 3605318.0, 137071.0, 21415.0, 6444.0, 2708.0, 1237.0, 651.0, 396.0, 246.0, 155.0, 94.0, 64.0, 44.0, 31.0, 24.0, 18.0, 8.0, 9.0, 8.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.591796875, -3.50048828125, -3.4091796875, -3.31787109375, -3.2265625, -3.13525390625, -3.0439453125, -2.95263671875, -2.861328125, -2.77001953125, -2.6787109375, -2.58740234375, -2.49609375, -2.40478515625, -2.3134765625, -2.22216796875, -2.130859375, -2.03955078125, -1.9482421875, -1.85693359375, -1.765625, -1.67431640625, -1.5830078125, -1.49169921875, -1.400390625, -1.30908203125, -1.2177734375, -1.12646484375, -1.03515625, -0.94384765625, -0.8525390625, -0.76123046875, -0.669921875, -0.57861328125, -0.4873046875, -0.39599609375, -0.3046875, -0.21337890625, -0.1220703125, -0.03076171875, 0.060546875, 0.15185546875, 0.2431640625, 0.33447265625, 0.42578125, 0.51708984375, 0.6083984375, 0.69970703125, 0.791015625, 0.88232421875, 0.9736328125, 1.06494140625, 1.15625, 1.24755859375, 1.3388671875, 1.43017578125, 1.521484375, 1.61279296875, 1.7041015625, 1.79541015625, 1.88671875, 1.97802734375, 2.0693359375, 2.16064453125, 2.251953125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 5.0, 4.0, 8.0, 14.0, 12.0, 20.0, 20.0, 21.0, 25.0, 55.0, 49.0, 62.0, 64.0, 76.0, 85.0, 70.0, 62.0, 54.0, 46.0, 40.0, 46.0, 25.0, 21.0, 19.0, 18.0, 7.0, 10.0, 6.0, 10.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.76171875, -1.7061309814453125, -1.650543212890625, -1.5949554443359375, -1.53936767578125, -1.4837799072265625, -1.428192138671875, -1.3726043701171875, -1.3170166015625, -1.2614288330078125, -1.205841064453125, -1.1502532958984375, -1.09466552734375, -1.0390777587890625, -0.983489990234375, -0.9279022216796875, -0.872314453125, -0.8167266845703125, -0.761138916015625, -0.7055511474609375, -0.64996337890625, -0.5943756103515625, -0.538787841796875, -0.4832000732421875, -0.4276123046875, -0.3720245361328125, -0.316436767578125, -0.2608489990234375, -0.20526123046875, -0.1496734619140625, -0.094085693359375, -0.0384979248046875, 0.01708984375, 0.0726776123046875, 0.128265380859375, 0.1838531494140625, 0.23944091796875, 0.2950286865234375, 0.350616455078125, 0.4062042236328125, 0.4617919921875, 0.5173797607421875, 0.572967529296875, 0.6285552978515625, 0.68414306640625, 0.7397308349609375, 0.795318603515625, 0.8509063720703125, 0.906494140625, 0.9620819091796875, 1.017669677734375, 1.0732574462890625, 1.12884521484375, 1.1844329833984375, 1.240020751953125, 1.2956085205078125, 1.3511962890625, 1.4067840576171875, 1.462371826171875, 1.5179595947265625, 1.57354736328125, 1.6291351318359375, 1.684722900390625, 1.7403106689453125, 1.7958984375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 18.0, 19.0, 24.0, 51.0, 69.0, 110.0, 226.0, 407.0, 1058.0, 2782.0, 10882.0, 78259.0, 3782767.0, 288476.0, 21510.0, 4796.0, 1538.0, 561.0, 250.0, 164.0, 90.0, 56.0, 44.0, 25.0, 18.0, 16.0, 6.0, 4.0, 7.0, 2.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6953125, -3.582305908203125, -3.46929931640625, -3.356292724609375, -3.2432861328125, -3.130279541015625, -3.01727294921875, -2.904266357421875, -2.791259765625, -2.678253173828125, -2.56524658203125, -2.452239990234375, -2.3392333984375, -2.226226806640625, -2.11322021484375, -2.000213623046875, -1.88720703125, -1.774200439453125, -1.66119384765625, -1.548187255859375, -1.4351806640625, -1.322174072265625, -1.20916748046875, -1.096160888671875, -0.983154296875, -0.870147705078125, -0.75714111328125, -0.644134521484375, -0.5311279296875, -0.418121337890625, -0.30511474609375, -0.192108154296875, -0.0791015625, 0.033905029296875, 0.14691162109375, 0.259918212890625, 0.3729248046875, 0.485931396484375, 0.59893798828125, 0.711944580078125, 0.824951171875, 0.937957763671875, 1.05096435546875, 1.163970947265625, 1.2769775390625, 1.389984130859375, 1.50299072265625, 1.615997314453125, 1.72900390625, 1.842010498046875, 1.95501708984375, 2.068023681640625, 2.1810302734375, 2.294036865234375, 2.40704345703125, 2.520050048828125, 2.633056640625, 2.746063232421875, 2.85906982421875, 2.972076416015625, 3.0850830078125, 3.198089599609375, 3.31109619140625, 3.424102783203125, 3.537109375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 5.0, 6.0, 9.0, 6.0, 18.0, 25.0, 26.0, 50.0, 48.0, 81.0, 133.0, 201.0, 364.0, 728.0, 1132.0, 479.0, 286.0, 131.0, 94.0, 61.0, 40.0, 30.0, 33.0, 16.0, 12.0, 12.0, 11.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.544921875, -0.5256195068359375, -0.506317138671875, -0.4870147705078125, -0.46771240234375, -0.4484100341796875, -0.429107666015625, -0.4098052978515625, -0.3905029296875, -0.3712005615234375, -0.351898193359375, -0.3325958251953125, -0.31329345703125, -0.2939910888671875, -0.274688720703125, -0.2553863525390625, -0.236083984375, -0.2167816162109375, -0.197479248046875, -0.1781768798828125, -0.15887451171875, -0.1395721435546875, -0.120269775390625, -0.1009674072265625, -0.0816650390625, -0.0623626708984375, -0.043060302734375, -0.0237579345703125, -0.00445556640625, 0.0148468017578125, 0.034149169921875, 0.0534515380859375, 0.07275390625, 0.0920562744140625, 0.111358642578125, 0.1306610107421875, 0.14996337890625, 0.1692657470703125, 0.188568115234375, 0.2078704833984375, 0.2271728515625, 0.2464752197265625, 0.265777587890625, 0.2850799560546875, 0.30438232421875, 0.3236846923828125, 0.342987060546875, 0.3622894287109375, 0.381591796875, 0.4008941650390625, 0.420196533203125, 0.4394989013671875, 0.45880126953125, 0.4781036376953125, 0.497406005859375, 0.5167083740234375, 0.5360107421875, 0.5553131103515625, 0.574615478515625, 0.5939178466796875, 0.61322021484375, 0.6325225830078125, 0.651824951171875, 0.6711273193359375, 0.6904296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 10.0, 9.0, 4.0, 14.0, 18.0, 26.0, 35.0, 53.0, 88.0, 156.0, 170.0, 156.0, 94.0, 55.0, 32.0, 19.0, 18.0, 15.0, 9.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.264806270599365, -4.1411027908325195, -4.017398834228516, -3.89369535446167, -3.769991874694824, -3.6462881565093994, -3.5225844383239746, -3.398880958557129, -3.275177240371704, -3.1514735221862793, -3.0277700424194336, -2.904066324234009, -2.780362844467163, -2.6566591262817383, -2.5329556465148926, -2.4092519283294678, -2.285548210144043, -2.161844491958618, -2.0381410121917725, -1.9144372940063477, -1.7907336950302124, -1.6670300960540771, -1.543326497077942, -1.4196228981018066, -1.295919418334961, -1.1722158193588257, -1.0485122203826904, -0.9248085618019104, -0.8011049032211304, -0.6774013042449951, -0.5536977052688599, -0.42999404668807983, -0.3062903881072998, -0.18258675932884216, -0.058883145451545715, 0.06482046842575073, 0.18852409720420837, 0.312227725982666, 0.43593132495880127, 0.5596349835395813, 0.6833385825157166, 0.8070421814918518, 0.9307458400726318, 1.054449439048767, 1.1781530380249023, 1.3018567562103271, 1.4255602359771729, 1.5492639541625977, 1.672967553138733, 1.7966711521148682, 1.9203747510910034, 2.0440783500671387, 2.1677820682525635, 2.2914857864379883, 2.415189266204834, 2.538892984390259, 2.6625964641571045, 2.7863001823425293, 2.910003662109375, 3.0337073802948, 3.1574108600616455, 3.2811145782470703, 3.404818058013916, 3.528521776199341, 3.6522254943847656]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 2.0, 6.0, 9.0, 12.0, 19.0, 13.0, 16.0, 25.0, 26.0, 35.0, 44.0, 37.0, 55.0, 49.0, 62.0, 55.0, 62.0, 55.0, 48.0, 62.0, 39.0, 45.0, 32.0, 36.0, 20.0, 23.0, 18.0, 13.0, 18.0, 9.0, 9.0, 5.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0225017070770264, -1.9644750356674194, -1.906448245048523, -1.848421573638916, -1.7903947830200195, -1.7323681116104126, -1.6743413209915161, -1.6163146495819092, -1.5582878589630127, -1.5002611875534058, -1.4422343969345093, -1.3842077255249023, -1.3261809349060059, -1.268154263496399, -1.2101274728775024, -1.1521008014678955, -1.094074010848999, -1.036047339439392, -0.9780205488204956, -0.9199938178062439, -0.8619670867919922, -0.8039404153823853, -0.7459136247634888, -0.6878869533538818, -0.6298602819442749, -0.5718335509300232, -0.5138068199157715, -0.4557800889015198, -0.39775335788726807, -0.33972665667533875, -0.28169992566108704, -0.22367319464683533, -0.16564643383026123, -0.10761970281600952, -0.04959297925233841, 0.008433744311332703, 0.06646047532558441, 0.12448719143867493, 0.18251392245292664, 0.24054065346717834, 0.29856738448143005, 0.35659411549568176, 0.41462084650993347, 0.4726475477218628, 0.5306742787361145, 0.5887010097503662, 0.6467277407646179, 0.7047544717788696, 0.7627812027931213, 0.820807933807373, 0.8788346648216248, 0.9368613958358765, 0.9948881268501282, 1.0529148578643799, 1.1109415292739868, 1.1689683198928833, 1.2269949913024902, 1.2850216627120972, 1.3430484533309937, 1.4010751247406006, 1.459101915359497, 1.517128586769104, 1.5751553773880005, 1.6331820487976074, 1.691208839416504]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 9.0, 16.0, 18.0, 26.0, 39.0, 60.0, 101.0, 124.0, 182.0, 339.0, 596.0, 952.0, 1824.0, 3691.0, 7796.0, 18026.0, 46948.0, 145246.0, 375740.0, 291902.0, 96456.0, 32988.0, 13046.0, 5882.0, 2894.0, 1576.0, 835.0, 458.0, 263.0, 167.0, 108.0, 73.0, 50.0, 34.0, 25.0, 21.0, 9.0, 7.0, 6.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1845703125, -0.17911338806152344, -0.17365646362304688, -0.1681995391845703, -0.16274261474609375, -0.1572856903076172, -0.15182876586914062, -0.14637184143066406, -0.1409149169921875, -0.13545799255371094, -0.13000106811523438, -0.12454414367675781, -0.11908721923828125, -0.11363029479980469, -0.10817337036132812, -0.10271644592285156, -0.097259521484375, -0.09180259704589844, -0.08634567260742188, -0.08088874816894531, -0.07543182373046875, -0.06997489929199219, -0.06451797485351562, -0.05906105041503906, -0.0536041259765625, -0.04814720153808594, -0.042690277099609375, -0.03723335266113281, -0.03177642822265625, -0.026319503784179688, -0.020862579345703125, -0.015405654907226562, -0.00994873046875, -0.0044918060302734375, 0.000965118408203125, 0.0064220428466796875, 0.01187896728515625, 0.017335891723632812, 0.022792816162109375, 0.028249740600585938, 0.0337066650390625, 0.03916358947753906, 0.044620513916015625, 0.05007743835449219, 0.05553436279296875, 0.06099128723144531, 0.06644821166992188, 0.07190513610839844, 0.077362060546875, 0.08281898498535156, 0.08827590942382812, 0.09373283386230469, 0.09918975830078125, 0.10464668273925781, 0.11010360717773438, 0.11556053161621094, 0.1210174560546875, 0.12647438049316406, 0.13193130493164062, 0.1373882293701172, 0.14284515380859375, 0.1483020782470703, 0.15375900268554688, 0.15921592712402344, 0.1646728515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 3.0, 3.0, 8.0, 8.0, 16.0, 7.0, 14.0, 21.0, 29.0, 32.0, 45.0, 46.0, 69.0, 58.0, 86.0, 73.0, 80.0, 58.0, 59.0, 51.0, 49.0, 35.0, 32.0, 23.0, 14.0, 19.0, 13.0, 10.0, 4.0, 9.0, 6.0, 1.0, 4.0, 1.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5859375, -1.5360260009765625, -1.486114501953125, -1.4362030029296875, -1.38629150390625, -1.3363800048828125, -1.286468505859375, -1.2365570068359375, -1.1866455078125, -1.1367340087890625, -1.086822509765625, -1.0369110107421875, -0.98699951171875, -0.9370880126953125, -0.887176513671875, -0.8372650146484375, -0.787353515625, -0.7374420166015625, -0.687530517578125, -0.6376190185546875, -0.58770751953125, -0.5377960205078125, -0.487884521484375, -0.4379730224609375, -0.3880615234375, -0.3381500244140625, -0.288238525390625, -0.2383270263671875, -0.18841552734375, -0.1385040283203125, -0.088592529296875, -0.0386810302734375, 0.01123046875, 0.0611419677734375, 0.111053466796875, 0.1609649658203125, 0.21087646484375, 0.2607879638671875, 0.310699462890625, 0.3606109619140625, 0.4105224609375, 0.4604339599609375, 0.510345458984375, 0.5602569580078125, 0.61016845703125, 0.6600799560546875, 0.709991455078125, 0.7599029541015625, 0.809814453125, 0.8597259521484375, 0.909637451171875, 0.9595489501953125, 1.00946044921875, 1.0593719482421875, 1.109283447265625, 1.1591949462890625, 1.2091064453125, 1.2590179443359375, 1.308929443359375, 1.3588409423828125, 1.40875244140625, 1.4586639404296875, 1.508575439453125, 1.5584869384765625, 1.6083984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 9.0, 10.0, 25.0, 23.0, 48.0, 64.0, 113.0, 156.0, 264.0, 432.0, 758.0, 1735.0, 4443.0, 15756.0, 74413.0, 370327.0, 449231.0, 100853.0, 20100.0, 5524.0, 2031.0, 942.0, 520.0, 292.0, 178.0, 108.0, 64.0, 51.0, 25.0, 19.0, 13.0, 10.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2098388671875, -0.20209312438964844, -0.19434738159179688, -0.1866016387939453, -0.17885589599609375, -0.1711101531982422, -0.16336441040039062, -0.15561866760253906, -0.1478729248046875, -0.14012718200683594, -0.13238143920898438, -0.12463569641113281, -0.11688995361328125, -0.10914421081542969, -0.10139846801757812, -0.09365272521972656, -0.085906982421875, -0.07816123962402344, -0.07041549682617188, -0.06266975402832031, -0.05492401123046875, -0.04717826843261719, -0.039432525634765625, -0.03168678283691406, -0.0239410400390625, -0.016195297241210938, -0.008449554443359375, -0.0007038116455078125, 0.00704193115234375, 0.014787673950195312, 0.022533416748046875, 0.030279159545898438, 0.03802490234375, 0.04577064514160156, 0.053516387939453125, 0.06126213073730469, 0.06900787353515625, 0.07675361633300781, 0.08449935913085938, 0.09224510192871094, 0.0999908447265625, 0.10773658752441406, 0.11548233032226562, 0.12322807312011719, 0.13097381591796875, 0.1387195587158203, 0.14646530151367188, 0.15421104431152344, 0.161956787109375, 0.16970252990722656, 0.17744827270507812, 0.1851940155029297, 0.19293975830078125, 0.2006855010986328, 0.20843124389648438, 0.21617698669433594, 0.2239227294921875, 0.23166847229003906, 0.23941421508789062, 0.2471599578857422, 0.25490570068359375, 0.2626514434814453, 0.2703971862792969, 0.27814292907714844, 0.285888671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 8.0, 11.0, 6.0, 16.0, 9.0, 9.0, 19.0, 23.0, 20.0, 24.0, 23.0, 42.0, 46.0, 47.0, 54.0, 53.0, 51.0, 45.0, 60.0, 48.0, 48.0, 47.0, 44.0, 44.0, 36.0, 34.0, 23.0, 18.0, 21.0, 14.0, 17.0, 12.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1875, -2.108673095703125, -2.02984619140625, -1.951019287109375, -1.8721923828125, -1.793365478515625, -1.71453857421875, -1.635711669921875, -1.556884765625, -1.478057861328125, -1.39923095703125, -1.320404052734375, -1.2415771484375, -1.162750244140625, -1.08392333984375, -1.005096435546875, -0.92626953125, -0.847442626953125, -0.76861572265625, -0.689788818359375, -0.6109619140625, -0.532135009765625, -0.45330810546875, -0.374481201171875, -0.295654296875, -0.216827392578125, -0.13800048828125, -0.059173583984375, 0.0196533203125, 0.098480224609375, 0.17730712890625, 0.256134033203125, 0.3349609375, 0.413787841796875, 0.49261474609375, 0.571441650390625, 0.6502685546875, 0.729095458984375, 0.80792236328125, 0.886749267578125, 0.965576171875, 1.044403076171875, 1.12322998046875, 1.202056884765625, 1.2808837890625, 1.359710693359375, 1.43853759765625, 1.517364501953125, 1.59619140625, 1.675018310546875, 1.75384521484375, 1.832672119140625, 1.9114990234375, 1.990325927734375, 2.06915283203125, 2.147979736328125, 2.226806640625, 2.305633544921875, 2.38446044921875, 2.463287353515625, 2.5421142578125, 2.620941162109375, 2.69976806640625, 2.778594970703125, 2.857421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 10.0, 17.0, 16.0, 32.0, 47.0, 84.0, 196.0, 451.0, 1117.0, 3313.0, 14133.0, 219295.0, 761021.0, 39769.0, 6082.0, 1768.0, 646.0, 254.0, 131.0, 50.0, 34.0, 29.0, 16.0, 13.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1392822265625, -0.13451766967773438, -0.12975311279296875, -0.12498855590820312, -0.1202239990234375, -0.11545944213867188, -0.11069488525390625, -0.10593032836914062, -0.101165771484375, -0.09640121459960938, -0.09163665771484375, -0.08687210083007812, -0.0821075439453125, -0.07734298706054688, -0.07257843017578125, -0.06781387329101562, -0.06304931640625, -0.058284759521484375, -0.05352020263671875, -0.048755645751953125, -0.0439910888671875, -0.039226531982421875, -0.03446197509765625, -0.029697418212890625, -0.024932861328125, -0.020168304443359375, -0.01540374755859375, -0.010639190673828125, -0.0058746337890625, -0.001110076904296875, 0.00365447998046875, 0.008419036865234375, 0.01318359375, 0.017948150634765625, 0.02271270751953125, 0.027477264404296875, 0.0322418212890625, 0.037006378173828125, 0.04177093505859375, 0.046535491943359375, 0.051300048828125, 0.056064605712890625, 0.06082916259765625, 0.06559371948242188, 0.0703582763671875, 0.07512283325195312, 0.07988739013671875, 0.08465194702148438, 0.08941650390625, 0.09418106079101562, 0.09894561767578125, 0.10371017456054688, 0.1084747314453125, 0.11323928833007812, 0.11800384521484375, 0.12276840209960938, 0.127532958984375, 0.13229751586914062, 0.13706207275390625, 0.14182662963867188, 0.1465911865234375, 0.15135574340820312, 0.15612030029296875, 0.16088485717773438, 0.1656494140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 10.0, 17.0, 13.0, 32.0, 40.0, 62.0, 72.0, 100.0, 117.0, 106.0, 116.0, 85.0, 57.0, 41.0, 27.0, 25.0, 16.0, 9.0, 14.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.628036499023438e-05, -6.448943167924881e-05, -6.269849836826324e-05, -6.090756505727768e-05, -5.9116631746292114e-05, -5.732569843530655e-05, -5.5534765124320984e-05, -5.374383181333542e-05, -5.1952898502349854e-05, -5.016196519136429e-05, -4.837103188037872e-05, -4.658009856939316e-05, -4.478916525840759e-05, -4.299823194742203e-05, -4.120729863643646e-05, -3.94163653254509e-05, -3.762543201446533e-05, -3.583449870347977e-05, -3.40435653924942e-05, -3.2252632081508636e-05, -3.046169877052307e-05, -2.8670765459537506e-05, -2.687983214855194e-05, -2.5088898837566376e-05, -2.329796552658081e-05, -2.1507032215595245e-05, -1.971609890460968e-05, -1.7925165593624115e-05, -1.613423228263855e-05, -1.4343298971652985e-05, -1.255236566066742e-05, -1.0761432349681854e-05, -8.970499038696289e-06, -7.179565727710724e-06, -5.388632416725159e-06, -3.5976991057395935e-06, -1.8067657947540283e-06, -1.5832483768463135e-08, 1.775100827217102e-06, 3.5660341382026672e-06, 5.356967449188232e-06, 7.147900760173798e-06, 8.938834071159363e-06, 1.0729767382144928e-05, 1.2520700693130493e-05, 1.4311634004116058e-05, 1.6102567315101624e-05, 1.789350062608719e-05, 1.9684433937072754e-05, 2.147536724805832e-05, 2.3266300559043884e-05, 2.505723387002945e-05, 2.6848167181015015e-05, 2.863910049200058e-05, 3.0430033802986145e-05, 3.222096711397171e-05, 3.4011900424957275e-05, 3.580283373594284e-05, 3.7593767046928406e-05, 3.938470035791397e-05, 4.1175633668899536e-05, 4.29665669798851e-05, 4.4757500290870667e-05, 4.654843360185623e-05, 4.83393669128418e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 14.0, 17.0, 38.0, 52.0, 109.0, 207.0, 477.0, 936.0, 2712.0, 10537.0, 104852.0, 831346.0, 83550.0, 9401.0, 2510.0, 919.0, 403.0, 201.0, 110.0, 53.0, 33.0, 20.0, 13.0, 13.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1844482421875, -0.17977428436279297, -0.17510032653808594, -0.1704263687133789, -0.16575241088867188, -0.16107845306396484, -0.1564044952392578, -0.15173053741455078, -0.14705657958984375, -0.14238262176513672, -0.1377086639404297, -0.13303470611572266, -0.12836074829101562, -0.1236867904663086, -0.11901283264160156, -0.11433887481689453, -0.1096649169921875, -0.10499095916748047, -0.10031700134277344, -0.0956430435180664, -0.09096908569335938, -0.08629512786865234, -0.08162117004394531, -0.07694721221923828, -0.07227325439453125, -0.06759929656982422, -0.06292533874511719, -0.058251380920410156, -0.053577423095703125, -0.048903465270996094, -0.04422950744628906, -0.03955554962158203, -0.034881591796875, -0.03020763397216797, -0.025533676147460938, -0.020859718322753906, -0.016185760498046875, -0.011511802673339844, -0.0068378448486328125, -0.0021638870239257812, 0.00251007080078125, 0.007184028625488281, 0.011857986450195312, 0.016531944274902344, 0.021205902099609375, 0.025879859924316406, 0.030553817749023438, 0.03522777557373047, 0.0399017333984375, 0.04457569122314453, 0.04924964904785156, 0.053923606872558594, 0.058597564697265625, 0.06327152252197266, 0.06794548034667969, 0.07261943817138672, 0.07729339599609375, 0.08196735382080078, 0.08664131164550781, 0.09131526947021484, 0.09598922729492188, 0.1006631851196289, 0.10533714294433594, 0.11001110076904297, 0.11468505859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 11.0, 10.0, 16.0, 24.0, 45.0, 55.0, 105.0, 146.0, 176.0, 152.0, 103.0, 57.0, 30.0, 19.0, 15.0, 8.0, 5.0, 9.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026214599609375, -0.025096893310546875, -0.02397918701171875, -0.022861480712890625, -0.0217437744140625, -0.020626068115234375, -0.01950836181640625, -0.018390655517578125, -0.01727294921875, -0.016155242919921875, -0.01503753662109375, -0.013919830322265625, -0.0128021240234375, -0.011684417724609375, -0.01056671142578125, -0.009449005126953125, -0.008331298828125, -0.007213592529296875, -0.00609588623046875, -0.004978179931640625, -0.0038604736328125, -0.002742767333984375, -0.00162506103515625, -0.000507354736328125, 0.0006103515625, 0.001728057861328125, 0.00284576416015625, 0.003963470458984375, 0.0050811767578125, 0.006198883056640625, 0.00731658935546875, 0.008434295654296875, 0.009552001953125, 0.010669708251953125, 0.01178741455078125, 0.012905120849609375, 0.0140228271484375, 0.015140533447265625, 0.01625823974609375, 0.017375946044921875, 0.01849365234375, 0.019611358642578125, 0.02072906494140625, 0.021846771240234375, 0.0229644775390625, 0.024082183837890625, 0.02519989013671875, 0.026317596435546875, 0.027435302734375, 0.028553009033203125, 0.02967071533203125, 0.030788421630859375, 0.0319061279296875, 0.033023834228515625, 0.03414154052734375, 0.035259246826171875, 0.036376953125, 0.037494659423828125, 0.03861236572265625, 0.039730072021484375, 0.0408477783203125, 0.041965484619140625, 0.04308319091796875, 0.044200897216796875, 0.045318603515625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 5.0, 12.0, 9.0, 6.0, 8.0, 20.0, 20.0, 34.0, 52.0, 94.0, 167.0, 196.0, 159.0, 82.0, 47.0, 27.0, 19.0, 11.0, 14.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.8472964763641357, -2.7590572834014893, -2.670818328857422, -2.5825791358947754, -2.494340181350708, -2.4061009883880615, -2.317862033843994, -2.2296228408813477, -2.141383647918701, -2.0531444549560547, -1.9649055004119873, -1.8766663074493408, -1.7884273529052734, -1.700188159942627, -1.61194908618927, -1.523710012435913, -1.4354710578918457, -1.3472319841384888, -1.2589929103851318, -1.1707537174224854, -1.082514762878418, -0.9942756295204163, -0.9060364961624146, -0.8177974224090576, -0.7295583486557007, -0.6413192749023438, -0.5530802011489868, -0.4648410677909851, -0.3766019940376282, -0.28836292028427124, -0.20012378692626953, -0.1118847131729126, -0.023645639419555664, 0.06459344923496246, 0.1528325378894806, 0.2410716414451599, 0.32931071519851685, 0.4175497889518738, 0.5057889223098755, 0.5940279960632324, 0.6822670698165894, 0.7705061435699463, 0.8587452173233032, 0.9469843506813049, 1.0352234840393066, 1.123462438583374, 1.2117016315460205, 1.2999407052993774, 1.3881797790527344, 1.4764188528060913, 1.5646579265594482, 1.6528971195220947, 1.741136074066162, 1.8293752670288086, 1.9176143407821655, 2.0058534145355225, 2.09409236907959, 2.1823315620422363, 2.2705705165863037, 2.35880970954895, 2.4470486640930176, 2.535287857055664, 2.6235270500183105, 2.711766004562378, 2.8000051975250244]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 4.0, 4.0, 7.0, 7.0, 12.0, 9.0, 18.0, 22.0, 24.0, 34.0, 44.0, 58.0, 58.0, 67.0, 70.0, 69.0, 69.0, 69.0, 64.0, 53.0, 43.0, 32.0, 28.0, 27.0, 17.0, 17.0, 16.0, 9.0, 6.0, 9.0, 7.0, 2.0, 5.0, 2.0, 3.0, 0.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5011661052703857, -1.4553509950637817, -1.4095358848571777, -1.3637208938598633, -1.3179057836532593, -1.2720906734466553, -1.2262755632400513, -1.1804604530334473, -1.1346454620361328, -1.0888303518295288, -1.0430152416229248, -0.9972001910209656, -0.9513851404190063, -0.9055700302124023, -0.8597549200057983, -0.8139398097991943, -0.7681246995925903, -0.7223095893859863, -0.6764945387840271, -0.6306794285774231, -0.5848643779754639, -0.5390492677688599, -0.49323415756225586, -0.44741907715797424, -0.4016039967536926, -0.355788916349411, -0.3099738359451294, -0.2641587257385254, -0.21834364533424377, -0.17252856492996216, -0.12671345472335815, -0.08089837431907654, -0.03508317470550537, 0.010731913149356842, 0.056547001004219055, 0.10236209630966187, 0.14817717671394348, 0.1939922571182251, 0.2398073673248291, 0.2856224477291107, 0.33143752813339233, 0.37725260853767395, 0.42306768894195557, 0.46888279914855957, 0.5146979093551636, 0.5605129599571228, 0.6063280701637268, 0.652143120765686, 0.69795823097229, 0.743773341178894, 0.7895883917808533, 0.8354035019874573, 0.8812185525894165, 0.9270336627960205, 0.9728487730026245, 1.0186638832092285, 1.064478874206543, 1.110293984413147, 1.156109094619751, 1.2019240856170654, 1.2477391958236694, 1.2935543060302734, 1.3393694162368774, 1.3851845264434814, 1.4309996366500854]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 5.0, 9.0, 8.0, 14.0, 30.0, 28.0, 38.0, 62.0, 97.0, 114.0, 196.0, 249.0, 444.0, 739.0, 1293.0, 2669.0, 6072.0, 16585.0, 82805.0, 857637.0, 55176.0, 13706.0, 5164.0, 2301.0, 1155.0, 726.0, 392.0, 251.0, 166.0, 116.0, 94.0, 48.0, 42.0, 32.0, 26.0, 16.0, 16.0, 11.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.94744873046875, -1.8812255859375, -1.81500244140625, -1.748779296875, -1.68255615234375, -1.6163330078125, -1.55010986328125, -1.48388671875, -1.41766357421875, -1.3514404296875, -1.28521728515625, -1.218994140625, -1.15277099609375, -1.0865478515625, -1.02032470703125, -0.9541015625, -0.88787841796875, -0.8216552734375, -0.75543212890625, -0.689208984375, -0.62298583984375, -0.5567626953125, -0.49053955078125, -0.42431640625, -0.35809326171875, -0.2918701171875, -0.22564697265625, -0.159423828125, -0.09320068359375, -0.0269775390625, 0.03924560546875, 0.10546875, 0.17169189453125, 0.2379150390625, 0.30413818359375, 0.370361328125, 0.43658447265625, 0.5028076171875, 0.56903076171875, 0.63525390625, 0.70147705078125, 0.7677001953125, 0.83392333984375, 0.900146484375, 0.96636962890625, 1.0325927734375, 1.09881591796875, 1.1650390625, 1.23126220703125, 1.2974853515625, 1.36370849609375, 1.429931640625, 1.49615478515625, 1.5623779296875, 1.62860107421875, 1.69482421875, 1.76104736328125, 1.8272705078125, 1.89349365234375, 1.959716796875, 2.02593994140625, 2.0921630859375, 2.15838623046875, 2.224609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 4.0, 4.0, 10.0, 7.0, 14.0, 21.0, 22.0, 37.0, 43.0, 50.0, 64.0, 48.0, 75.0, 81.0, 69.0, 85.0, 55.0, 51.0, 50.0, 40.0, 26.0, 17.0, 28.0, 16.0, 11.0, 12.0, 12.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.44921875, -3.353424072265625, -3.25762939453125, -3.161834716796875, -3.0660400390625, -2.970245361328125, -2.87445068359375, -2.778656005859375, -2.682861328125, -2.587066650390625, -2.49127197265625, -2.395477294921875, -2.2996826171875, -2.203887939453125, -2.10809326171875, -2.012298583984375, -1.91650390625, -1.820709228515625, -1.72491455078125, -1.629119873046875, -1.5333251953125, -1.437530517578125, -1.34173583984375, -1.245941162109375, -1.150146484375, -1.054351806640625, -0.95855712890625, -0.862762451171875, -0.7669677734375, -0.671173095703125, -0.57537841796875, -0.479583740234375, -0.3837890625, -0.287994384765625, -0.19219970703125, -0.096405029296875, -0.0006103515625, 0.095184326171875, 0.19097900390625, 0.286773681640625, 0.382568359375, 0.478363037109375, 0.57415771484375, 0.669952392578125, 0.7657470703125, 0.861541748046875, 0.95733642578125, 1.053131103515625, 1.14892578125, 1.244720458984375, 1.34051513671875, 1.436309814453125, 1.5321044921875, 1.627899169921875, 1.72369384765625, 1.819488525390625, 1.915283203125, 2.011077880859375, 2.10687255859375, 2.202667236328125, 2.2984619140625, 2.394256591796875, 2.49005126953125, 2.585845947265625, 2.681640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 6.0, 12.0, 24.0, 27.0, 50.0, 96.0, 194.0, 505.0, 1580.0, 7310.0, 88006.0, 927453.0, 18842.0, 3007.0, 803.0, 319.0, 155.0, 62.0, 31.0, 18.0, 11.0, 10.0, 4.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248046875, -3.14404296875, -3.0400390625, -2.93603515625, -2.83203125, -2.72802734375, -2.6240234375, -2.52001953125, -2.416015625, -2.31201171875, -2.2080078125, -2.10400390625, -2.0, -1.89599609375, -1.7919921875, -1.68798828125, -1.583984375, -1.47998046875, -1.3759765625, -1.27197265625, -1.16796875, -1.06396484375, -0.9599609375, -0.85595703125, -0.751953125, -0.64794921875, -0.5439453125, -0.43994140625, -0.3359375, -0.23193359375, -0.1279296875, -0.02392578125, 0.080078125, 0.18408203125, 0.2880859375, 0.39208984375, 0.49609375, 0.60009765625, 0.7041015625, 0.80810546875, 0.912109375, 1.01611328125, 1.1201171875, 1.22412109375, 1.328125, 1.43212890625, 1.5361328125, 1.64013671875, 1.744140625, 1.84814453125, 1.9521484375, 2.05615234375, 2.16015625, 2.26416015625, 2.3681640625, 2.47216796875, 2.576171875, 2.68017578125, 2.7841796875, 2.88818359375, 2.9921875, 3.09619140625, 3.2001953125, 3.30419921875, 3.408203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 8.0, 13.0, 9.0, 15.0, 24.0, 24.0, 37.0, 32.0, 41.0, 45.0, 39.0, 38.0, 49.0, 61.0, 54.0, 60.0, 54.0, 55.0, 40.0, 47.0, 46.0, 36.0, 28.0, 18.0, 22.0, 15.0, 20.0, 13.0, 9.0, 9.0, 5.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.859375, -3.751800537109375, -3.64422607421875, -3.536651611328125, -3.4290771484375, -3.321502685546875, -3.21392822265625, -3.106353759765625, -2.998779296875, -2.891204833984375, -2.78363037109375, -2.676055908203125, -2.5684814453125, -2.460906982421875, -2.35333251953125, -2.245758056640625, -2.13818359375, -2.030609130859375, -1.92303466796875, -1.815460205078125, -1.7078857421875, -1.600311279296875, -1.49273681640625, -1.385162353515625, -1.277587890625, -1.170013427734375, -1.06243896484375, -0.954864501953125, -0.8472900390625, -0.739715576171875, -0.63214111328125, -0.524566650390625, -0.4169921875, -0.309417724609375, -0.20184326171875, -0.094268798828125, 0.0133056640625, 0.120880126953125, 0.22845458984375, 0.336029052734375, 0.443603515625, 0.551177978515625, 0.65875244140625, 0.766326904296875, 0.8739013671875, 0.981475830078125, 1.08905029296875, 1.196624755859375, 1.30419921875, 1.411773681640625, 1.51934814453125, 1.626922607421875, 1.7344970703125, 1.842071533203125, 1.94964599609375, 2.057220458984375, 2.164794921875, 2.272369384765625, 2.37994384765625, 2.487518310546875, 2.5950927734375, 2.702667236328125, 2.81024169921875, 2.917816162109375, 3.025390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 2.0, 8.0, 11.0, 15.0, 15.0, 26.0, 25.0, 66.0, 66.0, 98.0, 210.0, 486.0, 1392.0, 4550.0, 20623.0, 789527.0, 209859.0, 15916.0, 3566.0, 1061.0, 475.0, 205.0, 112.0, 70.0, 37.0, 37.0, 25.0, 16.0, 10.0, 15.0, 7.0, 9.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0546875, -1.0216522216796875, -0.988616943359375, -0.9555816650390625, -0.92254638671875, -0.8895111083984375, -0.856475830078125, -0.8234405517578125, -0.7904052734375, -0.7573699951171875, -0.724334716796875, -0.6912994384765625, -0.65826416015625, -0.6252288818359375, -0.592193603515625, -0.5591583251953125, -0.526123046875, -0.4930877685546875, -0.460052490234375, -0.4270172119140625, -0.39398193359375, -0.3609466552734375, -0.327911376953125, -0.2948760986328125, -0.2618408203125, -0.2288055419921875, -0.195770263671875, -0.1627349853515625, -0.12969970703125, -0.0966644287109375, -0.063629150390625, -0.0305938720703125, 0.00244140625, 0.0354766845703125, 0.068511962890625, 0.1015472412109375, 0.13458251953125, 0.1676177978515625, 0.200653076171875, 0.2336883544921875, 0.2667236328125, 0.2997589111328125, 0.332794189453125, 0.3658294677734375, 0.39886474609375, 0.4319000244140625, 0.464935302734375, 0.4979705810546875, 0.531005859375, 0.5640411376953125, 0.597076416015625, 0.6301116943359375, 0.66314697265625, 0.6961822509765625, 0.729217529296875, 0.7622528076171875, 0.7952880859375, 0.8283233642578125, 0.861358642578125, 0.8943939208984375, 0.92742919921875, 0.9604644775390625, 0.993499755859375, 1.0265350341796875, 1.0595703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 10.0, 14.0, 36.0, 102.0, 669.0, 90.0, 24.0, 11.0, 11.0, 6.0, 10.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011903047561645508, -0.00010954122990369797, -0.00010005198419094086, -9.056273847818375e-05, -8.107349276542664e-05, -7.158424705266953e-05, -6.209500133991241e-05, -5.2605755627155304e-05, -4.311650991439819e-05, -3.362726420164108e-05, -2.4138018488883972e-05, -1.4648772776126862e-05, -5.159527063369751e-06, 4.32971864938736e-06, 1.381896436214447e-05, 2.330821007490158e-05, 3.279745578765869e-05, 4.22867015004158e-05, 5.177594721317291e-05, 6.126519292593002e-05, 7.075443863868713e-05, 8.024368435144424e-05, 8.973293006420135e-05, 9.922217577695847e-05, 0.00010871142148971558, 0.00011820066720247269, 0.0001276899129152298, 0.0001371791586279869, 0.00014666840434074402, 0.00015615765005350113, 0.00016564689576625824, 0.00017513614147901535, 0.00018462538719177246, 0.00019411463290452957, 0.00020360387861728668, 0.0002130931243300438, 0.0002225823700428009, 0.00023207161575555801, 0.00024156086146831512, 0.00025105010718107224, 0.00026053935289382935, 0.00027002859860658646, 0.00027951784431934357, 0.0002890070900321007, 0.0002984963357448578, 0.0003079855814576149, 0.000317474827170372, 0.0003269640728831291, 0.00033645331859588623, 0.00034594256430864334, 0.00035543181002140045, 0.00036492105573415756, 0.00037441030144691467, 0.0003838995471596718, 0.0003933887928724289, 0.000402878038585186, 0.0004123672842979431, 0.0004218565300107002, 0.00043134577572345734, 0.00044083502143621445, 0.00045032426714897156, 0.00045981351286172867, 0.0004693027585744858, 0.0004787920042872429, 0.00048828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 16.0, 28.0, 53.0, 109.0, 215.0, 535.0, 1502.0, 4686.0, 21203.0, 859715.0, 141652.0, 13758.0, 3226.0, 1040.0, 415.0, 187.0, 67.0, 45.0, 25.0, 17.0, 11.0, 10.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4287109375, -1.3909835815429688, -1.3532562255859375, -1.3155288696289062, -1.277801513671875, -1.2400741577148438, -1.2023468017578125, -1.1646194458007812, -1.12689208984375, -1.0891647338867188, -1.0514373779296875, -1.0137100219726562, -0.975982666015625, -0.9382553100585938, -0.9005279541015625, -0.8628005981445312, -0.8250732421875, -0.7873458862304688, -0.7496185302734375, -0.7118911743164062, -0.674163818359375, -0.6364364624023438, -0.5987091064453125, -0.5609817504882812, -0.52325439453125, -0.48552703857421875, -0.4477996826171875, -0.41007232666015625, -0.372344970703125, -0.33461761474609375, -0.2968902587890625, -0.25916290283203125, -0.221435546875, -0.18370819091796875, -0.1459808349609375, -0.10825347900390625, -0.070526123046875, -0.03279876708984375, 0.0049285888671875, 0.04265594482421875, 0.08038330078125, 0.11811065673828125, 0.1558380126953125, 0.19356536865234375, 0.231292724609375, 0.26902008056640625, 0.3067474365234375, 0.34447479248046875, 0.3822021484375, 0.41992950439453125, 0.4576568603515625, 0.49538421630859375, 0.533111572265625, 0.5708389282226562, 0.6085662841796875, 0.6462936401367188, 0.68402099609375, 0.7217483520507812, 0.7594757080078125, 0.7972030639648438, 0.834930419921875, 0.8726577758789062, 0.9103851318359375, 0.9481124877929688, 0.98583984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 7.0, 11.0, 21.0, 23.0, 71.0, 198.0, 441.0, 87.0, 36.0, 19.0, 16.0, 11.0, 11.0, 5.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.415771484375, -0.4036064147949219, -0.39144134521484375, -0.3792762756347656, -0.3671112060546875, -0.3549461364746094, -0.34278106689453125, -0.3306159973144531, -0.318450927734375, -0.3062858581542969, -0.29412078857421875, -0.2819557189941406, -0.2697906494140625, -0.2576255798339844, -0.24546051025390625, -0.23329544067382812, -0.22113037109375, -0.20896530151367188, -0.19680023193359375, -0.18463516235351562, -0.1724700927734375, -0.16030502319335938, -0.14813995361328125, -0.13597488403320312, -0.123809814453125, -0.11164474487304688, -0.09947967529296875, -0.08731460571289062, -0.0751495361328125, -0.06298446655273438, -0.05081939697265625, -0.038654327392578125, -0.0264892578125, -0.014324188232421875, -0.00215911865234375, 0.010005950927734375, 0.0221710205078125, 0.034336090087890625, 0.04650115966796875, 0.058666229248046875, 0.070831298828125, 0.08299636840820312, 0.09516143798828125, 0.10732650756835938, 0.1194915771484375, 0.13165664672851562, 0.14382171630859375, 0.15598678588867188, 0.16815185546875, 0.18031692504882812, 0.19248199462890625, 0.20464706420898438, 0.2168121337890625, 0.22897720336914062, 0.24114227294921875, 0.2533073425292969, 0.265472412109375, 0.2776374816894531, 0.28980255126953125, 0.3019676208496094, 0.3141326904296875, 0.3262977600097656, 0.33846282958984375, 0.3506278991699219, 0.36279296875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 16.0, 24.0, 60.0, 223.0, 395.0, 191.0, 42.0, 28.0, 12.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.579866409301758, -22.140300750732422, -21.700733184814453, -21.261167526245117, -20.82160186767578, -20.382036209106445, -19.94247055053711, -19.50290298461914, -19.063337326049805, -18.62377166748047, -18.1842041015625, -17.744638442993164, -17.305072784423828, -16.865507125854492, -16.425941467285156, -15.986373901367188, -15.546808242797852, -15.107242584228516, -14.667675971984863, -14.228109359741211, -13.788543701171875, -13.348978042602539, -12.909411430358887, -12.469844818115234, -12.030279159545898, -11.590713500976562, -11.15114688873291, -10.711580276489258, -10.272014617919922, -9.832448959350586, -9.392882347106934, -8.953315734863281, -8.513750076293945, -8.07418441772461, -7.634617805480957, -7.195051670074463, -6.755485534667969, -6.315919399261475, -5.8763532638549805, -5.436787128448486, -4.99722146987915, -4.557655334472656, -4.118089199066162, -3.678523063659668, -3.238956928253174, -2.7993907928466797, -2.3598246574401855, -1.9202585220336914, -1.4806923866271973, -1.0411262512207031, -0.601560115814209, -0.16199398040771484, 0.2775721549987793, 0.7171382904052734, 1.1567044258117676, 1.5962705612182617, 2.035836696624756, 2.47540283203125, 2.914968967437744, 3.3545351028442383, 3.7941012382507324, 4.233667373657227, 4.673233509063721, 5.112799644470215, 5.552365779876709]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 8.0, 9.0, 7.0, 7.0, 16.0, 10.0, 17.0, 21.0, 19.0, 23.0, 35.0, 30.0, 38.0, 28.0, 39.0, 41.0, 37.0, 49.0, 38.0, 37.0, 41.0, 38.0, 39.0, 47.0, 38.0, 30.0, 31.0, 30.0, 30.0, 19.0, 25.0, 16.0, 20.0, 14.0, 11.0, 13.0, 5.0, 10.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.190743923187256, -5.0354743003845215, -4.880205154418945, -4.724935531616211, -4.569665908813477, -4.414396286010742, -4.259126663208008, -4.103857517242432, -3.9485878944396973, -3.793318271636963, -3.6380488872528076, -3.4827795028686523, -3.327509880065918, -3.1722402572631836, -3.0169708728790283, -2.861701488494873, -2.7064318656921387, -2.5511622428894043, -2.395892858505249, -2.2406234741210938, -2.0853538513183594, -1.9300843477249146, -1.7748148441314697, -1.619545340538025, -1.46427583694458, -1.3090063333511353, -1.1537368297576904, -0.9984673261642456, -0.8431978225708008, -0.687928318977356, -0.5326588153839111, -0.3773893117904663, -0.22211933135986328, -0.06684982776641846, 0.08841967582702637, 0.2436891794204712, 0.398958683013916, 0.5542281866073608, 0.7094976902008057, 0.8647671937942505, 1.0200366973876953, 1.1753062009811401, 1.330575704574585, 1.4858452081680298, 1.6411147117614746, 1.7963842153549194, 1.9516537189483643, 2.1069231033325195, 2.262192726135254, 2.4174623489379883, 2.5727317333221436, 2.728001117706299, 2.883270740509033, 3.0385403633117676, 3.193809747695923, 3.349079132080078, 3.5043487548828125, 3.659618377685547, 3.814887762069702, 3.9701571464538574, 4.125426769256592, 4.280696392059326, 4.435965538024902, 4.591235160827637, 4.746504783630371]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 3.0, 4.0, 6.0, 6.0, 10.0, 8.0, 15.0, 18.0, 23.0, 29.0, 34.0, 64.0, 97.0, 203.0, 508.0, 1749.0, 7992.0, 91802.0, 4013111.0, 69599.0, 6551.0, 1439.0, 500.0, 183.0, 98.0, 60.0, 39.0, 22.0, 17.0, 17.0, 15.0, 19.0, 9.0, 6.0, 9.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.390625, -6.21533203125, -6.0400390625, -5.86474609375, -5.689453125, -5.51416015625, -5.3388671875, -5.16357421875, -4.98828125, -4.81298828125, -4.6376953125, -4.46240234375, -4.287109375, -4.11181640625, -3.9365234375, -3.76123046875, -3.5859375, -3.41064453125, -3.2353515625, -3.06005859375, -2.884765625, -2.70947265625, -2.5341796875, -2.35888671875, -2.18359375, -2.00830078125, -1.8330078125, -1.65771484375, -1.482421875, -1.30712890625, -1.1318359375, -0.95654296875, -0.78125, -0.60595703125, -0.4306640625, -0.25537109375, -0.080078125, 0.09521484375, 0.2705078125, 0.44580078125, 0.62109375, 0.79638671875, 0.9716796875, 1.14697265625, 1.322265625, 1.49755859375, 1.6728515625, 1.84814453125, 2.0234375, 2.19873046875, 2.3740234375, 2.54931640625, 2.724609375, 2.89990234375, 3.0751953125, 3.25048828125, 3.42578125, 3.60107421875, 3.7763671875, 3.95166015625, 4.126953125, 4.30224609375, 4.4775390625, 4.65283203125, 4.828125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 11.0, 15.0, 14.0, 14.0, 34.0, 33.0, 42.0, 50.0, 72.0, 78.0, 89.0, 92.0, 86.0, 66.0, 80.0, 46.0, 27.0, 25.0, 25.0, 22.0, 17.0, 6.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.89605712890625, -1.8370361328125, -1.77801513671875, -1.718994140625, -1.65997314453125, -1.6009521484375, -1.54193115234375, -1.48291015625, -1.42388916015625, -1.3648681640625, -1.30584716796875, -1.246826171875, -1.18780517578125, -1.1287841796875, -1.06976318359375, -1.0107421875, -0.95172119140625, -0.8927001953125, -0.83367919921875, -0.774658203125, -0.71563720703125, -0.6566162109375, -0.59759521484375, -0.53857421875, -0.47955322265625, -0.4205322265625, -0.36151123046875, -0.302490234375, -0.24346923828125, -0.1844482421875, -0.12542724609375, -0.06640625, -0.00738525390625, 0.0516357421875, 0.11065673828125, 0.169677734375, 0.22869873046875, 0.2877197265625, 0.34674072265625, 0.40576171875, 0.46478271484375, 0.5238037109375, 0.58282470703125, 0.641845703125, 0.70086669921875, 0.7598876953125, 0.81890869140625, 0.8779296875, 0.93695068359375, 0.9959716796875, 1.05499267578125, 1.114013671875, 1.17303466796875, 1.2320556640625, 1.29107666015625, 1.35009765625, 1.40911865234375, 1.4681396484375, 1.52716064453125, 1.586181640625, 1.64520263671875, 1.7042236328125, 1.76324462890625, 1.822265625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 11.0, 10.0, 21.0, 48.0, 42.0, 86.0, 149.0, 372.0, 1113.0, 4557.0, 31237.0, 2786627.0, 1337618.0, 26646.0, 3989.0, 995.0, 398.0, 139.0, 83.0, 34.0, 33.0, 17.0, 10.0, 10.0, 3.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.84765625, -4.69598388671875, -4.5443115234375, -4.39263916015625, -4.240966796875, -4.08929443359375, -3.9376220703125, -3.78594970703125, -3.63427734375, -3.48260498046875, -3.3309326171875, -3.17926025390625, -3.027587890625, -2.87591552734375, -2.7242431640625, -2.57257080078125, -2.4208984375, -2.26922607421875, -2.1175537109375, -1.96588134765625, -1.814208984375, -1.66253662109375, -1.5108642578125, -1.35919189453125, -1.20751953125, -1.05584716796875, -0.9041748046875, -0.75250244140625, -0.600830078125, -0.44915771484375, -0.2974853515625, -0.14581298828125, 0.005859375, 0.15753173828125, 0.3092041015625, 0.46087646484375, 0.612548828125, 0.76422119140625, 0.9158935546875, 1.06756591796875, 1.21923828125, 1.37091064453125, 1.5225830078125, 1.67425537109375, 1.825927734375, 1.97760009765625, 2.1292724609375, 2.28094482421875, 2.4326171875, 2.58428955078125, 2.7359619140625, 2.88763427734375, 3.039306640625, 3.19097900390625, 3.3426513671875, 3.49432373046875, 3.64599609375, 3.79766845703125, 3.9493408203125, 4.10101318359375, 4.252685546875, 4.40435791015625, 4.5560302734375, 4.70770263671875, 4.859375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 7.0, 22.0, 17.0, 23.0, 28.0, 45.0, 68.0, 84.0, 94.0, 176.0, 355.0, 597.0, 1052.0, 559.0, 310.0, 203.0, 100.0, 86.0, 61.0, 42.0, 28.0, 22.0, 20.0, 13.0, 8.0, 18.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.60546875, -0.5849685668945312, -0.5644683837890625, -0.5439682006835938, -0.523468017578125, -0.5029678344726562, -0.4824676513671875, -0.46196746826171875, -0.44146728515625, -0.42096710205078125, -0.4004669189453125, -0.37996673583984375, -0.359466552734375, -0.33896636962890625, -0.3184661865234375, -0.29796600341796875, -0.2774658203125, -0.25696563720703125, -0.2364654541015625, -0.21596527099609375, -0.195465087890625, -0.17496490478515625, -0.1544647216796875, -0.13396453857421875, -0.11346435546875, -0.09296417236328125, -0.0724639892578125, -0.05196380615234375, -0.031463623046875, -0.01096343994140625, 0.0095367431640625, 0.03003692626953125, 0.050537109375, 0.07103729248046875, 0.0915374755859375, 0.11203765869140625, 0.132537841796875, 0.15303802490234375, 0.1735382080078125, 0.19403839111328125, 0.21453857421875, 0.23503875732421875, 0.2555389404296875, 0.27603912353515625, 0.296539306640625, 0.31703948974609375, 0.3375396728515625, 0.35803985595703125, 0.3785400390625, 0.39904022216796875, 0.4195404052734375, 0.44004058837890625, 0.460540771484375, 0.48104095458984375, 0.5015411376953125, 0.5220413208007812, 0.54254150390625, 0.5630416870117188, 0.5835418701171875, 0.6040420532226562, 0.624542236328125, 0.6450424194335938, 0.6655426025390625, 0.6860427856445312, 0.70654296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 5.0, 10.0, 31.0, 35.0, 53.0, 104.0, 152.0, 170.0, 159.0, 122.0, 55.0, 49.0, 17.0, 15.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2743020057678223, -3.1289138793945312, -2.9835257530212402, -2.838137626647949, -2.692749500274658, -2.547361373901367, -2.401973247528076, -2.256585121154785, -2.111196994781494, -1.9658088684082031, -1.820420742034912, -1.675032615661621, -1.52964448928833, -1.384256362915039, -1.2388681173324585, -1.0934799909591675, -0.9480917453765869, -0.8027036190032959, -0.6573154926300049, -0.5119273066520691, -0.3665391802787781, -0.22115105390548706, -0.07576286792755127, 0.06962525844573975, 0.21501338481903076, 0.3604015111923218, 0.5057896375656128, 0.6511778235435486, 0.7965659499168396, 0.9419540762901306, 1.0873422622680664, 1.2327303886413574, 1.3781185150146484, 1.5235066413879395, 1.6688947677612305, 1.8142828941345215, 1.9596710205078125, 2.1050591468811035, 2.2504472732543945, 2.3958353996276855, 2.5412235260009766, 2.6866116523742676, 2.8319997787475586, 2.9773879051208496, 3.1227760314941406, 3.2681641578674316, 3.4135522842407227, 3.5589404106140137, 3.704328775405884, 3.849716901779175, 3.995105028152466, 4.140493392944336, 4.285881519317627, 4.431269645690918, 4.576657772064209, 4.7220458984375, 4.867434024810791, 5.012822151184082, 5.158210277557373, 5.303598403930664, 5.448986530303955, 5.594374656677246, 5.739762783050537, 5.885150909423828, 6.030539035797119]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 12.0, 12.0, 24.0, 13.0, 27.0, 17.0, 32.0, 35.0, 46.0, 44.0, 50.0, 51.0, 60.0, 60.0, 51.0, 49.0, 56.0, 52.0, 45.0, 34.0, 43.0, 27.0, 29.0, 28.0, 16.0, 20.0, 10.0, 11.0, 3.0, 4.0, 2.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.029968023300171, -1.9686391353607178, -1.907310128211975, -1.845981240272522, -1.7846523523330688, -1.7233233451843262, -1.661994457244873, -1.60066556930542, -1.5393366813659668, -1.4780077934265137, -1.416678786277771, -1.3553498983383179, -1.2940210103988647, -1.232692003250122, -1.171363115310669, -1.1100342273712158, -1.0487052202224731, -0.9873762726783752, -0.9260473847389221, -0.8647184371948242, -0.8033895492553711, -0.7420606017112732, -0.6807316541671753, -0.6194027662277222, -0.5580738186836243, -0.49674490094184875, -0.43541598320007324, -0.37408703565597534, -0.31275811791419983, -0.2514292001724243, -0.19010025262832642, -0.1287713348865509, -0.06744253635406494, -0.006113611161708832, 0.05521531403064728, 0.11654424667358398, 0.1778731644153595, 0.239202082157135, 0.3005310297012329, 0.3618599474430084, 0.42318886518478394, 0.48451778292655945, 0.545846700668335, 0.6071756482124329, 0.6685045957565308, 0.7298334836959839, 0.7911624312400818, 0.8524913787841797, 0.9138202667236328, 0.9751492142677307, 1.0364781618118286, 1.0978070497512817, 1.1591359376907349, 1.2204649448394775, 1.2817938327789307, 1.3431227207183838, 1.404451608657837, 1.46578049659729, 1.5271095037460327, 1.5884383916854858, 1.649767279624939, 1.7110962867736816, 1.7724251747131348, 1.833754062652588, 1.8950830698013306]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 5.0, 13.0, 9.0, 13.0, 23.0, 33.0, 39.0, 68.0, 75.0, 127.0, 214.0, 351.0, 536.0, 966.0, 1564.0, 2969.0, 5989.0, 14633.0, 48827.0, 261582.0, 535112.0, 127286.0, 28116.0, 9907.0, 4491.0, 2316.0, 1217.0, 705.0, 408.0, 303.0, 217.0, 113.0, 103.0, 58.0, 48.0, 26.0, 26.0, 10.0, 11.0, 8.0, 12.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.36962890625, -0.35852813720703125, -0.3474273681640625, -0.33632659912109375, -0.325225830078125, -0.31412506103515625, -0.3030242919921875, -0.29192352294921875, -0.28082275390625, -0.26972198486328125, -0.2586212158203125, -0.24752044677734375, -0.236419677734375, -0.22531890869140625, -0.2142181396484375, -0.20311737060546875, -0.1920166015625, -0.18091583251953125, -0.1698150634765625, -0.15871429443359375, -0.147613525390625, -0.13651275634765625, -0.1254119873046875, -0.11431121826171875, -0.10321044921875, -0.09210968017578125, -0.0810089111328125, -0.06990814208984375, -0.058807373046875, -0.04770660400390625, -0.0366058349609375, -0.02550506591796875, -0.014404296875, -0.00330352783203125, 0.0077972412109375, 0.01889801025390625, 0.029998779296875, 0.04109954833984375, 0.0522003173828125, 0.06330108642578125, 0.07440185546875, 0.08550262451171875, 0.0966033935546875, 0.10770416259765625, 0.118804931640625, 0.12990570068359375, 0.1410064697265625, 0.15210723876953125, 0.1632080078125, 0.17430877685546875, 0.1854095458984375, 0.19651031494140625, 0.207611083984375, 0.21871185302734375, 0.2298126220703125, 0.24091339111328125, 0.25201416015625, 0.26311492919921875, 0.2742156982421875, 0.28531646728515625, 0.296417236328125, 0.30751800537109375, 0.3186187744140625, 0.32971954345703125, 0.3408203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 11.0, 9.0, 17.0, 19.0, 16.0, 27.0, 26.0, 46.0, 49.0, 39.0, 64.0, 60.0, 65.0, 71.0, 52.0, 53.0, 42.0, 47.0, 50.0, 35.0, 35.0, 35.0, 26.0, 24.0, 16.0, 11.0, 7.0, 6.0, 10.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.6683197021484375, -1.616912841796875, -1.5655059814453125, -1.51409912109375, -1.4626922607421875, -1.411285400390625, -1.3598785400390625, -1.3084716796875, -1.2570648193359375, -1.205657958984375, -1.1542510986328125, -1.10284423828125, -1.0514373779296875, -1.000030517578125, -0.9486236572265625, -0.897216796875, -0.8458099365234375, -0.794403076171875, -0.7429962158203125, -0.69158935546875, -0.6401824951171875, -0.588775634765625, -0.5373687744140625, -0.4859619140625, -0.4345550537109375, -0.383148193359375, -0.3317413330078125, -0.28033447265625, -0.2289276123046875, -0.177520751953125, -0.1261138916015625, -0.07470703125, -0.0233001708984375, 0.028106689453125, 0.0795135498046875, 0.13092041015625, 0.1823272705078125, 0.233734130859375, 0.2851409912109375, 0.3365478515625, 0.3879547119140625, 0.439361572265625, 0.4907684326171875, 0.54217529296875, 0.5935821533203125, 0.644989013671875, 0.6963958740234375, 0.747802734375, 0.7992095947265625, 0.850616455078125, 0.9020233154296875, 0.95343017578125, 1.0048370361328125, 1.056243896484375, 1.1076507568359375, 1.1590576171875, 1.2104644775390625, 1.261871337890625, 1.3132781982421875, 1.36468505859375, 1.4160919189453125, 1.467498779296875, 1.5189056396484375, 1.5703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 1.0, 4.0, 4.0, 6.0, 12.0, 15.0, 18.0, 35.0, 28.0, 53.0, 64.0, 99.0, 116.0, 235.0, 376.0, 561.0, 940.0, 1664.0, 3374.0, 7775.0, 21335.0, 86718.0, 403508.0, 399290.0, 85691.0, 21343.0, 7624.0, 3401.0, 1670.0, 961.0, 550.0, 338.0, 229.0, 146.0, 112.0, 68.0, 46.0, 30.0, 34.0, 22.0, 13.0, 9.0, 13.0, 8.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.293701171875, -0.2839088439941406, -0.27411651611328125, -0.2643241882324219, -0.2545318603515625, -0.24473953247070312, -0.23494720458984375, -0.22515487670898438, -0.215362548828125, -0.20557022094726562, -0.19577789306640625, -0.18598556518554688, -0.1761932373046875, -0.16640090942382812, -0.15660858154296875, -0.14681625366210938, -0.13702392578125, -0.12723159790039062, -0.11743927001953125, -0.10764694213867188, -0.0978546142578125, -0.08806228637695312, -0.07826995849609375, -0.06847763061523438, -0.058685302734375, -0.048892974853515625, -0.03910064697265625, -0.029308319091796875, -0.0195159912109375, -0.009723663330078125, 6.866455078125e-05, 0.009860992431640625, 0.0196533203125, 0.029445648193359375, 0.03923797607421875, 0.049030303955078125, 0.0588226318359375, 0.06861495971679688, 0.07840728759765625, 0.08819961547851562, 0.097991943359375, 0.10778427124023438, 0.11757659912109375, 0.12736892700195312, 0.1371612548828125, 0.14695358276367188, 0.15674591064453125, 0.16653823852539062, 0.17633056640625, 0.18612289428710938, 0.19591522216796875, 0.20570755004882812, 0.2154998779296875, 0.22529220581054688, 0.23508453369140625, 0.24487686157226562, 0.254669189453125, 0.2644615173339844, 0.27425384521484375, 0.2840461730957031, 0.2938385009765625, 0.3036308288574219, 0.31342315673828125, 0.3232154846191406, 0.3330078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 15.0, 10.0, 12.0, 18.0, 22.0, 24.0, 24.0, 25.0, 31.0, 34.0, 48.0, 49.0, 53.0, 53.0, 66.0, 65.0, 59.0, 47.0, 47.0, 48.0, 48.0, 28.0, 33.0, 27.0, 18.0, 13.0, 18.0, 15.0, 13.0, 13.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.04296875, -2.93072509765625, -2.8184814453125, -2.70623779296875, -2.593994140625, -2.48175048828125, -2.3695068359375, -2.25726318359375, -2.14501953125, -2.03277587890625, -1.9205322265625, -1.80828857421875, -1.696044921875, -1.58380126953125, -1.4715576171875, -1.35931396484375, -1.2470703125, -1.13482666015625, -1.0225830078125, -0.91033935546875, -0.798095703125, -0.68585205078125, -0.5736083984375, -0.46136474609375, -0.34912109375, -0.23687744140625, -0.1246337890625, -0.01239013671875, 0.099853515625, 0.21209716796875, 0.3243408203125, 0.43658447265625, 0.548828125, 0.66107177734375, 0.7733154296875, 0.88555908203125, 0.997802734375, 1.11004638671875, 1.2222900390625, 1.33453369140625, 1.44677734375, 1.55902099609375, 1.6712646484375, 1.78350830078125, 1.895751953125, 2.00799560546875, 2.1202392578125, 2.23248291015625, 2.3447265625, 2.45697021484375, 2.5692138671875, 2.68145751953125, 2.793701171875, 2.90594482421875, 3.0181884765625, 3.13043212890625, 3.24267578125, 3.35491943359375, 3.4671630859375, 3.57940673828125, 3.691650390625, 3.80389404296875, 3.9161376953125, 4.02838134765625, 4.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 2.0, 4.0, 9.0, 10.0, 14.0, 14.0, 18.0, 31.0, 53.0, 83.0, 118.0, 229.0, 331.0, 631.0, 1293.0, 2773.0, 7003.0, 25243.0, 184313.0, 692865.0, 105731.0, 17731.0, 5347.0, 2242.0, 1048.0, 577.0, 338.0, 161.0, 101.0, 77.0, 41.0, 38.0, 27.0, 16.0, 13.0, 4.0, 6.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11956787109375, -0.11575794219970703, -0.11194801330566406, -0.1081380844116211, -0.10432815551757812, -0.10051822662353516, -0.09670829772949219, -0.09289836883544922, -0.08908843994140625, -0.08527851104736328, -0.08146858215332031, -0.07765865325927734, -0.07384872436523438, -0.0700387954711914, -0.06622886657714844, -0.06241893768310547, -0.0586090087890625, -0.05479907989501953, -0.05098915100097656, -0.047179222106933594, -0.043369293212890625, -0.039559364318847656, -0.03574943542480469, -0.03193950653076172, -0.02812957763671875, -0.02431964874267578, -0.020509719848632812, -0.016699790954589844, -0.012889862060546875, -0.009079933166503906, -0.0052700042724609375, -0.0014600753784179688, 0.002349853515625, 0.006159782409667969, 0.009969711303710938, 0.013779640197753906, 0.017589569091796875, 0.021399497985839844, 0.025209426879882812, 0.02901935577392578, 0.03282928466796875, 0.03663921356201172, 0.04044914245605469, 0.044259071350097656, 0.048069000244140625, 0.051878929138183594, 0.05568885803222656, 0.05949878692626953, 0.0633087158203125, 0.06711864471435547, 0.07092857360839844, 0.0747385025024414, 0.07854843139648438, 0.08235836029052734, 0.08616828918457031, 0.08997821807861328, 0.09378814697265625, 0.09759807586669922, 0.10140800476074219, 0.10521793365478516, 0.10902786254882812, 0.1128377914428711, 0.11664772033691406, 0.12045764923095703, 0.124267578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 7.0, 6.0, 4.0, 4.0, 15.0, 16.0, 23.0, 21.0, 32.0, 46.0, 78.0, 87.0, 78.0, 90.0, 102.0, 100.0, 62.0, 61.0, 46.0, 29.0, 26.0, 14.0, 15.0, 11.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9591064453125e-05, -4.779268056154251e-05, -4.599429666996002e-05, -4.419591277837753e-05, -4.2397528886795044e-05, -4.0599144995212555e-05, -3.8800761103630066e-05, -3.700237721204758e-05, -3.520399332046509e-05, -3.34056094288826e-05, -3.160722553730011e-05, -2.980884164571762e-05, -2.8010457754135132e-05, -2.6212073862552643e-05, -2.4413689970970154e-05, -2.2615306079387665e-05, -2.0816922187805176e-05, -1.9018538296222687e-05, -1.7220154404640198e-05, -1.542177051305771e-05, -1.362338662147522e-05, -1.182500272989273e-05, -1.0026618838310242e-05, -8.228234946727753e-06, -6.429851055145264e-06, -4.631467163562775e-06, -2.8330832719802856e-06, -1.0346993803977966e-06, 7.636845111846924e-07, 2.5620684027671814e-06, 4.36045229434967e-06, 6.1588361859321594e-06, 7.957220077514648e-06, 9.755603969097137e-06, 1.1553987860679626e-05, 1.3352371752262115e-05, 1.5150755643844604e-05, 1.6949139535427094e-05, 1.8747523427009583e-05, 2.054590731859207e-05, 2.234429121017456e-05, 2.414267510175705e-05, 2.594105899333954e-05, 2.7739442884922028e-05, 2.9537826776504517e-05, 3.1336210668087006e-05, 3.3134594559669495e-05, 3.4932978451251984e-05, 3.673136234283447e-05, 3.852974623441696e-05, 4.032813012599945e-05, 4.212651401758194e-05, 4.392489790916443e-05, 4.572328180074692e-05, 4.752166569232941e-05, 4.9320049583911896e-05, 5.1118433475494385e-05, 5.2916817367076874e-05, 5.471520125865936e-05, 5.651358515024185e-05, 5.831196904182434e-05, 6.011035293340683e-05, 6.190873682498932e-05, 6.370712071657181e-05, 6.55055046081543e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 11.0, 15.0, 14.0, 29.0, 36.0, 72.0, 101.0, 165.0, 282.0, 455.0, 873.0, 1707.0, 3650.0, 9005.0, 28942.0, 209224.0, 680277.0, 84464.0, 17407.0, 6223.0, 2622.0, 1334.0, 648.0, 368.0, 238.0, 151.0, 57.0, 64.0, 34.0, 21.0, 16.0, 7.0, 8.0, 6.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.146240234375, -0.14209842681884766, -0.1379566192626953, -0.13381481170654297, -0.12967300415039062, -0.12553119659423828, -0.12138938903808594, -0.1172475814819336, -0.11310577392578125, -0.1089639663696289, -0.10482215881347656, -0.10068035125732422, -0.09653854370117188, -0.09239673614501953, -0.08825492858886719, -0.08411312103271484, -0.0799713134765625, -0.07582950592041016, -0.07168769836425781, -0.06754589080810547, -0.06340408325195312, -0.05926227569580078, -0.05512046813964844, -0.050978660583496094, -0.04683685302734375, -0.042695045471191406, -0.03855323791503906, -0.03441143035888672, -0.030269622802734375, -0.02612781524658203, -0.021986007690429688, -0.017844200134277344, -0.013702392578125, -0.009560585021972656, -0.0054187774658203125, -0.0012769699096679688, 0.002864837646484375, 0.007006645202636719, 0.011148452758789062, 0.015290260314941406, 0.01943206787109375, 0.023573875427246094, 0.027715682983398438, 0.03185749053955078, 0.035999298095703125, 0.04014110565185547, 0.04428291320800781, 0.048424720764160156, 0.0525665283203125, 0.056708335876464844, 0.06085014343261719, 0.06499195098876953, 0.06913375854492188, 0.07327556610107422, 0.07741737365722656, 0.0815591812133789, 0.08570098876953125, 0.0898427963256836, 0.09398460388183594, 0.09812641143798828, 0.10226821899414062, 0.10641002655029297, 0.11055183410644531, 0.11469364166259766, 0.11883544921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 1.0, 3.0, 6.0, 5.0, 8.0, 24.0, 22.0, 36.0, 45.0, 88.0, 107.0, 162.0, 144.0, 108.0, 80.0, 37.0, 32.0, 13.0, 19.0, 10.0, 11.0, 7.0, 6.0, 3.0, 1.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.046905517578125, -0.04563283920288086, -0.04436016082763672, -0.04308748245239258, -0.04181480407714844, -0.0405421257019043, -0.039269447326660156, -0.037996768951416016, -0.036724090576171875, -0.035451412200927734, -0.034178733825683594, -0.03290605545043945, -0.03163337707519531, -0.030360698699951172, -0.02908802032470703, -0.02781534194946289, -0.02654266357421875, -0.02526998519897461, -0.02399730682373047, -0.022724628448486328, -0.021451950073242188, -0.020179271697998047, -0.018906593322753906, -0.017633914947509766, -0.016361236572265625, -0.015088558197021484, -0.013815879821777344, -0.012543201446533203, -0.011270523071289062, -0.009997844696044922, -0.008725166320800781, -0.007452487945556641, -0.0061798095703125, -0.004907131195068359, -0.0036344528198242188, -0.002361774444580078, -0.0010890960693359375, 0.00018358230590820312, 0.0014562606811523438, 0.0027289390563964844, 0.004001617431640625, 0.005274295806884766, 0.006546974182128906, 0.007819652557373047, 0.009092330932617188, 0.010365009307861328, 0.011637687683105469, 0.01291036605834961, 0.01418304443359375, 0.01545572280883789, 0.01672840118408203, 0.018001079559326172, 0.019273757934570312, 0.020546436309814453, 0.021819114685058594, 0.023091793060302734, 0.024364471435546875, 0.025637149810791016, 0.026909828186035156, 0.028182506561279297, 0.029455184936523438, 0.030727863311767578, 0.03200054168701172, 0.03327322006225586, 0.0345458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 1.0, 5.0, 7.0, 6.0, 11.0, 22.0, 29.0, 47.0, 82.0, 149.0, 153.0, 147.0, 125.0, 88.0, 54.0, 31.0, 18.0, 11.0, 3.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7874157428741455, -2.6876680850982666, -2.5879201889038086, -2.4881725311279297, -2.388424873352051, -2.288677215576172, -2.188929557800293, -2.089181661605835, -1.989434003829956, -1.8896863460540771, -1.7899385690689087, -1.6901907920837402, -1.5904431343078613, -1.4906954765319824, -1.390947699546814, -1.2911999225616455, -1.1914522647857666, -1.0917046070098877, -0.9919568300247192, -0.8922091126441956, -0.7924613952636719, -0.6927136778831482, -0.5929659605026245, -0.49321824312210083, -0.39347052574157715, -0.29372280836105347, -0.19397509098052979, -0.0942273736000061, 0.005520343780517578, 0.10526806116104126, 0.20501577854156494, 0.3047634959220886, 0.4045112133026123, 0.504258930683136, 0.6040066480636597, 0.7037543654441833, 0.803502082824707, 0.9032498002052307, 1.0029975175857544, 1.1027452945709229, 1.2024929523468018, 1.3022406101226807, 1.4019883871078491, 1.5017361640930176, 1.6014838218688965, 1.7012314796447754, 1.8009792566299438, 1.9007270336151123, 2.000474691390991, 2.10022234916687, 2.199970245361328, 2.299717903137207, 2.399465560913086, 2.499213218688965, 2.5989608764648438, 2.6987087726593018, 2.7984564304351807, 2.8982040882110596, 2.9979519844055176, 3.0976996421813965, 3.1974472999572754, 3.2971949577331543, 3.396942615509033, 3.496690511703491, 3.59643816947937]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 9.0, 4.0, 13.0, 14.0, 20.0, 28.0, 21.0, 24.0, 48.0, 57.0, 53.0, 61.0, 64.0, 63.0, 56.0, 74.0, 61.0, 59.0, 40.0, 41.0, 41.0, 30.0, 22.0, 22.0, 18.0, 7.0, 10.0, 8.0, 2.0, 5.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6601585149765015, -1.6081640720367432, -1.5561696290969849, -1.5041751861572266, -1.4521807432174683, -1.40018630027771, -1.3481918573379517, -1.2961974143981934, -1.244202971458435, -1.1922085285186768, -1.1402140855789185, -1.0882196426391602, -1.0362251996994019, -0.9842307567596436, -0.9322363138198853, -0.880241870880127, -0.8282474279403687, -0.7762529850006104, -0.724258542060852, -0.6722640991210938, -0.6202696561813354, -0.5682752132415771, -0.5162807703018188, -0.46428632736206055, -0.41229188442230225, -0.36029744148254395, -0.30830299854278564, -0.25630855560302734, -0.20431411266326904, -0.15231966972351074, -0.10032522678375244, -0.04833078384399414, 0.003663778305053711, 0.05565822124481201, 0.10765266418457031, 0.1596471071243286, 0.21164155006408691, 0.2636359930038452, 0.3156304359436035, 0.3676248788833618, 0.4196193218231201, 0.4716137647628784, 0.5236082077026367, 0.575602650642395, 0.6275970935821533, 0.6795915365219116, 0.7315859794616699, 0.7835804224014282, 0.8355748653411865, 0.8875693082809448, 0.9395637512207031, 0.9915581941604614, 1.0435526371002197, 1.095547080039978, 1.1475415229797363, 1.1995359659194946, 1.251530408859253, 1.3035248517990112, 1.3555192947387695, 1.4075137376785278, 1.4595081806182861, 1.5115026235580444, 1.5634970664978027, 1.615491509437561, 1.6674859523773193]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 13.0, 36.0, 40.0, 61.0, 94.0, 132.0, 231.0, 356.0, 633.0, 1265.0, 2530.0, 5990.0, 18944.0, 111448.0, 814344.0, 68303.0, 14404.0, 4999.0, 2170.0, 1063.0, 517.0, 318.0, 202.0, 147.0, 88.0, 55.0, 38.0, 26.0, 25.0, 12.0, 6.0, 10.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.308197021484375, -2.22967529296875, -2.151153564453125, -2.0726318359375, -1.994110107421875, -1.91558837890625, -1.837066650390625, -1.758544921875, -1.680023193359375, -1.60150146484375, -1.522979736328125, -1.4444580078125, -1.365936279296875, -1.28741455078125, -1.208892822265625, -1.13037109375, -1.051849365234375, -0.97332763671875, -0.894805908203125, -0.8162841796875, -0.737762451171875, -0.65924072265625, -0.580718994140625, -0.502197265625, -0.423675537109375, -0.34515380859375, -0.266632080078125, -0.1881103515625, -0.109588623046875, -0.03106689453125, 0.047454833984375, 0.1259765625, 0.204498291015625, 0.28302001953125, 0.361541748046875, 0.4400634765625, 0.518585205078125, 0.59710693359375, 0.675628662109375, 0.754150390625, 0.832672119140625, 0.91119384765625, 0.989715576171875, 1.0682373046875, 1.146759033203125, 1.22528076171875, 1.303802490234375, 1.38232421875, 1.460845947265625, 1.53936767578125, 1.617889404296875, 1.6964111328125, 1.774932861328125, 1.85345458984375, 1.931976318359375, 2.010498046875, 2.089019775390625, 2.16754150390625, 2.246063232421875, 2.3245849609375, 2.403106689453125, 2.48162841796875, 2.560150146484375, 2.638671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 7.0, 3.0, 2.0, 3.0, 12.0, 8.0, 15.0, 17.0, 29.0, 23.0, 23.0, 33.0, 69.0, 74.0, 69.0, 51.0, 97.0, 79.0, 82.0, 63.0, 52.0, 42.0, 31.0, 29.0, 24.0, 18.0, 13.0, 11.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.291015625, -3.179107666015625, -3.06719970703125, -2.955291748046875, -2.8433837890625, -2.731475830078125, -2.61956787109375, -2.507659912109375, -2.395751953125, -2.283843994140625, -2.17193603515625, -2.060028076171875, -1.9481201171875, -1.836212158203125, -1.72430419921875, -1.612396240234375, -1.50048828125, -1.388580322265625, -1.27667236328125, -1.164764404296875, -1.0528564453125, -0.940948486328125, -0.82904052734375, -0.717132568359375, -0.605224609375, -0.493316650390625, -0.38140869140625, -0.269500732421875, -0.1575927734375, -0.045684814453125, 0.06622314453125, 0.178131103515625, 0.2900390625, 0.401947021484375, 0.51385498046875, 0.625762939453125, 0.7376708984375, 0.849578857421875, 0.96148681640625, 1.073394775390625, 1.185302734375, 1.297210693359375, 1.40911865234375, 1.521026611328125, 1.6329345703125, 1.744842529296875, 1.85675048828125, 1.968658447265625, 2.08056640625, 2.192474365234375, 2.30438232421875, 2.416290283203125, 2.5281982421875, 2.640106201171875, 2.75201416015625, 2.863922119140625, 2.975830078125, 3.087738037109375, 3.19964599609375, 3.311553955078125, 3.4234619140625, 3.535369873046875, 3.64727783203125, 3.759185791015625, 3.87109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 12.0, 12.0, 21.0, 26.0, 26.0, 58.0, 66.0, 118.0, 237.0, 537.0, 2063.0, 13132.0, 751185.0, 268076.0, 10047.0, 1781.0, 559.0, 206.0, 126.0, 75.0, 53.0, 46.0, 26.0, 14.0, 16.0, 9.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.48828125, -6.3216552734375, -6.155029296875, -5.9884033203125, -5.82177734375, -5.6551513671875, -5.488525390625, -5.3218994140625, -5.1552734375, -4.9886474609375, -4.822021484375, -4.6553955078125, -4.48876953125, -4.3221435546875, -4.155517578125, -3.9888916015625, -3.822265625, -3.6556396484375, -3.489013671875, -3.3223876953125, -3.15576171875, -2.9891357421875, -2.822509765625, -2.6558837890625, -2.4892578125, -2.3226318359375, -2.156005859375, -1.9893798828125, -1.82275390625, -1.6561279296875, -1.489501953125, -1.3228759765625, -1.15625, -0.9896240234375, -0.822998046875, -0.6563720703125, -0.48974609375, -0.3231201171875, -0.156494140625, 0.0101318359375, 0.1767578125, 0.3433837890625, 0.510009765625, 0.6766357421875, 0.84326171875, 1.0098876953125, 1.176513671875, 1.3431396484375, 1.509765625, 1.6763916015625, 1.843017578125, 2.0096435546875, 2.17626953125, 2.3428955078125, 2.509521484375, 2.6761474609375, 2.8427734375, 3.0093994140625, 3.176025390625, 3.3426513671875, 3.50927734375, 3.6759033203125, 3.842529296875, 4.0091552734375, 4.17578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 6.0, 13.0, 15.0, 16.0, 21.0, 11.0, 18.0, 37.0, 42.0, 41.0, 43.0, 35.0, 64.0, 50.0, 55.0, 77.0, 56.0, 64.0, 43.0, 54.0, 46.0, 47.0, 23.0, 25.0, 29.0, 19.0, 9.0, 11.0, 9.0, 8.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4296875, -5.286163330078125, -5.14263916015625, -4.999114990234375, -4.8555908203125, -4.712066650390625, -4.56854248046875, -4.425018310546875, -4.281494140625, -4.137969970703125, -3.99444580078125, -3.850921630859375, -3.7073974609375, -3.563873291015625, -3.42034912109375, -3.276824951171875, -3.13330078125, -2.989776611328125, -2.84625244140625, -2.702728271484375, -2.5592041015625, -2.415679931640625, -2.27215576171875, -2.128631591796875, -1.985107421875, -1.841583251953125, -1.69805908203125, -1.554534912109375, -1.4110107421875, -1.267486572265625, -1.12396240234375, -0.980438232421875, -0.8369140625, -0.693389892578125, -0.54986572265625, -0.406341552734375, -0.2628173828125, -0.119293212890625, 0.02423095703125, 0.167755126953125, 0.311279296875, 0.454803466796875, 0.59832763671875, 0.741851806640625, 0.8853759765625, 1.028900146484375, 1.17242431640625, 1.315948486328125, 1.45947265625, 1.602996826171875, 1.74652099609375, 1.890045166015625, 2.0335693359375, 2.177093505859375, 2.32061767578125, 2.464141845703125, 2.607666015625, 2.751190185546875, 2.89471435546875, 3.038238525390625, 3.1817626953125, 3.325286865234375, 3.46881103515625, 3.612335205078125, 3.755859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 6.0, 13.0, 12.0, 13.0, 21.0, 44.0, 84.0, 184.0, 464.0, 2007.0, 15396.0, 326747.0, 680563.0, 19581.0, 2469.0, 549.0, 191.0, 89.0, 40.0, 33.0, 10.0, 7.0, 7.0, 3.0, 6.0, 9.0, 4.0, 2.0, 1.0], "bins": [-1.572265625, -1.538848876953125, -1.50543212890625, -1.472015380859375, -1.4385986328125, -1.405181884765625, -1.37176513671875, -1.338348388671875, -1.304931640625, -1.271514892578125, -1.23809814453125, -1.204681396484375, -1.1712646484375, -1.137847900390625, -1.10443115234375, -1.071014404296875, -1.03759765625, -1.004180908203125, -0.97076416015625, -0.937347412109375, -0.9039306640625, -0.870513916015625, -0.83709716796875, -0.803680419921875, -0.770263671875, -0.736846923828125, -0.70343017578125, -0.670013427734375, -0.6365966796875, -0.603179931640625, -0.56976318359375, -0.536346435546875, -0.5029296875, -0.469512939453125, -0.43609619140625, -0.402679443359375, -0.3692626953125, -0.335845947265625, -0.30242919921875, -0.269012451171875, -0.235595703125, -0.202178955078125, -0.16876220703125, -0.135345458984375, -0.1019287109375, -0.068511962890625, -0.03509521484375, -0.001678466796875, 0.03173828125, 0.065155029296875, 0.09857177734375, 0.131988525390625, 0.1654052734375, 0.198822021484375, 0.23223876953125, 0.265655517578125, 0.299072265625, 0.332489013671875, 0.36590576171875, 0.399322509765625, 0.4327392578125, 0.466156005859375, 0.49957275390625, 0.532989501953125, 0.56640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 3.0, 4.0, 6.0, 11.0, 14.0, 10.0, 19.0, 30.0, 28.0, 62.0, 96.0, 192.0, 196.0, 98.0, 61.0, 38.0, 38.0, 24.0, 6.0, 17.0, 8.0, 7.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.604194641113281e-05, -6.330013275146484e-05, -6.0558319091796875e-05, -5.7816505432128906e-05, -5.507469177246094e-05, -5.233287811279297e-05, -4.9591064453125e-05, -4.684925079345703e-05, -4.410743713378906e-05, -4.1365623474121094e-05, -3.8623809814453125e-05, -3.5881996154785156e-05, -3.314018249511719e-05, -3.039836883544922e-05, -2.765655517578125e-05, -2.491474151611328e-05, -2.2172927856445312e-05, -1.9431114196777344e-05, -1.6689300537109375e-05, -1.3947486877441406e-05, -1.1205673217773438e-05, -8.463859558105469e-06, -5.7220458984375e-06, -2.9802322387695312e-06, -2.384185791015625e-07, 2.5033950805664062e-06, 5.245208740234375e-06, 7.987022399902344e-06, 1.0728836059570312e-05, 1.3470649719238281e-05, 1.621246337890625e-05, 1.895427703857422e-05, 2.1696090698242188e-05, 2.4437904357910156e-05, 2.7179718017578125e-05, 2.9921531677246094e-05, 3.266334533691406e-05, 3.540515899658203e-05, 3.814697265625e-05, 4.088878631591797e-05, 4.363059997558594e-05, 4.6372413635253906e-05, 4.9114227294921875e-05, 5.1856040954589844e-05, 5.459785461425781e-05, 5.733966827392578e-05, 6.008148193359375e-05, 6.282329559326172e-05, 6.556510925292969e-05, 6.830692291259766e-05, 7.104873657226562e-05, 7.37905502319336e-05, 7.653236389160156e-05, 7.927417755126953e-05, 8.20159912109375e-05, 8.475780487060547e-05, 8.749961853027344e-05, 9.02414321899414e-05, 9.298324584960938e-05, 9.572505950927734e-05, 9.846687316894531e-05, 0.00010120868682861328, 0.00010395050048828125, 0.00010669231414794922, 0.00010943412780761719]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 7.0, 11.0, 15.0, 29.0, 50.0, 86.0, 193.0, 512.0, 1538.0, 7191.0, 54463.0, 882651.0, 88806.0, 9951.0, 2025.0, 574.0, 227.0, 100.0, 57.0, 25.0, 15.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94970703125, -0.9176101684570312, -0.8855133056640625, -0.8534164428710938, -0.821319580078125, -0.7892227172851562, -0.7571258544921875, -0.7250289916992188, -0.69293212890625, -0.6608352661132812, -0.6287384033203125, -0.5966415405273438, -0.564544677734375, -0.5324478149414062, -0.5003509521484375, -0.46825408935546875, -0.4361572265625, -0.40406036376953125, -0.3719635009765625, -0.33986663818359375, -0.307769775390625, -0.27567291259765625, -0.2435760498046875, -0.21147918701171875, -0.17938232421875, -0.14728546142578125, -0.1151885986328125, -0.08309173583984375, -0.050994873046875, -0.01889801025390625, 0.0131988525390625, 0.04529571533203125, 0.077392578125, 0.10948944091796875, 0.1415863037109375, 0.17368316650390625, 0.205780029296875, 0.23787689208984375, 0.2699737548828125, 0.30207061767578125, 0.33416748046875, 0.36626434326171875, 0.3983612060546875, 0.43045806884765625, 0.462554931640625, 0.49465179443359375, 0.5267486572265625, 0.5588455200195312, 0.5909423828125, 0.6230392456054688, 0.6551361083984375, 0.6872329711914062, 0.719329833984375, 0.7514266967773438, 0.7835235595703125, 0.8156204223632812, 0.84771728515625, 0.8798141479492188, 0.9119110107421875, 0.9440078735351562, 0.976104736328125, 1.0082015991210938, 1.0402984619140625, 1.0723953247070312, 1.1044921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 7.0, 3.0, 6.0, 6.0, 19.0, 23.0, 18.0, 39.0, 52.0, 67.0, 114.0, 268.0, 115.0, 66.0, 47.0, 31.0, 34.0, 12.0, 17.0, 13.0, 7.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31298828125, -0.3030548095703125, -0.293121337890625, -0.2831878662109375, -0.27325439453125, -0.2633209228515625, -0.253387451171875, -0.2434539794921875, -0.2335205078125, -0.2235870361328125, -0.213653564453125, -0.2037200927734375, -0.19378662109375, -0.1838531494140625, -0.173919677734375, -0.1639862060546875, -0.154052734375, -0.1441192626953125, -0.134185791015625, -0.1242523193359375, -0.11431884765625, -0.1043853759765625, -0.094451904296875, -0.0845184326171875, -0.0745849609375, -0.0646514892578125, -0.054718017578125, -0.0447845458984375, -0.03485107421875, -0.0249176025390625, -0.014984130859375, -0.0050506591796875, 0.0048828125, 0.0148162841796875, 0.024749755859375, 0.0346832275390625, 0.04461669921875, 0.0545501708984375, 0.064483642578125, 0.0744171142578125, 0.0843505859375, 0.0942840576171875, 0.104217529296875, 0.1141510009765625, 0.12408447265625, 0.1340179443359375, 0.143951416015625, 0.1538848876953125, 0.163818359375, 0.1737518310546875, 0.183685302734375, 0.1936187744140625, 0.20355224609375, 0.2134857177734375, 0.223419189453125, 0.2333526611328125, 0.2432861328125, 0.2532196044921875, 0.263153076171875, 0.2730865478515625, 0.28302001953125, 0.2929534912109375, 0.302886962890625, 0.3128204345703125, 0.32275390625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 9.0, 5.0, 24.0, 50.0, 134.0, 278.0, 271.0, 153.0, 55.0, 12.0, 9.0, 1.0, 6.0, 1.0, 2.0, 0.0, 3.0], "bins": [-21.024106979370117, -20.627666473388672, -20.231225967407227, -19.83478546142578, -19.438343048095703, -19.041902542114258, -18.645462036132812, -18.249021530151367, -17.852581024169922, -17.456140518188477, -17.05970001220703, -16.663259506225586, -16.266817092895508, -15.870377540588379, -15.473936080932617, -15.077495574951172, -14.681055068969727, -14.284614562988281, -13.88817310333252, -13.491732597351074, -13.095292091369629, -12.698851585388184, -12.302410125732422, -11.905969619750977, -11.509528160095215, -11.11308765411377, -10.716646194458008, -10.320205688476562, -9.923765182495117, -9.527324676513672, -9.13088321685791, -8.734442710876465, -8.338001251220703, -7.9415602684021, -7.545119762420654, -7.148678779602051, -6.7522382736206055, -6.355797290802002, -5.959356307983398, -5.562915802001953, -5.166475296020508, -4.770034313201904, -4.373593807220459, -3.9771528244018555, -3.58071231842041, -3.1842713356018066, -2.7878305912017822, -2.391389846801758, -1.9949493408203125, -1.598508596420288, -1.2020678520202637, -0.8056269884109497, -0.4091862440109253, -0.012745499610900879, 0.3836953639984131, 0.7801361083984375, 1.176576852798462, 1.5730175971984863, 1.9694583415985107, 2.365899085998535, 2.7623400688171387, 3.158780574798584, 3.5552215576171875, 3.951662302017212, 4.348103046417236]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 4.0, 8.0, 13.0, 13.0, 10.0, 18.0, 28.0, 15.0, 22.0, 26.0, 35.0, 27.0, 39.0, 31.0, 43.0, 44.0, 44.0, 39.0, 38.0, 48.0, 46.0, 41.0, 35.0, 45.0, 34.0, 37.0, 27.0, 23.0, 34.0, 20.0, 11.0, 14.0, 18.0, 13.0, 13.0, 7.0, 5.0, 8.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.569394111633301, -6.385113716125488, -6.200833320617676, -6.016552925109863, -5.832272529602051, -5.647992134094238, -5.463711738586426, -5.279431343078613, -5.095150947570801, -4.910870552062988, -4.726590156555176, -4.542309761047363, -4.358029365539551, -4.173748970031738, -3.989468574523926, -3.8051881790161133, -3.620907783508301, -3.4366273880004883, -3.252346992492676, -3.0680665969848633, -2.883786201477051, -2.6995058059692383, -2.515225410461426, -2.3309450149536133, -2.146664619445801, -1.9623842239379883, -1.7781038284301758, -1.5938234329223633, -1.4095430374145508, -1.2252626419067383, -1.0409822463989258, -0.8567018508911133, -0.6724214553833008, -0.4881410598754883, -0.3038606643676758, -0.11958026885986328, 0.06470012664794922, 0.24898052215576172, 0.4332609176635742, 0.6175413131713867, 0.8018217086791992, 0.9861021041870117, 1.1703824996948242, 1.3546628952026367, 1.5389432907104492, 1.7232236862182617, 1.9075040817260742, 2.0917844772338867, 2.276064872741699, 2.4603452682495117, 2.644625663757324, 2.8289060592651367, 3.013186454772949, 3.1974668502807617, 3.381747245788574, 3.5660276412963867, 3.750308036804199, 3.9345884323120117, 4.118868827819824, 4.303149223327637, 4.487429618835449, 4.671710014343262, 4.855990409851074, 5.040270805358887, 5.224551200866699]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 11.0, 6.0, 16.0, 22.0, 23.0, 34.0, 28.0, 59.0, 90.0, 130.0, 133.0, 214.0, 333.0, 560.0, 947.0, 2248.0, 6118.0, 24189.0, 248927.0, 3730464.0, 150573.0, 19479.0, 5320.0, 1981.0, 897.0, 462.0, 287.0, 193.0, 151.0, 103.0, 67.0, 60.0, 49.0, 37.0, 17.0, 16.0, 12.0, 7.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.794921875, -3.684661865234375, -3.57440185546875, -3.464141845703125, -3.3538818359375, -3.243621826171875, -3.13336181640625, -3.023101806640625, -2.912841796875, -2.802581787109375, -2.69232177734375, -2.582061767578125, -2.4718017578125, -2.361541748046875, -2.25128173828125, -2.141021728515625, -2.03076171875, -1.920501708984375, -1.81024169921875, -1.699981689453125, -1.5897216796875, -1.479461669921875, -1.36920166015625, -1.258941650390625, -1.148681640625, -1.038421630859375, -0.92816162109375, -0.817901611328125, -0.7076416015625, -0.597381591796875, -0.48712158203125, -0.376861572265625, -0.2666015625, -0.156341552734375, -0.04608154296875, 0.064178466796875, 0.1744384765625, 0.284698486328125, 0.39495849609375, 0.505218505859375, 0.615478515625, 0.725738525390625, 0.83599853515625, 0.946258544921875, 1.0565185546875, 1.166778564453125, 1.27703857421875, 1.387298583984375, 1.49755859375, 1.607818603515625, 1.71807861328125, 1.828338623046875, 1.9385986328125, 2.048858642578125, 2.15911865234375, 2.269378662109375, 2.379638671875, 2.489898681640625, 2.60015869140625, 2.710418701171875, 2.8206787109375, 2.930938720703125, 3.04119873046875, 3.151458740234375, 3.26171875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 6.0, 6.0, 9.0, 17.0, 16.0, 16.0, 37.0, 27.0, 40.0, 48.0, 68.0, 70.0, 72.0, 76.0, 94.0, 70.0, 54.0, 61.0, 58.0, 34.0, 22.0, 21.0, 14.0, 13.0, 12.0, 10.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8720703125, -1.81927490234375, -1.7664794921875, -1.71368408203125, -1.660888671875, -1.60809326171875, -1.5552978515625, -1.50250244140625, -1.44970703125, -1.39691162109375, -1.3441162109375, -1.29132080078125, -1.238525390625, -1.18572998046875, -1.1329345703125, -1.08013916015625, -1.02734375, -0.97454833984375, -0.9217529296875, -0.86895751953125, -0.816162109375, -0.76336669921875, -0.7105712890625, -0.65777587890625, -0.60498046875, -0.55218505859375, -0.4993896484375, -0.44659423828125, -0.393798828125, -0.34100341796875, -0.2882080078125, -0.23541259765625, -0.1826171875, -0.12982177734375, -0.0770263671875, -0.02423095703125, 0.028564453125, 0.08135986328125, 0.1341552734375, 0.18695068359375, 0.23974609375, 0.29254150390625, 0.3453369140625, 0.39813232421875, 0.450927734375, 0.50372314453125, 0.5565185546875, 0.60931396484375, 0.662109375, 0.71490478515625, 0.7677001953125, 0.82049560546875, 0.873291015625, 0.92608642578125, 0.9788818359375, 1.03167724609375, 1.08447265625, 1.13726806640625, 1.1900634765625, 1.24285888671875, 1.295654296875, 1.34844970703125, 1.4012451171875, 1.45404052734375, 1.5068359375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 11.0, 6.0, 13.0, 15.0, 23.0, 45.0, 79.0, 147.0, 333.0, 910.0, 4510.0, 45955.0, 3757299.0, 367265.0, 14408.0, 2212.0, 546.0, 212.0, 109.0, 51.0, 36.0, 29.0, 12.0, 9.0, 14.0, 5.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.46453857421875, -4.2767333984375, -4.08892822265625, -3.901123046875, -3.71331787109375, -3.5255126953125, -3.33770751953125, -3.14990234375, -2.96209716796875, -2.7742919921875, -2.58648681640625, -2.398681640625, -2.21087646484375, -2.0230712890625, -1.83526611328125, -1.6474609375, -1.45965576171875, -1.2718505859375, -1.08404541015625, -0.896240234375, -0.70843505859375, -0.5206298828125, -0.33282470703125, -0.14501953125, 0.04278564453125, 0.2305908203125, 0.41839599609375, 0.606201171875, 0.79400634765625, 0.9818115234375, 1.16961669921875, 1.357421875, 1.54522705078125, 1.7330322265625, 1.92083740234375, 2.108642578125, 2.29644775390625, 2.4842529296875, 2.67205810546875, 2.85986328125, 3.04766845703125, 3.2354736328125, 3.42327880859375, 3.611083984375, 3.79888916015625, 3.9866943359375, 4.17449951171875, 4.3623046875, 4.55010986328125, 4.7379150390625, 4.92572021484375, 5.113525390625, 5.30133056640625, 5.4891357421875, 5.67694091796875, 5.86474609375, 6.05255126953125, 6.2403564453125, 6.42816162109375, 6.615966796875, 6.80377197265625, 6.9915771484375, 7.17938232421875, 7.3671875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 14.0, 8.0, 12.0, 16.0, 20.0, 25.0, 29.0, 39.0, 76.0, 90.0, 131.0, 217.0, 337.0, 571.0, 763.0, 594.0, 382.0, 219.0, 153.0, 93.0, 69.0, 34.0, 44.0, 26.0, 24.0, 13.0, 16.0, 8.0, 10.0, 7.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7569046020507812, -0.7350006103515625, -0.7130966186523438, -0.691192626953125, -0.6692886352539062, -0.6473846435546875, -0.6254806518554688, -0.60357666015625, -0.5816726684570312, -0.5597686767578125, -0.5378646850585938, -0.515960693359375, -0.49405670166015625, -0.4721527099609375, -0.45024871826171875, -0.4283447265625, -0.40644073486328125, -0.3845367431640625, -0.36263275146484375, -0.340728759765625, -0.31882476806640625, -0.2969207763671875, -0.27501678466796875, -0.25311279296875, -0.23120880126953125, -0.2093048095703125, -0.18740081787109375, -0.165496826171875, -0.14359283447265625, -0.1216888427734375, -0.09978485107421875, -0.077880859375, -0.05597686767578125, -0.0340728759765625, -0.01216888427734375, 0.009735107421875, 0.03163909912109375, 0.0535430908203125, 0.07544708251953125, 0.09735107421875, 0.11925506591796875, 0.1411590576171875, 0.16306304931640625, 0.184967041015625, 0.20687103271484375, 0.2287750244140625, 0.25067901611328125, 0.2725830078125, 0.29448699951171875, 0.3163909912109375, 0.33829498291015625, 0.360198974609375, 0.38210296630859375, 0.4040069580078125, 0.42591094970703125, 0.44781494140625, 0.46971893310546875, 0.4916229248046875, 0.5135269165039062, 0.535430908203125, 0.5573348999023438, 0.5792388916015625, 0.6011428833007812, 0.623046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 13.0, 21.0, 12.0, 28.0, 33.0, 49.0, 65.0, 79.0, 102.0, 122.0, 98.0, 98.0, 88.0, 58.0, 45.0, 26.0, 30.0, 13.0, 11.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.552720069885254, -2.454667091369629, -2.356614351272583, -2.258561372756958, -2.160508632659912, -2.062455654144287, -1.9644027948379517, -1.8663499355316162, -1.7682969570159912, -1.6702440977096558, -1.5721912384033203, -1.4741382598876953, -1.3760854005813599, -1.2780325412750244, -1.179979681968689, -1.0819268226623535, -0.9838739633560181, -0.8858211040496826, -0.7877681851387024, -0.6897153258323669, -0.5916624069213867, -0.49360954761505127, -0.3955566883087158, -0.2975037693977356, -0.19945091009140015, -0.1013980284333229, -0.0033451467752456665, 0.09470772743225098, 0.1927606165409088, 0.29081350564956665, 0.3888663649559021, 0.4869192838668823, 0.5849721431732178, 0.6830250024795532, 0.7810779213905334, 0.8791307806968689, 0.9771836996078491, 1.0752365589141846, 1.17328941822052, 1.2713422775268555, 1.3693952560424805, 1.467448115348816, 1.5655009746551514, 1.6635539531707764, 1.7616068124771118, 1.8596596717834473, 1.9577125310897827, 2.055765390396118, 2.153818130493164, 2.251871109008789, 2.349923849105835, 2.44797682762146, 2.546029567718506, 2.644082546234131, 2.742135524749756, 2.8401882648468018, 2.9382412433624268, 3.0362942218780518, 3.1343469619750977, 3.2323999404907227, 3.3304526805877686, 3.4285056591033936, 3.5265583992004395, 3.6246113777160645, 3.7226643562316895]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 2.0, 4.0, 9.0, 12.0, 11.0, 19.0, 19.0, 18.0, 21.0, 25.0, 23.0, 31.0, 33.0, 38.0, 39.0, 38.0, 46.0, 42.0, 40.0, 53.0, 55.0, 39.0, 49.0, 34.0, 30.0, 36.0, 26.0, 25.0, 28.0, 23.0, 20.0, 23.0, 11.0, 11.0, 15.0, 12.0, 6.0, 5.0, 2.0, 4.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4101009368896484, -1.361124873161316, -1.312148928642273, -1.2631728649139404, -1.2141969203948975, -1.165220856666565, -1.1162447929382324, -1.0672688484191895, -1.0182929039001465, -0.9693168997764587, -0.920340895652771, -0.8713648319244385, -0.8223888874053955, -0.773412823677063, -0.7244368195533752, -0.6754608154296875, -0.626484751701355, -0.5775087475776672, -0.5285327434539795, -0.47955670952796936, -0.4305807054042816, -0.38160470128059387, -0.33262866735458374, -0.283652663230896, -0.23467665910720825, -0.1857006549835205, -0.13672463595867157, -0.08774861693382263, -0.03877261281013489, 0.010203391313552856, 0.05917942523956299, 0.10815542936325073, 0.15713131427764893, 0.20610731840133667, 0.2550833225250244, 0.30405935645103455, 0.3530353605747223, 0.40201136469841003, 0.45098739862442017, 0.4999634027481079, 0.5489394068717957, 0.5979154109954834, 0.6468914151191711, 0.6958674192428589, 0.7448434829711914, 0.7938194274902344, 0.8427954912185669, 0.8917714953422546, 0.9407474994659424, 0.9897235035896301, 1.0386995077133179, 1.0876755714416504, 1.1366515159606934, 1.1856275796890259, 1.2346036434173584, 1.2835795879364014, 1.3325555324554443, 1.3815315961837769, 1.4305075407028198, 1.4794836044311523, 1.5284595489501953, 1.5774356126785278, 1.6264116764068604, 1.6753876209259033, 1.7243636846542358]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 4.0, 6.0, 7.0, 15.0, 25.0, 38.0, 36.0, 77.0, 116.0, 211.0, 366.0, 668.0, 1528.0, 3455.0, 8631.0, 26996.0, 106096.0, 408498.0, 364885.0, 89954.0, 23184.0, 7889.0, 3066.0, 1305.0, 628.0, 340.0, 176.0, 92.0, 78.0, 49.0, 37.0, 23.0, 19.0, 13.0, 9.0, 8.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.25432586669921875, -0.2452239990234375, -0.23612213134765625, -0.227020263671875, -0.21791839599609375, -0.2088165283203125, -0.19971466064453125, -0.19061279296875, -0.18151092529296875, -0.1724090576171875, -0.16330718994140625, -0.154205322265625, -0.14510345458984375, -0.1360015869140625, -0.12689971923828125, -0.1177978515625, -0.10869598388671875, -0.0995941162109375, -0.09049224853515625, -0.081390380859375, -0.07228851318359375, -0.0631866455078125, -0.05408477783203125, -0.04498291015625, -0.03588104248046875, -0.0267791748046875, -0.01767730712890625, -0.008575439453125, 0.00052642822265625, 0.0096282958984375, 0.01873016357421875, 0.02783203125, 0.03693389892578125, 0.0460357666015625, 0.05513763427734375, 0.064239501953125, 0.07334136962890625, 0.0824432373046875, 0.09154510498046875, 0.10064697265625, 0.10974884033203125, 0.1188507080078125, 0.12795257568359375, 0.137054443359375, 0.14615631103515625, 0.1552581787109375, 0.16436004638671875, 0.1734619140625, 0.18256378173828125, 0.1916656494140625, 0.20076751708984375, 0.209869384765625, 0.21897125244140625, 0.2280731201171875, 0.23717498779296875, 0.24627685546875, 0.25537872314453125, 0.2644805908203125, 0.27358245849609375, 0.282684326171875, 0.29178619384765625, 0.3008880615234375, 0.30998992919921875, 0.319091796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 2.0, 6.0, 7.0, 4.0, 16.0, 21.0, 18.0, 21.0, 21.0, 30.0, 34.0, 39.0, 35.0, 35.0, 52.0, 48.0, 47.0, 52.0, 50.0, 48.0, 50.0, 48.0, 41.0, 44.0, 32.0, 26.0, 28.0, 22.0, 14.0, 22.0, 17.0, 17.0, 11.0, 6.0, 6.0, 7.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0390625, -1.0032958984375, -0.967529296875, -0.9317626953125, -0.89599609375, -0.8602294921875, -0.824462890625, -0.7886962890625, -0.7529296875, -0.7171630859375, -0.681396484375, -0.6456298828125, -0.60986328125, -0.5740966796875, -0.538330078125, -0.5025634765625, -0.466796875, -0.4310302734375, -0.395263671875, -0.3594970703125, -0.32373046875, -0.2879638671875, -0.252197265625, -0.2164306640625, -0.1806640625, -0.1448974609375, -0.109130859375, -0.0733642578125, -0.03759765625, -0.0018310546875, 0.033935546875, 0.0697021484375, 0.10546875, 0.1412353515625, 0.177001953125, 0.2127685546875, 0.24853515625, 0.2843017578125, 0.320068359375, 0.3558349609375, 0.3916015625, 0.4273681640625, 0.463134765625, 0.4989013671875, 0.53466796875, 0.5704345703125, 0.606201171875, 0.6419677734375, 0.677734375, 0.7135009765625, 0.749267578125, 0.7850341796875, 0.82080078125, 0.8565673828125, 0.892333984375, 0.9281005859375, 0.9638671875, 0.9996337890625, 1.035400390625, 1.0711669921875, 1.10693359375, 1.1427001953125, 1.178466796875, 1.2142333984375, 1.25]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 6.0, 7.0, 21.0, 26.0, 40.0, 52.0, 91.0, 131.0, 205.0, 357.0, 659.0, 1393.0, 3220.0, 8832.0, 33451.0, 163752.0, 492601.0, 265962.0, 56182.0, 13643.0, 4302.0, 1715.0, 730.0, 440.0, 248.0, 187.0, 97.0, 57.0, 49.0, 24.0, 24.0, 17.0, 9.0, 2.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2464599609375, -0.23785972595214844, -0.22925949096679688, -0.2206592559814453, -0.21205902099609375, -0.2034587860107422, -0.19485855102539062, -0.18625831604003906, -0.1776580810546875, -0.16905784606933594, -0.16045761108398438, -0.1518573760986328, -0.14325714111328125, -0.1346569061279297, -0.12605667114257812, -0.11745643615722656, -0.108856201171875, -0.10025596618652344, -0.09165573120117188, -0.08305549621582031, -0.07445526123046875, -0.06585502624511719, -0.057254791259765625, -0.04865455627441406, -0.0400543212890625, -0.03145408630371094, -0.022853851318359375, -0.014253616333007812, -0.00565338134765625, 0.0029468536376953125, 0.011547088623046875, 0.020147323608398438, 0.02874755859375, 0.03734779357910156, 0.045948028564453125, 0.05454826354980469, 0.06314849853515625, 0.07174873352050781, 0.08034896850585938, 0.08894920349121094, 0.0975494384765625, 0.10614967346191406, 0.11474990844726562, 0.12335014343261719, 0.13195037841796875, 0.1405506134033203, 0.14915084838867188, 0.15775108337402344, 0.166351318359375, 0.17495155334472656, 0.18355178833007812, 0.1921520233154297, 0.20075225830078125, 0.2093524932861328, 0.21795272827148438, 0.22655296325683594, 0.2351531982421875, 0.24375343322753906, 0.2523536682128906, 0.2609539031982422, 0.26955413818359375, 0.2781543731689453, 0.2867546081542969, 0.29535484313964844, 0.303955078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 5.0, 5.0, 6.0, 11.0, 15.0, 13.0, 8.0, 18.0, 9.0, 21.0, 27.0, 30.0, 35.0, 37.0, 26.0, 51.0, 37.0, 41.0, 44.0, 46.0, 58.0, 39.0, 29.0, 35.0, 45.0, 29.0, 30.0, 36.0, 28.0, 19.0, 18.0, 21.0, 16.0, 10.0, 13.0, 10.0, 12.0, 6.0, 6.0, 15.0, 5.0, 7.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.09393310546875, -2.0277099609375, -1.96148681640625, -1.895263671875, -1.82904052734375, -1.7628173828125, -1.69659423828125, -1.63037109375, -1.56414794921875, -1.4979248046875, -1.43170166015625, -1.365478515625, -1.29925537109375, -1.2330322265625, -1.16680908203125, -1.1005859375, -1.03436279296875, -0.9681396484375, -0.90191650390625, -0.835693359375, -0.76947021484375, -0.7032470703125, -0.63702392578125, -0.57080078125, -0.50457763671875, -0.4383544921875, -0.37213134765625, -0.305908203125, -0.23968505859375, -0.1734619140625, -0.10723876953125, -0.041015625, 0.02520751953125, 0.0914306640625, 0.15765380859375, 0.223876953125, 0.29010009765625, 0.3563232421875, 0.42254638671875, 0.48876953125, 0.55499267578125, 0.6212158203125, 0.68743896484375, 0.753662109375, 0.81988525390625, 0.8861083984375, 0.95233154296875, 1.0185546875, 1.08477783203125, 1.1510009765625, 1.21722412109375, 1.283447265625, 1.34967041015625, 1.4158935546875, 1.48211669921875, 1.54833984375, 1.61456298828125, 1.6807861328125, 1.74700927734375, 1.813232421875, 1.87945556640625, 1.9456787109375, 2.01190185546875, 2.078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 15.0, 28.0, 31.0, 50.0, 66.0, 106.0, 189.0, 333.0, 645.0, 1379.0, 3352.0, 10236.0, 40243.0, 230384.0, 584235.0, 138243.0, 26624.0, 7355.0, 2703.0, 1093.0, 530.0, 249.0, 147.0, 80.0, 71.0, 42.0, 30.0, 26.0, 16.0, 18.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.1258544921875, -0.1225738525390625, -0.119293212890625, -0.1160125732421875, -0.11273193359375, -0.1094512939453125, -0.106170654296875, -0.1028900146484375, -0.099609375, -0.0963287353515625, -0.093048095703125, -0.0897674560546875, -0.08648681640625, -0.0832061767578125, -0.079925537109375, -0.0766448974609375, -0.0733642578125, -0.0700836181640625, -0.066802978515625, -0.0635223388671875, -0.06024169921875, -0.0569610595703125, -0.053680419921875, -0.0503997802734375, -0.047119140625, -0.0438385009765625, -0.040557861328125, -0.0372772216796875, -0.03399658203125, -0.0307159423828125, -0.027435302734375, -0.0241546630859375, -0.0208740234375, -0.0175933837890625, -0.014312744140625, -0.0110321044921875, -0.00775146484375, -0.0044708251953125, -0.001190185546875, 0.0020904541015625, 0.00537109375, 0.0086517333984375, 0.011932373046875, 0.0152130126953125, 0.01849365234375, 0.0217742919921875, 0.025054931640625, 0.0283355712890625, 0.0316162109375, 0.0348968505859375, 0.038177490234375, 0.0414581298828125, 0.04473876953125, 0.0480194091796875, 0.051300048828125, 0.0545806884765625, 0.057861328125, 0.0611419677734375, 0.064422607421875, 0.0677032470703125, 0.07098388671875, 0.0742645263671875, 0.077545166015625, 0.0808258056640625, 0.0841064453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 15.0, 13.0, 22.0, 27.0, 46.0, 48.0, 70.0, 84.0, 96.0, 105.0, 114.0, 77.0, 56.0, 53.0, 37.0, 31.0, 24.0, 13.0, 18.0, 8.0, 4.0, 10.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.324052810668945e-05, -6.123911589384079e-05, -5.9237703680992126e-05, -5.723629146814346e-05, -5.52348792552948e-05, -5.3233467042446136e-05, -5.123205482959747e-05, -4.923064261674881e-05, -4.7229230403900146e-05, -4.522781819105148e-05, -4.322640597820282e-05, -4.1224993765354156e-05, -3.922358155250549e-05, -3.722216933965683e-05, -3.5220757126808167e-05, -3.32193449139595e-05, -3.121793270111084e-05, -2.9216520488262177e-05, -2.7215108275413513e-05, -2.521369606256485e-05, -2.3212283849716187e-05, -2.1210871636867523e-05, -1.920945942401886e-05, -1.7208047211170197e-05, -1.5206634998321533e-05, -1.320522278547287e-05, -1.1203810572624207e-05, -9.202398359775543e-06, -7.20098614692688e-06, -5.1995739340782166e-06, -3.1981617212295532e-06, -1.1967495083808899e-06, 8.046627044677734e-07, 2.8060749173164368e-06, 4.8074871301651e-06, 6.8088993430137634e-06, 8.810311555862427e-06, 1.081172376871109e-05, 1.2813135981559753e-05, 1.4814548194408417e-05, 1.681596040725708e-05, 1.8817372620105743e-05, 2.0818784832954407e-05, 2.282019704580307e-05, 2.4821609258651733e-05, 2.6823021471500397e-05, 2.882443368434906e-05, 3.0825845897197723e-05, 3.282725811004639e-05, 3.482867032289505e-05, 3.683008253574371e-05, 3.883149474859238e-05, 4.083290696144104e-05, 4.28343191742897e-05, 4.483573138713837e-05, 4.683714359998703e-05, 4.883855581283569e-05, 5.083996802568436e-05, 5.284138023853302e-05, 5.484279245138168e-05, 5.684420466423035e-05, 5.884561687707901e-05, 6.084702908992767e-05, 6.284844130277634e-05, 6.4849853515625e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 9.0, 14.0, 13.0, 9.0, 13.0, 29.0, 41.0, 50.0, 62.0, 94.0, 139.0, 194.0, 343.0, 574.0, 1056.0, 2080.0, 4543.0, 11026.0, 34572.0, 143975.0, 497216.0, 264014.0, 58813.0, 17030.0, 6421.0, 2888.0, 1402.0, 742.0, 413.0, 248.0, 155.0, 102.0, 80.0, 42.0, 27.0, 31.0, 24.0, 20.0, 12.0, 13.0, 5.0, 2.0, 8.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09637451171875, -0.09323501586914062, -0.09009552001953125, -0.08695602416992188, -0.0838165283203125, -0.08067703247070312, -0.07753753662109375, -0.07439804077148438, -0.071258544921875, -0.06811904907226562, -0.06497955322265625, -0.061840057373046875, -0.0587005615234375, -0.055561065673828125, -0.05242156982421875, -0.049282073974609375, -0.046142578125, -0.043003082275390625, -0.03986358642578125, -0.036724090576171875, -0.0335845947265625, -0.030445098876953125, -0.02730560302734375, -0.024166107177734375, -0.021026611328125, -0.017887115478515625, -0.01474761962890625, -0.011608123779296875, -0.0084686279296875, -0.005329132080078125, -0.00218963623046875, 0.000949859619140625, 0.00408935546875, 0.007228851318359375, 0.01036834716796875, 0.013507843017578125, 0.0166473388671875, 0.019786834716796875, 0.02292633056640625, 0.026065826416015625, 0.029205322265625, 0.032344818115234375, 0.03548431396484375, 0.038623809814453125, 0.0417633056640625, 0.044902801513671875, 0.04804229736328125, 0.051181793212890625, 0.0543212890625, 0.057460784912109375, 0.06060028076171875, 0.06373977661132812, 0.0668792724609375, 0.07001876831054688, 0.07315826416015625, 0.07629776000976562, 0.079437255859375, 0.08257675170898438, 0.08571624755859375, 0.08885574340820312, 0.0919952392578125, 0.09513473510742188, 0.09827423095703125, 0.10141372680664062, 0.10455322265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 6.0, 4.0, 8.0, 8.0, 12.0, 9.0, 38.0, 37.0, 44.0, 41.0, 73.0, 94.0, 83.0, 83.0, 88.0, 82.0, 63.0, 51.0, 44.0, 29.0, 17.0, 26.0, 11.0, 6.0, 12.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0306854248046875, -0.0298919677734375, -0.0290985107421875, -0.0283050537109375, -0.0275115966796875, -0.0267181396484375, -0.0259246826171875, -0.0251312255859375, -0.0243377685546875, -0.0235443115234375, -0.0227508544921875, -0.0219573974609375, -0.0211639404296875, -0.0203704833984375, -0.0195770263671875, -0.0187835693359375, -0.0179901123046875, -0.0171966552734375, -0.0164031982421875, -0.0156097412109375, -0.0148162841796875, -0.0140228271484375, -0.0132293701171875, -0.0124359130859375, -0.0116424560546875, -0.0108489990234375, -0.0100555419921875, -0.0092620849609375, -0.0084686279296875, -0.0076751708984375, -0.0068817138671875, -0.0060882568359375, -0.0052947998046875, -0.0045013427734375, -0.0037078857421875, -0.0029144287109375, -0.0021209716796875, -0.0013275146484375, -0.0005340576171875, 0.0002593994140625, 0.0010528564453125, 0.0018463134765625, 0.0026397705078125, 0.0034332275390625, 0.0042266845703125, 0.0050201416015625, 0.0058135986328125, 0.0066070556640625, 0.0074005126953125, 0.0081939697265625, 0.0089874267578125, 0.0097808837890625, 0.0105743408203125, 0.0113677978515625, 0.0121612548828125, 0.0129547119140625, 0.0137481689453125, 0.0145416259765625, 0.0153350830078125, 0.0161285400390625, 0.0169219970703125, 0.0177154541015625, 0.0185089111328125, 0.0193023681640625, 0.0200958251953125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 9.0, 10.0, 23.0, 24.0, 35.0, 46.0, 56.0, 63.0, 94.0, 97.0, 88.0, 109.0, 86.0, 60.0, 55.0, 40.0, 23.0, 20.0, 18.0, 7.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6849658489227295, -1.6311278343200684, -1.5772899389266968, -1.5234519243240356, -1.4696139097213745, -1.415776014328003, -1.3619379997253418, -1.3080999851226807, -1.2542619705200195, -1.2004239559173584, -1.1465860605239868, -1.0927480459213257, -1.0389100313186646, -0.9850720763206482, -0.9312341213226318, -0.8773961067199707, -0.8235582113265991, -0.7697202563285828, -0.7158822417259216, -0.6620442867279053, -0.6082062721252441, -0.5543683171272278, -0.5005303621292114, -0.4466923773288727, -0.39285439252853394, -0.3390164077281952, -0.28517842292785645, -0.2313404679298401, -0.17750248312950134, -0.1236644983291626, -0.06982654333114624, -0.015988558530807495, 0.0378495454788208, 0.09168752282857895, 0.1455255001783371, 0.19936347007751465, 0.2532014548778534, 0.30703943967819214, 0.3608773946762085, 0.41471537947654724, 0.468553364276886, 0.5223913192749023, 0.5762293338775635, 0.6300672888755798, 0.6839052438735962, 0.7377432584762573, 0.7915812134742737, 0.84541916847229, 0.8992571830749512, 0.9530951380729675, 1.0069330930709839, 1.060771107673645, 1.1146091222763062, 1.1684470176696777, 1.2222850322723389, 1.276123046875, 1.3299610614776611, 1.3837990760803223, 1.4376369714736938, 1.491474986076355, 1.5453130006790161, 1.5991508960723877, 1.6529889106750488, 1.70682692527771, 1.7606648206710815]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 5.0, 5.0, 11.0, 17.0, 20.0, 23.0, 24.0, 17.0, 33.0, 35.0, 43.0, 42.0, 45.0, 49.0, 48.0, 57.0, 60.0, 53.0, 52.0, 47.0, 26.0, 44.0, 30.0, 28.0, 21.0, 22.0, 35.0, 16.0, 12.0, 11.0, 12.0, 9.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9726780652999878, -0.9380478858947754, -0.903417706489563, -0.8687874674797058, -0.8341572880744934, -0.799527108669281, -0.7648968696594238, -0.7302666902542114, -0.695636510848999, -0.6610063314437866, -0.6263761520385742, -0.591745913028717, -0.5571157336235046, -0.5224855542182922, -0.48785534501075745, -0.45322513580322266, -0.41859495639801025, -0.38396477699279785, -0.34933456778526306, -0.31470435857772827, -0.28007417917251587, -0.24544398486614227, -0.21081379055976868, -0.17618359625339508, -0.14155340194702148, -0.10692320764064789, -0.07229301333427429, -0.037662819027900696, -0.0030326247215270996, 0.0315975695848465, 0.06622776389122009, 0.10085795819759369, 0.13548815250396729, 0.17011834681034088, 0.20474854111671448, 0.23937873542308807, 0.27400892972946167, 0.3086391091346741, 0.34326931834220886, 0.37789952754974365, 0.41252970695495605, 0.44715988636016846, 0.48179009556770325, 0.516420304775238, 0.5510504841804504, 0.5856806635856628, 0.62031090259552, 0.6549410820007324, 0.6895712614059448, 0.7242014408111572, 0.7588316202163696, 0.7934618592262268, 0.8280920386314392, 0.8627222180366516, 0.8973524570465088, 0.9319826364517212, 0.9666128158569336, 1.001242995262146, 1.0358731746673584, 1.0705033540725708, 1.1051335334777832, 1.1397638320922852, 1.1743940114974976, 1.20902419090271, 1.2436543703079224]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 4.0, 11.0, 4.0, 17.0, 22.0, 29.0, 49.0, 44.0, 67.0, 121.0, 173.0, 299.0, 450.0, 811.0, 1467.0, 2864.0, 5878.0, 13789.0, 36316.0, 145395.0, 630537.0, 147493.0, 36434.0, 13689.0, 6064.0, 2866.0, 1504.0, 810.0, 462.0, 311.0, 193.0, 140.0, 65.0, 61.0, 33.0, 28.0, 14.0, 10.0, 8.0, 9.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6796875, -1.6227569580078125, -1.565826416015625, -1.5088958740234375, -1.45196533203125, -1.3950347900390625, -1.338104248046875, -1.2811737060546875, -1.2242431640625, -1.1673126220703125, -1.110382080078125, -1.0534515380859375, -0.99652099609375, -0.9395904541015625, -0.882659912109375, -0.8257293701171875, -0.768798828125, -0.7118682861328125, -0.654937744140625, -0.5980072021484375, -0.54107666015625, -0.4841461181640625, -0.427215576171875, -0.3702850341796875, -0.3133544921875, -0.2564239501953125, -0.199493408203125, -0.1425628662109375, -0.08563232421875, -0.0287017822265625, 0.028228759765625, 0.0851593017578125, 0.14208984375, 0.1990203857421875, 0.255950927734375, 0.3128814697265625, 0.36981201171875, 0.4267425537109375, 0.483673095703125, 0.5406036376953125, 0.5975341796875, 0.6544647216796875, 0.711395263671875, 0.7683258056640625, 0.82525634765625, 0.8821868896484375, 0.939117431640625, 0.9960479736328125, 1.052978515625, 1.1099090576171875, 1.166839599609375, 1.2237701416015625, 1.28070068359375, 1.3376312255859375, 1.394561767578125, 1.4514923095703125, 1.5084228515625, 1.5653533935546875, 1.622283935546875, 1.6792144775390625, 1.73614501953125, 1.7930755615234375, 1.850006103515625, 1.9069366455078125, 1.9638671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 9.0, 6.0, 12.0, 19.0, 21.0, 15.0, 28.0, 28.0, 33.0, 31.0, 38.0, 57.0, 57.0, 59.0, 52.0, 58.0, 49.0, 47.0, 50.0, 49.0, 30.0, 38.0, 28.0, 29.0, 26.0, 29.0, 23.0, 11.0, 5.0, 12.0, 5.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.34765625, -2.267669677734375, -2.18768310546875, -2.107696533203125, -2.0277099609375, -1.947723388671875, -1.86773681640625, -1.787750244140625, -1.707763671875, -1.627777099609375, -1.54779052734375, -1.467803955078125, -1.3878173828125, -1.307830810546875, -1.22784423828125, -1.147857666015625, -1.06787109375, -0.987884521484375, -0.90789794921875, -0.827911376953125, -0.7479248046875, -0.667938232421875, -0.58795166015625, -0.507965087890625, -0.427978515625, -0.347991943359375, -0.26800537109375, -0.188018798828125, -0.1080322265625, -0.028045654296875, 0.05194091796875, 0.131927490234375, 0.2119140625, 0.291900634765625, 0.37188720703125, 0.451873779296875, 0.5318603515625, 0.611846923828125, 0.69183349609375, 0.771820068359375, 0.851806640625, 0.931793212890625, 1.01177978515625, 1.091766357421875, 1.1717529296875, 1.251739501953125, 1.33172607421875, 1.411712646484375, 1.49169921875, 1.571685791015625, 1.65167236328125, 1.731658935546875, 1.8116455078125, 1.891632080078125, 1.97161865234375, 2.051605224609375, 2.131591796875, 2.211578369140625, 2.29156494140625, 2.371551513671875, 2.4515380859375, 2.531524658203125, 2.61151123046875, 2.691497802734375, 2.771484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 9.0, 6.0, 12.0, 20.0, 20.0, 42.0, 70.0, 107.0, 222.0, 548.0, 1752.0, 7510.0, 42669.0, 760811.0, 208594.0, 20208.0, 4091.0, 1091.0, 363.0, 157.0, 92.0, 46.0, 40.0, 24.0, 14.0, 9.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.28125, -4.173675537109375, -4.06610107421875, -3.958526611328125, -3.8509521484375, -3.743377685546875, -3.63580322265625, -3.528228759765625, -3.420654296875, -3.313079833984375, -3.20550537109375, -3.097930908203125, -2.9903564453125, -2.882781982421875, -2.77520751953125, -2.667633056640625, -2.56005859375, -2.452484130859375, -2.34490966796875, -2.237335205078125, -2.1297607421875, -2.022186279296875, -1.91461181640625, -1.807037353515625, -1.699462890625, -1.591888427734375, -1.48431396484375, -1.376739501953125, -1.2691650390625, -1.161590576171875, -1.05401611328125, -0.946441650390625, -0.8388671875, -0.731292724609375, -0.62371826171875, -0.516143798828125, -0.4085693359375, -0.300994873046875, -0.19342041015625, -0.085845947265625, 0.021728515625, 0.129302978515625, 0.23687744140625, 0.344451904296875, 0.4520263671875, 0.559600830078125, 0.66717529296875, 0.774749755859375, 0.88232421875, 0.989898681640625, 1.09747314453125, 1.205047607421875, 1.3126220703125, 1.420196533203125, 1.52777099609375, 1.635345458984375, 1.742919921875, 1.850494384765625, 1.95806884765625, 2.065643310546875, 2.1732177734375, 2.280792236328125, 2.38836669921875, 2.495941162109375, 2.603515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 7.0, 11.0, 15.0, 24.0, 16.0, 19.0, 18.0, 15.0, 17.0, 47.0, 40.0, 41.0, 45.0, 50.0, 66.0, 60.0, 69.0, 52.0, 43.0, 46.0, 49.0, 34.0, 38.0, 32.0, 24.0, 18.0, 15.0, 11.0, 15.0, 11.0, 6.0, 4.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.74609375, -3.634857177734375, -3.52362060546875, -3.412384033203125, -3.3011474609375, -3.189910888671875, -3.07867431640625, -2.967437744140625, -2.856201171875, -2.744964599609375, -2.63372802734375, -2.522491455078125, -2.4112548828125, -2.300018310546875, -2.18878173828125, -2.077545166015625, -1.96630859375, -1.855072021484375, -1.74383544921875, -1.632598876953125, -1.5213623046875, -1.410125732421875, -1.29888916015625, -1.187652587890625, -1.076416015625, -0.965179443359375, -0.85394287109375, -0.742706298828125, -0.6314697265625, -0.520233154296875, -0.40899658203125, -0.297760009765625, -0.1865234375, -0.075286865234375, 0.03594970703125, 0.147186279296875, 0.2584228515625, 0.369659423828125, 0.48089599609375, 0.592132568359375, 0.703369140625, 0.814605712890625, 0.92584228515625, 1.037078857421875, 1.1483154296875, 1.259552001953125, 1.37078857421875, 1.482025146484375, 1.59326171875, 1.704498291015625, 1.81573486328125, 1.926971435546875, 2.0382080078125, 2.149444580078125, 2.26068115234375, 2.371917724609375, 2.483154296875, 2.594390869140625, 2.70562744140625, 2.816864013671875, 2.9281005859375, 3.039337158203125, 3.15057373046875, 3.261810302734375, 3.373046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 6.0, 4.0, 18.0, 21.0, 29.0, 45.0, 96.0, 204.0, 644.0, 2165.0, 9775.0, 61268.0, 773860.0, 174144.0, 20389.0, 4136.0, 1048.0, 349.0, 142.0, 91.0, 32.0, 24.0, 18.0, 9.0, 6.0, 4.0, 10.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90576171875, -0.8788986206054688, -0.8520355224609375, -0.8251724243164062, -0.798309326171875, -0.7714462280273438, -0.7445831298828125, -0.7177200317382812, -0.69085693359375, -0.6639938354492188, -0.6371307373046875, -0.6102676391601562, -0.583404541015625, -0.5565414428710938, -0.5296783447265625, -0.5028152465820312, -0.4759521484375, -0.44908905029296875, -0.4222259521484375, -0.39536285400390625, -0.368499755859375, -0.34163665771484375, -0.3147735595703125, -0.28791046142578125, -0.26104736328125, -0.23418426513671875, -0.2073211669921875, -0.18045806884765625, -0.153594970703125, -0.12673187255859375, -0.0998687744140625, -0.07300567626953125, -0.046142578125, -0.01927947998046875, 0.0075836181640625, 0.03444671630859375, 0.061309814453125, 0.08817291259765625, 0.1150360107421875, 0.14189910888671875, 0.16876220703125, 0.19562530517578125, 0.2224884033203125, 0.24935150146484375, 0.276214599609375, 0.30307769775390625, 0.3299407958984375, 0.35680389404296875, 0.3836669921875, 0.41053009033203125, 0.4373931884765625, 0.46425628662109375, 0.491119384765625, 0.5179824829101562, 0.5448455810546875, 0.5717086791992188, 0.59857177734375, 0.6254348754882812, 0.6522979736328125, 0.6791610717773438, 0.706024169921875, 0.7328872680664062, 0.7597503662109375, 0.7866134643554688, 0.8134765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 12.0, 7.0, 10.0, 15.0, 26.0, 29.0, 45.0, 71.0, 78.0, 189.0, 171.0, 105.0, 62.0, 48.0, 32.0, 27.0, 22.0, 18.0, 4.0, 11.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001310110092163086, -0.000127376988530159, -0.0001237429678440094, -0.0001201089471578598, -0.0001164749264717102, -0.00011284090578556061, -0.00010920688509941101, -0.00010557286441326141, -0.00010193884372711182, -9.830482304096222e-05, -9.467080235481262e-05, -9.103678166866302e-05, -8.740276098251343e-05, -8.376874029636383e-05, -8.013471961021423e-05, -7.650069892406464e-05, -7.286667823791504e-05, -6.923265755176544e-05, -6.559863686561584e-05, -6.196461617946625e-05, -5.833059549331665e-05, -5.469657480716705e-05, -5.1062554121017456e-05, -4.742853343486786e-05, -4.379451274871826e-05, -4.0160492062568665e-05, -3.652647137641907e-05, -3.289245069026947e-05, -2.9258430004119873e-05, -2.5624409317970276e-05, -2.199038863182068e-05, -1.835636794567108e-05, -1.4722347259521484e-05, -1.1088326573371887e-05, -7.45430588722229e-06, -3.820285201072693e-06, -1.862645149230957e-07, 3.4477561712265015e-06, 7.081776857376099e-06, 1.0715797543525696e-05, 1.4349818229675293e-05, 1.798383891582489e-05, 2.1617859601974487e-05, 2.5251880288124084e-05, 2.888590097427368e-05, 3.251992166042328e-05, 3.6153942346572876e-05, 3.978796303272247e-05, 4.342198371887207e-05, 4.705600440502167e-05, 5.0690025091171265e-05, 5.432404577732086e-05, 5.795806646347046e-05, 6.159208714962006e-05, 6.522610783576965e-05, 6.886012852191925e-05, 7.249414920806885e-05, 7.612816989421844e-05, 7.976219058036804e-05, 8.339621126651764e-05, 8.703023195266724e-05, 9.066425263881683e-05, 9.429827332496643e-05, 9.793229401111603e-05, 0.00010156631469726562]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 4.0, 4.0, 14.0, 20.0, 24.0, 36.0, 61.0, 103.0, 178.0, 280.0, 611.0, 1197.0, 3072.0, 8887.0, 30303.0, 149372.0, 700751.0, 115535.0, 25411.0, 7645.0, 2739.0, 1142.0, 491.0, 280.0, 153.0, 84.0, 50.0, 31.0, 26.0, 21.0, 17.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55419921875, -0.533233642578125, -0.51226806640625, -0.491302490234375, -0.4703369140625, -0.449371337890625, -0.42840576171875, -0.407440185546875, -0.386474609375, -0.365509033203125, -0.34454345703125, -0.323577880859375, -0.3026123046875, -0.281646728515625, -0.26068115234375, -0.239715576171875, -0.21875, -0.197784423828125, -0.17681884765625, -0.155853271484375, -0.1348876953125, -0.113922119140625, -0.09295654296875, -0.071990966796875, -0.051025390625, -0.030059814453125, -0.00909423828125, 0.011871337890625, 0.0328369140625, 0.053802490234375, 0.07476806640625, 0.095733642578125, 0.11669921875, 0.137664794921875, 0.15863037109375, 0.179595947265625, 0.2005615234375, 0.221527099609375, 0.24249267578125, 0.263458251953125, 0.284423828125, 0.305389404296875, 0.32635498046875, 0.347320556640625, 0.3682861328125, 0.389251708984375, 0.41021728515625, 0.431182861328125, 0.4521484375, 0.473114013671875, 0.49407958984375, 0.515045166015625, 0.5360107421875, 0.556976318359375, 0.57794189453125, 0.598907470703125, 0.619873046875, 0.640838623046875, 0.66180419921875, 0.682769775390625, 0.7037353515625, 0.724700927734375, 0.74566650390625, 0.766632080078125, 0.78759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 10.0, 10.0, 10.0, 6.0, 15.0, 23.0, 21.0, 27.0, 31.0, 44.0, 76.0, 122.0, 161.0, 132.0, 99.0, 45.0, 39.0, 24.0, 24.0, 13.0, 11.0, 12.0, 14.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.425048828125, -0.41400909423828125, -0.4029693603515625, -0.39192962646484375, -0.380889892578125, -0.36985015869140625, -0.3588104248046875, -0.34777069091796875, -0.33673095703125, -0.32569122314453125, -0.3146514892578125, -0.30361175537109375, -0.292572021484375, -0.28153228759765625, -0.2704925537109375, -0.25945281982421875, -0.2484130859375, -0.23737335205078125, -0.2263336181640625, -0.21529388427734375, -0.204254150390625, -0.19321441650390625, -0.1821746826171875, -0.17113494873046875, -0.16009521484375, -0.14905548095703125, -0.1380157470703125, -0.12697601318359375, -0.115936279296875, -0.10489654541015625, -0.0938568115234375, -0.08281707763671875, -0.07177734375, -0.06073760986328125, -0.0496978759765625, -0.03865814208984375, -0.027618408203125, -0.01657867431640625, -0.0055389404296875, 0.00550079345703125, 0.01654052734375, 0.02758026123046875, 0.0386199951171875, 0.04965972900390625, 0.060699462890625, 0.07173919677734375, 0.0827789306640625, 0.09381866455078125, 0.1048583984375, 0.11589813232421875, 0.1269378662109375, 0.13797760009765625, 0.149017333984375, 0.16005706787109375, 0.1710968017578125, 0.18213653564453125, 0.19317626953125, 0.20421600341796875, 0.2152557373046875, 0.22629547119140625, 0.237335205078125, 0.24837493896484375, 0.2594146728515625, 0.27045440673828125, 0.281494140625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 15.0, 42.0, 66.0, 129.0, 176.0, 192.0, 164.0, 96.0, 53.0, 25.0, 19.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.952287197113037, -2.713155508041382, -2.4740238189697266, -2.234891891479492, -1.9957603216171265, -1.7566286325454712, -1.5174968242645264, -1.278365135192871, -1.0392334461212158, -0.8001017570495605, -0.5609700083732605, -0.32183825969696045, -0.08270657062530518, 0.1564251184463501, 0.3955569267272949, 0.6346886157989502, 0.8738203048706055, 1.1129519939422607, 1.352083683013916, 1.5912154912948608, 1.8303471803665161, 2.069478988647461, 2.308610677719116, 2.5477423667907715, 2.7868740558624268, 3.026005744934082, 3.2651374340057373, 3.5042691230773926, 3.743401050567627, 3.982532501220703, 4.2216644287109375, 4.460796356201172, 4.699928283691406, 4.939060211181641, 5.178191661834717, 5.417323589324951, 5.656455039978027, 5.895586967468262, 6.134718894958496, 6.373850345611572, 6.612981796264648, 6.852113723754883, 7.091245174407959, 7.330377101898193, 7.5695085525512695, 7.808640480041504, 8.047772407531738, 8.286903381347656, 8.52603530883789, 8.765167236328125, 9.00429916381836, 9.243430137634277, 9.482562065124512, 9.721693992614746, 9.96082592010498, 10.199956893920898, 10.43908977508545, 10.678221702575684, 10.917353630065918, 11.156484603881836, 11.39561653137207, 11.634748458862305, 11.873880386352539, 12.113012313842773, 12.352143287658691]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 5.0, 13.0, 4.0, 18.0, 16.0, 14.0, 24.0, 31.0, 20.0, 28.0, 31.0, 35.0, 39.0, 41.0, 48.0, 37.0, 30.0, 43.0, 40.0, 42.0, 40.0, 39.0, 30.0, 38.0, 33.0, 33.0, 35.0, 26.0, 18.0, 22.0, 18.0, 18.0, 12.0, 18.0, 9.0, 10.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-6.527335166931152, -6.350761413574219, -6.174187660217285, -5.997613906860352, -5.821040630340576, -5.644466876983643, -5.467893123626709, -5.291319370269775, -5.11474609375, -4.938172340393066, -4.761598587036133, -4.585024833679199, -4.408451557159424, -4.23187780380249, -4.055304050445557, -3.878730297088623, -3.7021565437316895, -3.525582790374756, -3.3490092754364014, -3.1724355220794678, -2.9958620071411133, -2.8192882537841797, -2.642714500427246, -2.4661407470703125, -2.289567232131958, -2.1129934787750244, -1.93641996383667, -1.7598462104797363, -1.5832725763320923, -1.4066989421844482, -1.2301251888275146, -1.0535515546798706, -0.8769774436950684, -0.7004038095474243, -0.5238301157951355, -0.3472564220428467, -0.17068278789520264, 0.005890846252441406, 0.182464599609375, 0.35903823375701904, 0.5356118679046631, 0.7121855020523071, 0.888759195804596, 1.0653328895568848, 1.2419065237045288, 1.4184801578521729, 1.5950539112091064, 1.7716275453567505, 1.9482011795043945, 2.124774932861328, 2.3013484477996826, 2.477922201156616, 2.6544957160949707, 2.8310694694519043, 3.007643222808838, 3.1842169761657715, 3.360790491104126, 3.5373642444610596, 3.713937759399414, 3.8905115127563477, 4.067085266113281, 4.243659019470215, 4.420232772827148, 4.596806049346924, 4.773379802703857]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 6.0, 9.0, 7.0, 21.0, 22.0, 16.0, 45.0, 50.0, 84.0, 116.0, 184.0, 370.0, 703.0, 1854.0, 5358.0, 21717.0, 269852.0, 3773701.0, 99776.0, 13849.0, 3799.0, 1354.0, 578.0, 280.0, 147.0, 94.0, 66.0, 53.0, 36.0, 27.0, 21.0, 16.0, 17.0, 11.0, 7.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.25390625, -4.13360595703125, -4.0133056640625, -3.89300537109375, -3.772705078125, -3.65240478515625, -3.5321044921875, -3.41180419921875, -3.29150390625, -3.17120361328125, -3.0509033203125, -2.93060302734375, -2.810302734375, -2.69000244140625, -2.5697021484375, -2.44940185546875, -2.3291015625, -2.20880126953125, -2.0885009765625, -1.96820068359375, -1.847900390625, -1.72760009765625, -1.6072998046875, -1.48699951171875, -1.36669921875, -1.24639892578125, -1.1260986328125, -1.00579833984375, -0.885498046875, -0.76519775390625, -0.6448974609375, -0.52459716796875, -0.404296875, -0.28399658203125, -0.1636962890625, -0.04339599609375, 0.076904296875, 0.19720458984375, 0.3175048828125, 0.43780517578125, 0.55810546875, 0.67840576171875, 0.7987060546875, 0.91900634765625, 1.039306640625, 1.15960693359375, 1.2799072265625, 1.40020751953125, 1.5205078125, 1.64080810546875, 1.7611083984375, 1.88140869140625, 2.001708984375, 2.12200927734375, 2.2423095703125, 2.36260986328125, 2.48291015625, 2.60321044921875, 2.7235107421875, 2.84381103515625, 2.964111328125, 3.08441162109375, 3.2047119140625, 3.32501220703125, 3.4453125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 12.0, 8.0, 9.0, 16.0, 18.0, 28.0, 28.0, 33.0, 37.0, 31.0, 42.0, 56.0, 34.0, 61.0, 62.0, 71.0, 73.0, 55.0, 41.0, 40.0, 38.0, 35.0, 29.0, 18.0, 20.0, 25.0, 18.0, 14.0, 10.0, 4.0, 10.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8184661865234375, -0.784393310546875, -0.7503204345703125, -0.71624755859375, -0.6821746826171875, -0.648101806640625, -0.6140289306640625, -0.5799560546875, -0.5458831787109375, -0.511810302734375, -0.4777374267578125, -0.44366455078125, -0.4095916748046875, -0.375518798828125, -0.3414459228515625, -0.307373046875, -0.2733001708984375, -0.239227294921875, -0.2051544189453125, -0.17108154296875, -0.1370086669921875, -0.102935791015625, -0.0688629150390625, -0.0347900390625, -0.0007171630859375, 0.033355712890625, 0.0674285888671875, 0.10150146484375, 0.1355743408203125, 0.169647216796875, 0.2037200927734375, 0.23779296875, 0.2718658447265625, 0.305938720703125, 0.3400115966796875, 0.37408447265625, 0.4081573486328125, 0.442230224609375, 0.4763031005859375, 0.5103759765625, 0.5444488525390625, 0.578521728515625, 0.6125946044921875, 0.64666748046875, 0.6807403564453125, 0.714813232421875, 0.7488861083984375, 0.782958984375, 0.8170318603515625, 0.851104736328125, 0.8851776123046875, 0.91925048828125, 0.9533233642578125, 0.987396240234375, 1.0214691162109375, 1.0555419921875, 1.0896148681640625, 1.123687744140625, 1.1577606201171875, 1.19183349609375, 1.2259063720703125, 1.259979248046875, 1.2940521240234375, 1.328125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 11.0, 8.0, 7.0, 11.0, 5.0, 17.0, 27.0, 33.0, 54.0, 57.0, 82.0, 152.0, 232.0, 524.0, 1387.0, 4825.0, 22037.0, 179211.0, 3489294.0, 447359.0, 38078.0, 7330.0, 1964.0, 714.0, 309.0, 167.0, 105.0, 76.0, 42.0, 36.0, 27.0, 25.0, 14.0, 14.0, 6.0, 8.0, 4.0, 9.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84375, -2.747833251953125, -2.65191650390625, -2.555999755859375, -2.4600830078125, -2.364166259765625, -2.26824951171875, -2.172332763671875, -2.076416015625, -1.980499267578125, -1.88458251953125, -1.788665771484375, -1.6927490234375, -1.596832275390625, -1.50091552734375, -1.404998779296875, -1.30908203125, -1.213165283203125, -1.11724853515625, -1.021331787109375, -0.9254150390625, -0.829498291015625, -0.73358154296875, -0.637664794921875, -0.541748046875, -0.445831298828125, -0.34991455078125, -0.253997802734375, -0.1580810546875, -0.062164306640625, 0.03375244140625, 0.129669189453125, 0.2255859375, 0.321502685546875, 0.41741943359375, 0.513336181640625, 0.6092529296875, 0.705169677734375, 0.80108642578125, 0.897003173828125, 0.992919921875, 1.088836669921875, 1.18475341796875, 1.280670166015625, 1.3765869140625, 1.472503662109375, 1.56842041015625, 1.664337158203125, 1.76025390625, 1.856170654296875, 1.95208740234375, 2.048004150390625, 2.1439208984375, 2.239837646484375, 2.33575439453125, 2.431671142578125, 2.527587890625, 2.623504638671875, 2.71942138671875, 2.815338134765625, 2.9112548828125, 3.007171630859375, 3.10308837890625, 3.199005126953125, 3.294921875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 10.0, 8.0, 15.0, 18.0, 16.0, 27.0, 43.0, 46.0, 65.0, 77.0, 127.0, 191.0, 270.0, 416.0, 586.0, 632.0, 463.0, 317.0, 216.0, 142.0, 102.0, 63.0, 58.0, 34.0, 34.0, 26.0, 13.0, 14.0, 13.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.673828125, -0.6547012329101562, -0.6355743408203125, -0.6164474487304688, -0.597320556640625, -0.5781936645507812, -0.5590667724609375, -0.5399398803710938, -0.52081298828125, -0.5016860961914062, -0.4825592041015625, -0.46343231201171875, -0.444305419921875, -0.42517852783203125, -0.4060516357421875, -0.38692474365234375, -0.3677978515625, -0.34867095947265625, -0.3295440673828125, -0.31041717529296875, -0.291290283203125, -0.27216339111328125, -0.2530364990234375, -0.23390960693359375, -0.21478271484375, -0.19565582275390625, -0.1765289306640625, -0.15740203857421875, -0.138275146484375, -0.11914825439453125, -0.1000213623046875, -0.08089447021484375, -0.061767578125, -0.04264068603515625, -0.0235137939453125, -0.00438690185546875, 0.014739990234375, 0.03386688232421875, 0.0529937744140625, 0.07212066650390625, 0.09124755859375, 0.11037445068359375, 0.1295013427734375, 0.14862823486328125, 0.167755126953125, 0.18688201904296875, 0.2060089111328125, 0.22513580322265625, 0.2442626953125, 0.26338958740234375, 0.2825164794921875, 0.30164337158203125, 0.320770263671875, 0.33989715576171875, 0.3590240478515625, 0.37815093994140625, 0.39727783203125, 0.41640472412109375, 0.4355316162109375, 0.45465850830078125, 0.473785400390625, 0.49291229248046875, 0.5120391845703125, 0.5311660766601562, 0.55029296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 11.0, 22.0, 24.0, 39.0, 53.0, 73.0, 77.0, 107.0, 102.0, 105.0, 90.0, 75.0, 67.0, 51.0, 37.0, 24.0, 12.0, 15.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5456047058105469, -1.4555232524871826, -1.3654416799545288, -1.2753602266311646, -1.1852786540985107, -1.0951972007751465, -1.0051157474517822, -0.9150342345237732, -0.8249527215957642, -0.7348712086677551, -0.6447896957397461, -0.5547082424163818, -0.4646267294883728, -0.37454521656036377, -0.2844637632369995, -0.19438225030899048, -0.10430073738098145, -0.014219239354133606, 0.07586225867271423, 0.16594374179840088, 0.2560252547264099, 0.34610676765441895, 0.4361882209777832, 0.5262697339057922, 0.6163512468338013, 0.7064327597618103, 0.7965142726898193, 0.8865957260131836, 0.9766772389411926, 1.0667587518692017, 1.156840205192566, 1.2469217777252197, 1.337003231048584, 1.4270846843719482, 1.517166256904602, 1.6072477102279663, 1.6973292827606201, 1.7874107360839844, 1.8774921894073486, 1.967573642730713, 2.0576553344726562, 2.1477367877960205, 2.2378182411193848, 2.327899932861328, 2.4179813861846924, 2.5080628395080566, 2.598144292831421, 2.688225746154785, 2.7783071994781494, 2.8683886528015137, 2.958470106124878, 3.048551559448242, 3.1386332511901855, 3.22871470451355, 3.318796157836914, 3.4088776111602783, 3.4989590644836426, 3.589040517807007, 3.679121971130371, 3.7692036628723145, 3.8592851161956787, 3.949366569519043, 4.039447784423828, 4.1295294761657715, 4.219611167907715]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 3.0, 1.0, 14.0, 12.0, 10.0, 13.0, 16.0, 19.0, 25.0, 20.0, 32.0, 24.0, 42.0, 35.0, 34.0, 37.0, 49.0, 35.0, 45.0, 43.0, 32.0, 37.0, 40.0, 44.0, 48.0, 36.0, 26.0, 23.0, 21.0, 28.0, 21.0, 21.0, 14.0, 20.0, 19.0, 9.0, 9.0, 9.0, 4.0, 5.0, 4.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3104372024536133, -1.2676371335983276, -1.224837064743042, -1.182037115097046, -1.1392370462417603, -1.0964369773864746, -1.053636908531189, -1.0108368396759033, -0.9680368304252625, -0.9252367615699768, -0.8824367523193359, -0.8396366834640503, -0.7968366146087646, -0.7540366053581238, -0.7112365365028381, -0.6684365272521973, -0.6256364583969116, -0.582836389541626, -0.5400363802909851, -0.49723631143569946, -0.4544362723827362, -0.41163623332977295, -0.3688361644744873, -0.32603612542152405, -0.2832360863685608, -0.24043604731559753, -0.19763599336147308, -0.15483593940734863, -0.11203590035438538, -0.06923586130142212, -0.026435792446136475, 0.016364246606826782, 0.05916416645050049, 0.10196421295404434, 0.1447642594575882, 0.18756431341171265, 0.2303643524646759, 0.27316439151763916, 0.3159644603729248, 0.35876449942588806, 0.4015645384788513, 0.4443645775318146, 0.48716461658477783, 0.5299646854400635, 0.5727647542953491, 0.61556476354599, 0.6583648324012756, 0.7011648416519165, 0.7439649105072021, 0.7867649793624878, 0.8295649886131287, 0.8723650574684143, 0.9151650667190552, 0.9579651355743408, 1.0007652044296265, 1.043565273284912, 1.0863652229309082, 1.1291652917861938, 1.1719653606414795, 1.2147653102874756, 1.2575653791427612, 1.3003654479980469, 1.3431655168533325, 1.3859655857086182, 1.4287656545639038]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 5.0, 9.0, 18.0, 31.0, 26.0, 42.0, 50.0, 84.0, 120.0, 201.0, 353.0, 904.0, 2613.0, 11545.0, 219890.0, 767297.0, 37614.0, 4966.0, 1484.0, 558.0, 258.0, 150.0, 99.0, 63.0, 57.0, 33.0, 21.0, 15.0, 12.0, 6.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47509765625, -0.45465850830078125, -0.4342193603515625, -0.41378021240234375, -0.393341064453125, -0.37290191650390625, -0.3524627685546875, -0.33202362060546875, -0.31158447265625, -0.29114532470703125, -0.2707061767578125, -0.25026702880859375, -0.229827880859375, -0.20938873291015625, -0.1889495849609375, -0.16851043701171875, -0.1480712890625, -0.12763214111328125, -0.1071929931640625, -0.08675384521484375, -0.066314697265625, -0.04587554931640625, -0.0254364013671875, -0.00499725341796875, 0.01544189453125, 0.03588104248046875, 0.0563201904296875, 0.07675933837890625, 0.097198486328125, 0.11763763427734375, 0.1380767822265625, 0.15851593017578125, 0.178955078125, 0.19939422607421875, 0.2198333740234375, 0.24027252197265625, 0.260711669921875, 0.28115081787109375, 0.3015899658203125, 0.32202911376953125, 0.34246826171875, 0.36290740966796875, 0.3833465576171875, 0.40378570556640625, 0.424224853515625, 0.44466400146484375, 0.4651031494140625, 0.48554229736328125, 0.5059814453125, 0.5264205932617188, 0.5468597412109375, 0.5672988891601562, 0.587738037109375, 0.6081771850585938, 0.6286163330078125, 0.6490554809570312, 0.66949462890625, 0.6899337768554688, 0.7103729248046875, 0.7308120727539062, 0.751251220703125, 0.7716903686523438, 0.7921295166015625, 0.8125686645507812, 0.8330078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 6.0, 9.0, 16.0, 16.0, 22.0, 21.0, 29.0, 46.0, 42.0, 48.0, 59.0, 61.0, 61.0, 61.0, 54.0, 54.0, 47.0, 54.0, 52.0, 40.0, 39.0, 26.0, 29.0, 20.0, 19.0, 21.0, 15.0, 7.0, 6.0, 8.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.70703125, -1.6634521484375, -1.619873046875, -1.5762939453125, -1.53271484375, -1.4891357421875, -1.445556640625, -1.4019775390625, -1.3583984375, -1.3148193359375, -1.271240234375, -1.2276611328125, -1.18408203125, -1.1405029296875, -1.096923828125, -1.0533447265625, -1.009765625, -0.9661865234375, -0.922607421875, -0.8790283203125, -0.83544921875, -0.7918701171875, -0.748291015625, -0.7047119140625, -0.6611328125, -0.6175537109375, -0.573974609375, -0.5303955078125, -0.48681640625, -0.4432373046875, -0.399658203125, -0.3560791015625, -0.3125, -0.2689208984375, -0.225341796875, -0.1817626953125, -0.13818359375, -0.0946044921875, -0.051025390625, -0.0074462890625, 0.0361328125, 0.0797119140625, 0.123291015625, 0.1668701171875, 0.21044921875, 0.2540283203125, 0.297607421875, 0.3411865234375, 0.384765625, 0.4283447265625, 0.471923828125, 0.5155029296875, 0.55908203125, 0.6026611328125, 0.646240234375, 0.6898193359375, 0.7333984375, 0.7769775390625, 0.820556640625, 0.8641357421875, 0.90771484375, 0.9512939453125, 0.994873046875, 1.0384521484375, 1.08203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 9.0, 10.0, 7.0, 17.0, 20.0, 32.0, 47.0, 57.0, 80.0, 111.0, 158.0, 266.0, 463.0, 849.0, 1633.0, 3487.0, 10094.0, 42902.0, 256105.0, 545857.0, 147708.0, 26215.0, 6728.0, 2609.0, 1244.0, 675.0, 410.0, 248.0, 166.0, 94.0, 73.0, 35.0, 57.0, 19.0, 11.0, 12.0, 5.0, 5.0, 10.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2534294128417969, -0.24416351318359375, -0.23489761352539062, -0.2256317138671875, -0.21636581420898438, -0.20709991455078125, -0.19783401489257812, -0.188568115234375, -0.17930221557617188, -0.17003631591796875, -0.16077041625976562, -0.1515045166015625, -0.14223861694335938, -0.13297271728515625, -0.12370681762695312, -0.11444091796875, -0.10517501831054688, -0.09590911865234375, -0.08664321899414062, -0.0773773193359375, -0.06811141967773438, -0.05884552001953125, -0.049579620361328125, -0.040313720703125, -0.031047821044921875, -0.02178192138671875, -0.012516021728515625, -0.0032501220703125, 0.006015777587890625, 0.01528167724609375, 0.024547576904296875, 0.0338134765625, 0.043079376220703125, 0.05234527587890625, 0.061611175537109375, 0.0708770751953125, 0.08014297485351562, 0.08940887451171875, 0.09867477416992188, 0.107940673828125, 0.11720657348632812, 0.12647247314453125, 0.13573837280273438, 0.1450042724609375, 0.15427017211914062, 0.16353607177734375, 0.17280197143554688, 0.18206787109375, 0.19133377075195312, 0.20059967041015625, 0.20986557006835938, 0.2191314697265625, 0.22839736938476562, 0.23766326904296875, 0.24692916870117188, 0.256195068359375, 0.2654609680175781, 0.27472686767578125, 0.2839927673339844, 0.2932586669921875, 0.3025245666503906, 0.31179046630859375, 0.3210563659667969, 0.330322265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 5.0, 6.0, 10.0, 15.0, 12.0, 9.0, 31.0, 26.0, 32.0, 43.0, 44.0, 57.0, 43.0, 61.0, 41.0, 42.0, 59.0, 52.0, 65.0, 41.0, 49.0, 42.0, 33.0, 40.0, 25.0, 20.0, 22.0, 20.0, 16.0, 10.0, 5.0, 10.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.64453125, -3.545074462890625, -3.44561767578125, -3.346160888671875, -3.2467041015625, -3.147247314453125, -3.04779052734375, -2.948333740234375, -2.848876953125, -2.749420166015625, -2.64996337890625, -2.550506591796875, -2.4510498046875, -2.351593017578125, -2.25213623046875, -2.152679443359375, -2.05322265625, -1.953765869140625, -1.85430908203125, -1.754852294921875, -1.6553955078125, -1.555938720703125, -1.45648193359375, -1.357025146484375, -1.257568359375, -1.158111572265625, -1.05865478515625, -0.959197998046875, -0.8597412109375, -0.760284423828125, -0.66082763671875, -0.561370849609375, -0.4619140625, -0.362457275390625, -0.26300048828125, -0.163543701171875, -0.0640869140625, 0.035369873046875, 0.13482666015625, 0.234283447265625, 0.333740234375, 0.433197021484375, 0.53265380859375, 0.632110595703125, 0.7315673828125, 0.831024169921875, 0.93048095703125, 1.029937744140625, 1.12939453125, 1.228851318359375, 1.32830810546875, 1.427764892578125, 1.5272216796875, 1.626678466796875, 1.72613525390625, 1.825592041015625, 1.925048828125, 2.024505615234375, 2.12396240234375, 2.223419189453125, 2.3228759765625, 2.422332763671875, 2.52178955078125, 2.621246337890625, 2.720703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 5.0, 7.0, 2.0, 4.0, 8.0, 24.0, 30.0, 63.0, 130.0, 289.0, 738.0, 1888.0, 7004.0, 41825.0, 737265.0, 235658.0, 17740.0, 3798.0, 1213.0, 456.0, 193.0, 96.0, 65.0, 27.0, 13.0, 11.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21435546875, -0.20801162719726562, -0.20166778564453125, -0.19532394409179688, -0.1889801025390625, -0.18263626098632812, -0.17629241943359375, -0.16994857788085938, -0.163604736328125, -0.15726089477539062, -0.15091705322265625, -0.14457321166992188, -0.1382293701171875, -0.13188552856445312, -0.12554168701171875, -0.11919784545898438, -0.11285400390625, -0.10651016235351562, -0.10016632080078125, -0.09382247924804688, -0.0874786376953125, -0.08113479614257812, -0.07479095458984375, -0.06844711303710938, -0.062103271484375, -0.055759429931640625, -0.04941558837890625, -0.043071746826171875, -0.0367279052734375, -0.030384063720703125, -0.02404022216796875, -0.017696380615234375, -0.0113525390625, -0.005008697509765625, 0.00133514404296875, 0.007678985595703125, 0.0140228271484375, 0.020366668701171875, 0.02671051025390625, 0.033054351806640625, 0.039398193359375, 0.045742034912109375, 0.05208587646484375, 0.058429718017578125, 0.0647735595703125, 0.07111740112304688, 0.07746124267578125, 0.08380508422851562, 0.09014892578125, 0.09649276733398438, 0.10283660888671875, 0.10918045043945312, 0.1155242919921875, 0.12186813354492188, 0.12821197509765625, 0.13455581665039062, 0.140899658203125, 0.14724349975585938, 0.15358734130859375, 0.15993118286132812, 0.1662750244140625, 0.17261886596679688, 0.17896270751953125, 0.18530654907226562, 0.191650390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 5.0, 13.0, 8.0, 22.0, 19.0, 31.0, 56.0, 71.0, 92.0, 117.0, 117.0, 109.0, 96.0, 83.0, 51.0, 31.0, 24.0, 17.0, 11.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.192922592163086e-05, -5.942676216363907e-05, -5.692429840564728e-05, -5.442183464765549e-05, -5.1919370889663696e-05, -4.9416907131671906e-05, -4.6914443373680115e-05, -4.4411979615688324e-05, -4.190951585769653e-05, -3.940705209970474e-05, -3.690458834171295e-05, -3.440212458372116e-05, -3.189966082572937e-05, -2.939719706773758e-05, -2.689473330974579e-05, -2.4392269551753998e-05, -2.1889805793762207e-05, -1.9387342035770416e-05, -1.6884878277778625e-05, -1.4382414519786835e-05, -1.1879950761795044e-05, -9.377487003803253e-06, -6.875023245811462e-06, -4.372559487819672e-06, -1.8700957298278809e-06, 6.323680281639099e-07, 3.1348317861557007e-06, 5.6372955441474915e-06, 8.139759302139282e-06, 1.0642223060131073e-05, 1.3144686818122864e-05, 1.5647150576114655e-05, 1.8149614334106445e-05, 2.0652078092098236e-05, 2.3154541850090027e-05, 2.5657005608081818e-05, 2.815946936607361e-05, 3.06619331240654e-05, 3.316439688205719e-05, 3.566686064004898e-05, 3.816932439804077e-05, 4.067178815603256e-05, 4.317425191402435e-05, 4.5676715672016144e-05, 4.8179179430007935e-05, 5.0681643187999725e-05, 5.3184106945991516e-05, 5.568657070398331e-05, 5.81890344619751e-05, 6.069149821996689e-05, 6.319396197795868e-05, 6.569642573595047e-05, 6.819888949394226e-05, 7.070135325193405e-05, 7.320381700992584e-05, 7.570628076791763e-05, 7.820874452590942e-05, 8.071120828390121e-05, 8.3213672041893e-05, 8.57161357998848e-05, 8.821859955787659e-05, 9.072106331586838e-05, 9.322352707386017e-05, 9.572599083185196e-05, 9.822845458984375e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 15.0, 22.0, 28.0, 51.0, 89.0, 170.0, 272.0, 522.0, 912.0, 1582.0, 3029.0, 5911.0, 12022.0, 29141.0, 90231.0, 340112.0, 393616.0, 109150.0, 33951.0, 13763.0, 6556.0, 3344.0, 1811.0, 993.0, 541.0, 277.0, 173.0, 109.0, 66.0, 28.0, 12.0, 18.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08135986328125, -0.07882308959960938, -0.07628631591796875, -0.07374954223632812, -0.0712127685546875, -0.06867599487304688, -0.06613922119140625, -0.06360244750976562, -0.061065673828125, -0.058528900146484375, -0.05599212646484375, -0.053455352783203125, -0.0509185791015625, -0.048381805419921875, -0.04584503173828125, -0.043308258056640625, -0.040771484375, -0.038234710693359375, -0.03569793701171875, -0.033161163330078125, -0.0306243896484375, -0.028087615966796875, -0.02555084228515625, -0.023014068603515625, -0.020477294921875, -0.017940521240234375, -0.01540374755859375, -0.012866973876953125, -0.0103302001953125, -0.007793426513671875, -0.00525665283203125, -0.002719879150390625, -0.00018310546875, 0.002353668212890625, 0.00489044189453125, 0.007427215576171875, 0.0099639892578125, 0.012500762939453125, 0.01503753662109375, 0.017574310302734375, 0.020111083984375, 0.022647857666015625, 0.02518463134765625, 0.027721405029296875, 0.0302581787109375, 0.032794952392578125, 0.03533172607421875, 0.037868499755859375, 0.0404052734375, 0.042942047119140625, 0.04547882080078125, 0.048015594482421875, 0.0505523681640625, 0.053089141845703125, 0.05562591552734375, 0.058162689208984375, 0.060699462890625, 0.06323623657226562, 0.06577301025390625, 0.06830978393554688, 0.0708465576171875, 0.07338333129882812, 0.07592010498046875, 0.07845687866210938, 0.08099365234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 8.0, 11.0, 21.0, 30.0, 42.0, 60.0, 94.0, 125.0, 152.0, 123.0, 110.0, 53.0, 35.0, 37.0, 22.0, 7.0, 11.0, 10.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.036590576171875, -0.035463809967041016, -0.03433704376220703, -0.03321027755737305, -0.03208351135253906, -0.030956745147705078, -0.029829978942871094, -0.02870321273803711, -0.027576446533203125, -0.02644968032836914, -0.025322914123535156, -0.024196147918701172, -0.023069381713867188, -0.021942615509033203, -0.02081584930419922, -0.019689083099365234, -0.01856231689453125, -0.017435550689697266, -0.01630878448486328, -0.015182018280029297, -0.014055252075195312, -0.012928485870361328, -0.011801719665527344, -0.01067495346069336, -0.009548187255859375, -0.00842142105102539, -0.007294654846191406, -0.006167888641357422, -0.0050411224365234375, -0.003914356231689453, -0.0027875900268554688, -0.0016608238220214844, -0.0005340576171875, 0.0005927085876464844, 0.0017194747924804688, 0.002846240997314453, 0.0039730072021484375, 0.005099773406982422, 0.006226539611816406, 0.007353305816650391, 0.008480072021484375, 0.00960683822631836, 0.010733604431152344, 0.011860370635986328, 0.012987136840820312, 0.014113903045654297, 0.015240669250488281, 0.016367435455322266, 0.01749420166015625, 0.018620967864990234, 0.01974773406982422, 0.020874500274658203, 0.022001266479492188, 0.023128032684326172, 0.024254798889160156, 0.02538156509399414, 0.026508331298828125, 0.02763509750366211, 0.028761863708496094, 0.029888629913330078, 0.031015396118164062, 0.03214216232299805, 0.03326892852783203, 0.034395694732666016, 0.0355224609375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 20.0, 24.0, 22.0, 51.0, 66.0, 71.0, 82.0, 101.0, 103.0, 96.0, 95.0, 64.0, 56.0, 47.0, 33.0, 17.0, 21.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0808062553405762, -1.0233845710754395, -0.9659629464149475, -0.9085413217544556, -0.8511196970939636, -0.7936980724334717, -0.736276388168335, -0.678854763507843, -0.6214331388473511, -0.5640115141868591, -0.5065898299217224, -0.44916820526123047, -0.3917465806007385, -0.3343249261379242, -0.27690327167510986, -0.21948164701461792, -0.1620599627494812, -0.10463832318782806, -0.04721667617559433, 0.010204970836639404, 0.06762661039829254, 0.12504824995994568, 0.18246990442276, 0.23989152908325195, 0.2973131835460663, 0.3547348380088806, 0.41215646266937256, 0.4695781171321869, 0.5269997715950012, 0.5844213962554932, 0.6418430805206299, 0.699264645576477, 0.7566863298416138, 0.8141079545021057, 0.8715296387672424, 0.9289512634277344, 0.9863728880882263, 1.0437945127487183, 1.101216197013855, 1.1586377620697021, 1.2160594463348389, 1.2734811305999756, 1.3309026956558228, 1.3883243799209595, 1.4457460641860962, 1.5031676292419434, 1.56058931350708, 1.6180109977722168, 1.6754326820373535, 1.7328543663024902, 1.7902759313583374, 1.8476976156234741, 1.9051192998886108, 1.962540864944458, 2.0199625492095947, 2.0773842334747314, 2.134805679321289, 2.192227363586426, 2.2496490478515625, 2.307070732116699, 2.364492177963257, 2.4219138622283936, 2.4793355464935303, 2.536757230758667, 2.5941789150238037]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 8.0, 16.0, 14.0, 13.0, 21.0, 25.0, 32.0, 42.0, 39.0, 55.0, 43.0, 51.0, 55.0, 67.0, 53.0, 58.0, 58.0, 52.0, 49.0, 33.0, 35.0, 31.0, 37.0, 21.0, 27.0, 16.0, 10.0, 12.0, 3.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3500936031341553, -1.3102937936782837, -1.2704938650131226, -1.230694055557251, -1.1908942461013794, -1.1510944366455078, -1.1112945079803467, -1.071494698524475, -1.0316948890686035, -0.9918950200080872, -0.9520952105522156, -0.9122953414916992, -0.8724955320358276, -0.8326956629753113, -0.7928957939147949, -0.7530959844589233, -0.713296115398407, -0.6734962463378906, -0.633696436882019, -0.5938965678215027, -0.5540967583656311, -0.5142968893051147, -0.4744970500469208, -0.4346972107887268, -0.39489737153053284, -0.35509753227233887, -0.3152976930141449, -0.2754978537559509, -0.23569799959659576, -0.1958981603384018, -0.15609830617904663, -0.11629846692085266, -0.07649862766265869, -0.03669878467917442, 0.003101058304309845, 0.04290090501308441, 0.08270074427127838, 0.12250058352947235, 0.16230043768882751, 0.20210027694702148, 0.24190011620521545, 0.2816999554634094, 0.3214997947216034, 0.36129963397979736, 0.4010995030403137, 0.4408993124961853, 0.48069918155670166, 0.5204989910125732, 0.5602988600730896, 0.600098729133606, 0.6398985385894775, 0.6796984076499939, 0.7194982171058655, 0.7592980861663818, 0.7990978956222534, 0.8388977646827698, 0.8786976337432861, 0.9184975028038025, 0.9582973122596741, 0.9980971813201904, 1.037896990776062, 1.0776968002319336, 1.1174967288970947, 1.1572965383529663, 1.197096347808838]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 4.0, 8.0, 16.0, 28.0, 46.0, 50.0, 87.0, 141.0, 222.0, 403.0, 721.0, 1463.0, 2760.0, 5858.0, 12809.0, 33046.0, 104302.0, 421887.0, 332861.0, 82939.0, 27581.0, 10859.0, 5055.0, 2532.0, 1291.0, 647.0, 374.0, 215.0, 133.0, 59.0, 53.0, 37.0, 19.0, 14.0, 17.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.9732666015625, -1.909423828125, -1.8455810546875, -1.78173828125, -1.7178955078125, -1.654052734375, -1.5902099609375, -1.5263671875, -1.4625244140625, -1.398681640625, -1.3348388671875, -1.27099609375, -1.2071533203125, -1.143310546875, -1.0794677734375, -1.015625, -0.9517822265625, -0.887939453125, -0.8240966796875, -0.76025390625, -0.6964111328125, -0.632568359375, -0.5687255859375, -0.5048828125, -0.4410400390625, -0.377197265625, -0.3133544921875, -0.24951171875, -0.1856689453125, -0.121826171875, -0.0579833984375, 0.005859375, 0.0697021484375, 0.133544921875, 0.1973876953125, 0.26123046875, 0.3250732421875, 0.388916015625, 0.4527587890625, 0.5166015625, 0.5804443359375, 0.644287109375, 0.7081298828125, 0.77197265625, 0.8358154296875, 0.899658203125, 0.9635009765625, 1.02734375, 1.0911865234375, 1.155029296875, 1.2188720703125, 1.28271484375, 1.3465576171875, 1.410400390625, 1.4742431640625, 1.5380859375, 1.6019287109375, 1.665771484375, 1.7296142578125, 1.79345703125, 1.8572998046875, 1.921142578125, 1.9849853515625, 2.048828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 10.0, 18.0, 15.0, 21.0, 14.0, 31.0, 38.0, 35.0, 30.0, 34.0, 35.0, 42.0, 56.0, 48.0, 57.0, 51.0, 50.0, 50.0, 39.0, 39.0, 35.0, 27.0, 35.0, 31.0, 28.0, 24.0, 15.0, 10.0, 15.0, 13.0, 9.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.90234375, -1.8438720703125, -1.785400390625, -1.7269287109375, -1.66845703125, -1.6099853515625, -1.551513671875, -1.4930419921875, -1.4345703125, -1.3760986328125, -1.317626953125, -1.2591552734375, -1.20068359375, -1.1422119140625, -1.083740234375, -1.0252685546875, -0.966796875, -0.9083251953125, -0.849853515625, -0.7913818359375, -0.73291015625, -0.6744384765625, -0.615966796875, -0.5574951171875, -0.4990234375, -0.4405517578125, -0.382080078125, -0.3236083984375, -0.26513671875, -0.2066650390625, -0.148193359375, -0.0897216796875, -0.03125, 0.0272216796875, 0.085693359375, 0.1441650390625, 0.20263671875, 0.2611083984375, 0.319580078125, 0.3780517578125, 0.4365234375, 0.4949951171875, 0.553466796875, 0.6119384765625, 0.67041015625, 0.7288818359375, 0.787353515625, 0.8458251953125, 0.904296875, 0.9627685546875, 1.021240234375, 1.0797119140625, 1.13818359375, 1.1966552734375, 1.255126953125, 1.3135986328125, 1.3720703125, 1.4305419921875, 1.489013671875, 1.5474853515625, 1.60595703125, 1.6644287109375, 1.722900390625, 1.7813720703125, 1.83984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 11.0, 15.0, 31.0, 28.0, 37.0, 67.0, 90.0, 129.0, 194.0, 351.0, 582.0, 1036.0, 1824.0, 3382.0, 6636.0, 13280.0, 29826.0, 74041.0, 218096.0, 425043.0, 166631.0, 59080.0, 24607.0, 11236.0, 5474.0, 2933.0, 1572.0, 879.0, 526.0, 319.0, 219.0, 125.0, 76.0, 63.0, 36.0, 32.0, 16.0, 11.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7001953125, -1.6521453857421875, -1.604095458984375, -1.5560455322265625, -1.50799560546875, -1.4599456787109375, -1.411895751953125, -1.3638458251953125, -1.3157958984375, -1.2677459716796875, -1.219696044921875, -1.1716461181640625, -1.12359619140625, -1.0755462646484375, -1.027496337890625, -0.9794464111328125, -0.931396484375, -0.8833465576171875, -0.835296630859375, -0.7872467041015625, -0.73919677734375, -0.6911468505859375, -0.643096923828125, -0.5950469970703125, -0.5469970703125, -0.4989471435546875, -0.450897216796875, -0.4028472900390625, -0.35479736328125, -0.3067474365234375, -0.258697509765625, -0.2106475830078125, -0.16259765625, -0.1145477294921875, -0.066497802734375, -0.0184478759765625, 0.02960205078125, 0.0776519775390625, 0.125701904296875, 0.1737518310546875, 0.2218017578125, 0.2698516845703125, 0.317901611328125, 0.3659515380859375, 0.41400146484375, 0.4620513916015625, 0.510101318359375, 0.5581512451171875, 0.606201171875, 0.6542510986328125, 0.702301025390625, 0.7503509521484375, 0.79840087890625, 0.8464508056640625, 0.894500732421875, 0.9425506591796875, 0.9906005859375, 1.0386505126953125, 1.086700439453125, 1.1347503662109375, 1.18280029296875, 1.2308502197265625, 1.278900146484375, 1.3269500732421875, 1.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 6.0, 5.0, 2.0, 12.0, 7.0, 11.0, 15.0, 14.0, 23.0, 28.0, 19.0, 30.0, 25.0, 36.0, 30.0, 31.0, 39.0, 41.0, 40.0, 46.0, 50.0, 56.0, 36.0, 52.0, 48.0, 42.0, 34.0, 30.0, 26.0, 25.0, 20.0, 20.0, 15.0, 12.0, 12.0, 8.0, 7.0, 11.0, 3.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0], "bins": [-2.8359375, -2.759490966796875, -2.68304443359375, -2.606597900390625, -2.5301513671875, -2.453704833984375, -2.37725830078125, -2.300811767578125, -2.224365234375, -2.147918701171875, -2.07147216796875, -1.995025634765625, -1.9185791015625, -1.842132568359375, -1.76568603515625, -1.689239501953125, -1.61279296875, -1.536346435546875, -1.45989990234375, -1.383453369140625, -1.3070068359375, -1.230560302734375, -1.15411376953125, -1.077667236328125, -1.001220703125, -0.924774169921875, -0.84832763671875, -0.771881103515625, -0.6954345703125, -0.618988037109375, -0.54254150390625, -0.466094970703125, -0.3896484375, -0.313201904296875, -0.23675537109375, -0.160308837890625, -0.0838623046875, -0.007415771484375, 0.06903076171875, 0.145477294921875, 0.221923828125, 0.298370361328125, 0.37481689453125, 0.451263427734375, 0.5277099609375, 0.604156494140625, 0.68060302734375, 0.757049560546875, 0.83349609375, 0.909942626953125, 0.98638916015625, 1.062835693359375, 1.1392822265625, 1.215728759765625, 1.29217529296875, 1.368621826171875, 1.445068359375, 1.521514892578125, 1.59796142578125, 1.674407958984375, 1.7508544921875, 1.827301025390625, 1.90374755859375, 1.980194091796875, 2.056640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 3.0, 8.0, 14.0, 23.0, 30.0, 31.0, 60.0, 111.0, 145.0, 258.0, 412.0, 548.0, 1043.0, 1696.0, 2798.0, 4905.0, 8576.0, 15474.0, 28666.0, 53365.0, 100313.0, 192965.0, 312652.0, 151032.0, 79202.0, 42182.0, 22788.0, 12500.0, 6848.0, 3914.0, 2297.0, 1383.0, 873.0, 523.0, 310.0, 191.0, 133.0, 89.0, 65.0, 27.0, 32.0, 24.0, 12.0, 5.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.271484375, -0.26357269287109375, -0.2556610107421875, -0.24774932861328125, -0.239837646484375, -0.23192596435546875, -0.2240142822265625, -0.21610260009765625, -0.20819091796875, -0.20027923583984375, -0.1923675537109375, -0.18445587158203125, -0.176544189453125, -0.16863250732421875, -0.1607208251953125, -0.15280914306640625, -0.1448974609375, -0.13698577880859375, -0.1290740966796875, -0.12116241455078125, -0.113250732421875, -0.10533905029296875, -0.0974273681640625, -0.08951568603515625, -0.08160400390625, -0.07369232177734375, -0.0657806396484375, -0.05786895751953125, -0.049957275390625, -0.04204559326171875, -0.0341339111328125, -0.02622222900390625, -0.018310546875, -0.01039886474609375, -0.0024871826171875, 0.00542449951171875, 0.013336181640625, 0.02124786376953125, 0.0291595458984375, 0.03707122802734375, 0.04498291015625, 0.05289459228515625, 0.0608062744140625, 0.06871795654296875, 0.076629638671875, 0.08454132080078125, 0.0924530029296875, 0.10036468505859375, 0.1082763671875, 0.11618804931640625, 0.1240997314453125, 0.13201141357421875, 0.139923095703125, 0.14783477783203125, 0.1557464599609375, 0.16365814208984375, 0.17156982421875, 0.17948150634765625, 0.1873931884765625, 0.19530487060546875, 0.203216552734375, 0.21112823486328125, 0.2190399169921875, 0.22695159912109375, 0.23486328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 8.0, 8.0, 22.0, 26.0, 21.0, 31.0, 31.0, 41.0, 46.0, 61.0, 67.0, 100.0, 116.0, 68.0, 62.0, 53.0, 42.0, 32.0, 28.0, 29.0, 18.0, 12.0, 16.0, 5.0, 11.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.00012564659118652344, -0.00012251641601324081, -0.00011938624083995819, -0.00011625606566667557, -0.00011312589049339294, -0.00010999571532011032, -0.0001068655401468277, -0.00010373536497354507, -0.00010060518980026245, -9.747501462697983e-05, -9.43448394536972e-05, -9.121466428041458e-05, -8.808448910713196e-05, -8.495431393384933e-05, -8.182413876056671e-05, -7.869396358728409e-05, -7.556378841400146e-05, -7.243361324071884e-05, -6.930343806743622e-05, -6.61732628941536e-05, -6.304308772087097e-05, -5.991291254758835e-05, -5.6782737374305725e-05, -5.36525622010231e-05, -5.052238702774048e-05, -4.7392211854457855e-05, -4.426203668117523e-05, -4.113186150789261e-05, -3.8001686334609985e-05, -3.487151116132736e-05, -3.174133598804474e-05, -2.8611160814762115e-05, -2.5480985641479492e-05, -2.235081046819687e-05, -1.9220635294914246e-05, -1.6090460121631622e-05, -1.2960284948348999e-05, -9.830109775066376e-06, -6.6999346017837524e-06, -3.569759428501129e-06, -4.3958425521850586e-07, 2.6905909180641174e-06, 5.820766091346741e-06, 8.950941264629364e-06, 1.2081116437911987e-05, 1.521129161119461e-05, 1.8341466784477234e-05, 2.1471641957759857e-05, 2.460181713104248e-05, 2.7731992304325104e-05, 3.086216747760773e-05, 3.399234265089035e-05, 3.7122517824172974e-05, 4.02526929974556e-05, 4.338286817073822e-05, 4.6513043344020844e-05, 4.964321851730347e-05, 5.277339369058609e-05, 5.590356886386871e-05, 5.903374403715134e-05, 6.216391921043396e-05, 6.529409438371658e-05, 6.84242695569992e-05, 7.155444473028183e-05, 7.468461990356445e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 10.0, 7.0, 12.0, 15.0, 24.0, 33.0, 46.0, 82.0, 108.0, 157.0, 202.0, 355.0, 536.0, 876.0, 1399.0, 2320.0, 4059.0, 7350.0, 14228.0, 28981.0, 62387.0, 139447.0, 351544.0, 235351.0, 103814.0, 46820.0, 22561.0, 11237.0, 5835.0, 3473.0, 1944.0, 1170.0, 754.0, 467.0, 344.0, 202.0, 121.0, 88.0, 52.0, 48.0, 36.0, 26.0, 14.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.393310546875, -0.3820152282714844, -0.37071990966796875, -0.3594245910644531, -0.3481292724609375, -0.3368339538574219, -0.32553863525390625, -0.3142433166503906, -0.302947998046875, -0.2916526794433594, -0.28035736083984375, -0.2690620422363281, -0.2577667236328125, -0.24647140502929688, -0.23517608642578125, -0.22388076782226562, -0.21258544921875, -0.20129013061523438, -0.18999481201171875, -0.17869949340820312, -0.1674041748046875, -0.15610885620117188, -0.14481353759765625, -0.13351821899414062, -0.122222900390625, -0.11092758178710938, -0.09963226318359375, -0.08833694458007812, -0.0770416259765625, -0.06574630737304688, -0.05445098876953125, -0.043155670166015625, -0.0318603515625, -0.020565032958984375, -0.00926971435546875, 0.002025604248046875, 0.0133209228515625, 0.024616241455078125, 0.03591156005859375, 0.047206878662109375, 0.058502197265625, 0.06979751586914062, 0.08109283447265625, 0.09238815307617188, 0.1036834716796875, 0.11497879028320312, 0.12627410888671875, 0.13756942749023438, 0.14886474609375, 0.16016006469726562, 0.17145538330078125, 0.18275070190429688, 0.1940460205078125, 0.20534133911132812, 0.21663665771484375, 0.22793197631835938, 0.239227294921875, 0.2505226135253906, 0.26181793212890625, 0.2731132507324219, 0.2844085693359375, 0.2957038879394531, 0.30699920654296875, 0.3182945251464844, 0.32958984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 2.0, 11.0, 10.0, 10.0, 15.0, 18.0, 22.0, 31.0, 33.0, 36.0, 42.0, 50.0, 72.0, 96.0, 93.0, 82.0, 51.0, 52.0, 49.0, 36.0, 29.0, 29.0, 28.0, 22.0, 15.0, 17.0, 9.0, 10.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.2469940185546875, -0.238616943359375, -0.2302398681640625, -0.22186279296875, -0.2134857177734375, -0.205108642578125, -0.1967315673828125, -0.1883544921875, -0.1799774169921875, -0.171600341796875, -0.1632232666015625, -0.15484619140625, -0.1464691162109375, -0.138092041015625, -0.1297149658203125, -0.121337890625, -0.1129608154296875, -0.104583740234375, -0.0962066650390625, -0.08782958984375, -0.0794525146484375, -0.071075439453125, -0.0626983642578125, -0.0543212890625, -0.0459442138671875, -0.037567138671875, -0.0291900634765625, -0.02081298828125, -0.0124359130859375, -0.004058837890625, 0.0043182373046875, 0.0126953125, 0.0210723876953125, 0.029449462890625, 0.0378265380859375, 0.04620361328125, 0.0545806884765625, 0.062957763671875, 0.0713348388671875, 0.0797119140625, 0.0880889892578125, 0.096466064453125, 0.1048431396484375, 0.11322021484375, 0.1215972900390625, 0.129974365234375, 0.1383514404296875, 0.146728515625, 0.1551055908203125, 0.163482666015625, 0.1718597412109375, 0.18023681640625, 0.1886138916015625, 0.196990966796875, 0.2053680419921875, 0.2137451171875, 0.2221221923828125, 0.230499267578125, 0.2388763427734375, 0.24725341796875, 0.2556304931640625, 0.264007568359375, 0.2723846435546875, 0.28076171875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 13.0, 13.0, 28.0, 29.0, 78.0, 78.0, 95.0, 138.0, 93.0, 126.0, 104.0, 70.0, 48.0, 36.0, 17.0, 10.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.894886016845703, -4.7289509773254395, -4.563016414642334, -4.39708137512207, -4.231146812438965, -4.065211772918701, -3.8992769718170166, -3.733342170715332, -3.5674073696136475, -3.401472568511963, -3.2355377674102783, -3.0696029663085938, -2.90366792678833, -2.7377333641052246, -2.571798324584961, -2.4058635234832764, -2.239928722381592, -2.0739939212799072, -1.9080591201782227, -1.7421241998672485, -1.576189398765564, -1.4102545976638794, -1.2443196773529053, -1.0783848762512207, -0.9124500751495361, -0.7465152740478516, -0.5805804133415222, -0.41464558243751526, -0.2487107515335083, -0.08277595043182373, 0.08315891027450562, 0.24909377098083496, 0.41502904891967773, 0.5809638500213623, 0.7468987107276917, 0.912833571434021, 1.0787683725357056, 1.2447031736373901, 1.4106380939483643, 1.5765728950500488, 1.7425076961517334, 1.908442497253418, 2.0743772983551025, 2.240312099456787, 2.406247138977051, 2.5721817016601562, 2.73811674118042, 2.9040515422821045, 3.069986343383789, 3.2359211444854736, 3.401855945587158, 3.5677907466888428, 3.7337255477905273, 3.899660587310791, 4.0655951499938965, 4.23153018951416, 4.397464752197266, 4.563399791717529, 4.729334354400635, 4.895269393920898, 5.061203956604004, 5.227138996124268, 5.393073558807373, 5.559008598327637, 5.7249436378479]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 7.0, 3.0, 6.0, 7.0, 8.0, 12.0, 15.0, 15.0, 17.0, 23.0, 16.0, 20.0, 14.0, 19.0, 28.0, 31.0, 39.0, 40.0, 29.0, 37.0, 44.0, 30.0, 37.0, 52.0, 32.0, 41.0, 35.0, 31.0, 30.0, 25.0, 28.0, 26.0, 24.0, 25.0, 22.0, 21.0, 17.0, 16.0, 17.0, 10.0, 17.0, 9.0, 5.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.084555625915527, -3.9525306224823, -3.8205056190490723, -3.6884806156158447, -3.556455612182617, -3.4244308471679688, -3.292405843734741, -3.1603808403015137, -3.028355836868286, -2.8963308334350586, -2.764305830001831, -2.6322808265686035, -2.500256061553955, -2.3682308197021484, -2.2362060546875, -2.1041810512542725, -1.972156047821045, -1.8401310443878174, -1.7081060409545898, -1.5760811567306519, -1.4440561532974243, -1.3120311498641968, -1.1800062656402588, -1.0479812622070312, -0.9159562587738037, -0.7839312553405762, -0.6519063115119934, -0.5198813676834106, -0.3878563642501831, -0.25583136081695557, -0.1238064169883728, 0.008218526840209961, 0.1402430534362793, 0.27226802706718445, 0.4042930006980896, 0.5363179445266724, 0.6683429479598999, 0.8003679513931274, 0.9323928952217102, 1.064417839050293, 1.1964428424835205, 1.328467845916748, 1.4604928493499756, 1.5925177335739136, 1.7245427370071411, 1.8565677404403687, 1.9885926246643066, 2.120617628097534, 2.2526426315307617, 2.3846676349639893, 2.516692638397217, 2.6487176418304443, 2.780742645263672, 2.9127674102783203, 3.044792413711548, 3.1768174171447754, 3.308842420578003, 3.4408674240112305, 3.572892427444458, 3.7049174308776855, 3.836942195892334, 3.9689674377441406, 4.100992202758789, 4.2330169677734375, 4.365042209625244]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 6.0, 12.0, 9.0, 12.0, 21.0, 31.0, 37.0, 42.0, 68.0, 77.0, 113.0, 129.0, 164.0, 212.0, 235.0, 313.0, 372.0, 431.0, 512.0, 587.0, 785.0, 1167.0, 1040670.0, 929.0, 670.0, 561.0, 449.0, 399.0, 323.0, 243.0, 193.0, 190.0, 122.0, 121.0, 97.0, 75.0, 55.0, 33.0, 28.0, 29.0, 19.0, 19.0, 9.0, 9.0, 7.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-4.427000045776367, -4.280395984649658, -4.133791923522949, -3.9871878623962402, -3.8405838012695312, -3.6939797401428223, -3.5473756790161133, -3.4007716178894043, -3.2541675567626953, -3.1075634956359863, -2.9609594345092773, -2.8143553733825684, -2.6677513122558594, -2.5211472511291504, -2.3745431900024414, -2.2279391288757324, -2.0813350677490234, -1.9347310066223145, -1.7881269454956055, -1.6415228843688965, -1.4949188232421875, -1.3483147621154785, -1.2017107009887695, -1.0551066398620605, -0.9085025787353516, -0.7618985176086426, -0.6152944564819336, -0.4686903953552246, -0.3220863342285156, -0.17548227310180664, -0.028878211975097656, 0.11772584915161133, 0.2643303871154785, 0.4109344482421875, 0.5575385093688965, 0.7041425704956055, 0.8507466316223145, 0.9973506927490234, 1.1439547538757324, 1.2905588150024414, 1.4371628761291504, 1.5837669372558594, 1.7303709983825684, 1.8769750595092773, 2.0235791206359863, 2.1701831817626953, 2.3167872428894043, 2.4633913040161133, 2.6099953651428223, 2.7565994262695312, 2.9032034873962402, 3.049807548522949, 3.196411609649658, 3.343015670776367, 3.489619731903076, 3.636223793029785, 3.782827854156494, 3.929431915283203, 4.076035976409912, 4.222640037536621, 4.36924409866333, 4.515848159790039, 4.662452220916748, 4.809056282043457, 4.955660343170166]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 9.0, 8.0, 11.0, 15.0, 35.0, 80.0, 155.0, 393.0, 1144.0, 3213.0, 9693.0, 51413792.0, 31560.0, 7211.0, 2556.0, 858.0, 317.0, 132.0, 63.0, 26.0, 21.0, 10.0, 7.0, 8.0, 5.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.18787384033203, -20.453519821166992, -19.719165802001953, -18.984811782836914, -18.250457763671875, -17.516103744506836, -16.781749725341797, -16.047395706176758, -15.313041687011719, -14.57868766784668, -13.84433364868164, -13.109979629516602, -12.375625610351562, -11.641271591186523, -10.906917572021484, -10.172563552856445, -9.438210487365723, -8.703856468200684, -7.9695024490356445, -7.2351484298706055, -6.500794410705566, -5.766440391540527, -5.0320868492126465, -4.297732830047607, -3.5633788108825684, -2.8290247917175293, -2.0946707725524902, -1.3603169918060303, -0.6259629726409912, 0.10839104652404785, 0.8427448272705078, 1.5770988464355469, 2.311452865600586, 3.045806884765625, 3.780160903930664, 4.514514923095703, 5.248868942260742, 5.983222961425781, 6.717576503753662, 7.451930522918701, 8.186285018920898, 8.920639038085938, 9.654993057250977, 10.389347076416016, 11.123701095581055, 11.858055114746094, 12.592409133911133, 13.326763153076172, 14.061116218566895, 14.795470237731934, 15.529824256896973, 16.264177322387695, 16.998531341552734, 17.732885360717773, 18.467239379882812, 19.20159339904785, 19.93594741821289, 20.67030143737793, 21.40465545654297, 22.139009475708008, 22.873363494873047, 23.607717514038086, 24.342071533203125, 25.076425552368164, 25.810779571533203]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 14.0, 6.0, 27.0, 35.0, 66.0, 69.0, 86.0, 151.0, 186.0, 302.0, 484.0, 759.0, 1212.0, 2023.0, 3615.0, 6101.0, 10912.0, 19809.0, 36960.0, 68946.0, 125730.0, 217430.0, 346115.0, 597760.0, 3375342.0, 621559.0, 349673.0, 222420.0, 127958.0, 70477.0, 37910.0, 20382.0, 11366.0, 6269.0, 3647.0, 2022.0, 1304.0, 796.0, 509.0, 339.0, 196.0, 129.0, 111.0, 83.0, 45.0, 31.0, 28.0, 15.0, 9.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.810546875, -0.7848281860351562, -0.7591094970703125, -0.7333908081054688, -0.707672119140625, -0.6819534301757812, -0.6562347412109375, -0.6305160522460938, -0.60479736328125, -0.5790786743164062, -0.5533599853515625, -0.5276412963867188, -0.501922607421875, -0.47620391845703125, -0.4504852294921875, -0.42476654052734375, -0.3990478515625, -0.37332916259765625, -0.3476104736328125, -0.32189178466796875, -0.296173095703125, -0.27045440673828125, -0.2447357177734375, -0.21901702880859375, -0.19329833984375, -0.16757965087890625, -0.1418609619140625, -0.11614227294921875, -0.090423583984375, -0.06470489501953125, -0.0389862060546875, -0.01326751708984375, 0.012451171875, 0.03816986083984375, 0.0638885498046875, 0.08960723876953125, 0.115325927734375, 0.14104461669921875, 0.1667633056640625, 0.19248199462890625, 0.21820068359375, 0.24391937255859375, 0.2696380615234375, 0.29535675048828125, 0.321075439453125, 0.34679412841796875, 0.3725128173828125, 0.39823150634765625, 0.4239501953125, 0.44966888427734375, 0.4753875732421875, 0.5011062622070312, 0.526824951171875, 0.5525436401367188, 0.5782623291015625, 0.6039810180664062, 0.62969970703125, 0.6554183959960938, 0.6811370849609375, 0.7068557739257812, 0.732574462890625, 0.7582931518554688, 0.7840118408203125, 0.8097305297851562, 0.83544921875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 9.0, 3.0, 5.0, 9.0, 18.0, 14.0, 16.0, 20.0, 15.0, 32.0, 33.0, 34.0, 51.0, 27.0, 46.0, 50.0, 35.0, 75.0, 956.0, 110.0, 48.0, 38.0, 48.0, 36.0, 26.0, 42.0, 33.0, 28.0, 14.0, 31.0, 22.0, 12.0, 18.0, 9.0, 7.0, 11.0, 7.0, 6.0, 4.0, 8.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9296875, -12.5203857421875, -12.111083984375, -11.7017822265625, -11.29248046875, -10.8831787109375, -10.473876953125, -10.0645751953125, -9.6552734375, -9.2459716796875, -8.836669921875, -8.4273681640625, -8.01806640625, -7.6087646484375, -7.199462890625, -6.7901611328125, -6.380859375, -5.9715576171875, -5.562255859375, -5.1529541015625, -4.74365234375, -4.3343505859375, -3.925048828125, -3.5157470703125, -3.1064453125, -2.6971435546875, -2.287841796875, -1.8785400390625, -1.46923828125, -1.0599365234375, -0.650634765625, -0.2413330078125, 0.16796875, 0.5772705078125, 0.986572265625, 1.3958740234375, 1.80517578125, 2.2144775390625, 2.623779296875, 3.0330810546875, 3.4423828125, 3.8516845703125, 4.260986328125, 4.6702880859375, 5.07958984375, 5.4888916015625, 5.898193359375, 6.3074951171875, 6.716796875, 7.1260986328125, 7.535400390625, 7.9447021484375, 8.35400390625, 8.7633056640625, 9.172607421875, 9.5819091796875, 9.9912109375, 10.4005126953125, 10.809814453125, 11.2191162109375, 11.62841796875, 12.0377197265625, 12.447021484375, 12.8563232421875, 13.265625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 2.0, 6.0, 7.0, 15.0, 15.0, 26.0, 38.0, 63.0, 111.0, 217.0, 471.0, 1082.0, 2590.0, 7117.0, 18970.0, 51129.0, 129822.0, 289793.0, 530696.0, 3646687.0, 845763.0, 419395.0, 207161.0, 87072.0, 33396.0, 12120.0, 4436.0, 1755.0, 774.0, 326.0, 160.0, 92.0, 58.0, 26.0, 16.0, 16.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.1201171875, -1.09393310546875, -1.0677490234375, -1.04156494140625, -1.015380859375, -0.98919677734375, -0.9630126953125, -0.93682861328125, -0.91064453125, -0.88446044921875, -0.8582763671875, -0.83209228515625, -0.805908203125, -0.77972412109375, -0.7535400390625, -0.72735595703125, -0.701171875, -0.67498779296875, -0.6488037109375, -0.62261962890625, -0.596435546875, -0.57025146484375, -0.5440673828125, -0.51788330078125, -0.49169921875, -0.46551513671875, -0.4393310546875, -0.41314697265625, -0.386962890625, -0.36077880859375, -0.3345947265625, -0.30841064453125, -0.2822265625, -0.25604248046875, -0.2298583984375, -0.20367431640625, -0.177490234375, -0.15130615234375, -0.1251220703125, -0.09893798828125, -0.07275390625, -0.04656982421875, -0.0203857421875, 0.00579833984375, 0.031982421875, 0.05816650390625, 0.0843505859375, 0.11053466796875, 0.13671875, 0.16290283203125, 0.1890869140625, 0.21527099609375, 0.241455078125, 0.26763916015625, 0.2938232421875, 0.32000732421875, 0.34619140625, 0.37237548828125, 0.3985595703125, 0.42474365234375, 0.450927734375, 0.47711181640625, 0.5032958984375, 0.52947998046875, 0.5556640625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 14.0, 14.0, 20.0, 23.0, 23.0, 33.0, 31.0, 34.0, 41.0, 47.0, 49.0, 46.0, 56.0, 729.0, 399.0, 42.0, 54.0, 48.0, 54.0, 42.0, 34.0, 34.0, 23.0, 24.0, 15.0, 23.0, 14.0, 17.0, 13.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.359375, -9.926025390625, -9.49267578125, -9.059326171875, -8.6259765625, -8.192626953125, -7.75927734375, -7.325927734375, -6.892578125, -6.459228515625, -6.02587890625, -5.592529296875, -5.1591796875, -4.725830078125, -4.29248046875, -3.859130859375, -3.42578125, -2.992431640625, -2.55908203125, -2.125732421875, -1.6923828125, -1.259033203125, -0.82568359375, -0.392333984375, 0.041015625, 0.474365234375, 0.90771484375, 1.341064453125, 1.7744140625, 2.207763671875, 2.64111328125, 3.074462890625, 3.5078125, 3.941162109375, 4.37451171875, 4.807861328125, 5.2412109375, 5.674560546875, 6.10791015625, 6.541259765625, 6.974609375, 7.407958984375, 7.84130859375, 8.274658203125, 8.7080078125, 9.141357421875, 9.57470703125, 10.008056640625, 10.44140625, 10.874755859375, 11.30810546875, 11.741455078125, 12.1748046875, 12.608154296875, 13.04150390625, 13.474853515625, 13.908203125, 14.341552734375, 14.77490234375, 15.208251953125, 15.6416015625, 16.074951171875, 16.50830078125, 16.941650390625, 17.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 8.0, 10.0, 13.0, 25.0, 43.0, 63.0, 90.0, 163.0, 203.0, 336.0, 553.0, 822.0, 1378.0, 2734.0, 5518.0, 14007.0, 44053.0, 204353.0, 4574113.0, 1228844.0, 155472.0, 36119.0, 11836.0, 4856.0, 2367.0, 1269.0, 780.0, 485.0, 311.0, 207.0, 133.0, 81.0, 50.0, 37.0, 26.0, 23.0, 5.0, 17.0, 6.0, 5.0, 8.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5712890625, -1.5129241943359375, -1.454559326171875, -1.3961944580078125, -1.33782958984375, -1.2794647216796875, -1.221099853515625, -1.1627349853515625, -1.1043701171875, -1.0460052490234375, -0.987640380859375, -0.9292755126953125, -0.87091064453125, -0.8125457763671875, -0.754180908203125, -0.6958160400390625, -0.637451171875, -0.5790863037109375, -0.520721435546875, -0.4623565673828125, -0.40399169921875, -0.3456268310546875, -0.287261962890625, -0.2288970947265625, -0.1705322265625, -0.1121673583984375, -0.053802490234375, 0.0045623779296875, 0.06292724609375, 0.1212921142578125, 0.179656982421875, 0.2380218505859375, 0.29638671875, 0.3547515869140625, 0.413116455078125, 0.4714813232421875, 0.52984619140625, 0.5882110595703125, 0.646575927734375, 0.7049407958984375, 0.7633056640625, 0.8216705322265625, 0.880035400390625, 0.9384002685546875, 0.99676513671875, 1.0551300048828125, 1.113494873046875, 1.1718597412109375, 1.230224609375, 1.2885894775390625, 1.346954345703125, 1.4053192138671875, 1.46368408203125, 1.5220489501953125, 1.580413818359375, 1.6387786865234375, 1.6971435546875, 1.7555084228515625, 1.813873291015625, 1.8722381591796875, 1.93060302734375, 1.9889678955078125, 2.047332763671875, 2.1056976318359375, 2.1640625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 7.0, 8.0, 7.0, 9.0, 6.0, 10.0, 9.0, 24.0, 27.0, 28.0, 33.0, 41.0, 36.0, 54.0, 56.0, 43.0, 40.0, 150.0, 986.0, 61.0, 49.0, 37.0, 49.0, 40.0, 35.0, 26.0, 29.0, 27.0, 28.0, 13.0, 19.0, 13.0, 5.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5078125, -12.07861328125, -11.6494140625, -11.22021484375, -10.791015625, -10.36181640625, -9.9326171875, -9.50341796875, -9.07421875, -8.64501953125, -8.2158203125, -7.78662109375, -7.357421875, -6.92822265625, -6.4990234375, -6.06982421875, -5.640625, -5.21142578125, -4.7822265625, -4.35302734375, -3.923828125, -3.49462890625, -3.0654296875, -2.63623046875, -2.20703125, -1.77783203125, -1.3486328125, -0.91943359375, -0.490234375, -0.06103515625, 0.3681640625, 0.79736328125, 1.2265625, 1.65576171875, 2.0849609375, 2.51416015625, 2.943359375, 3.37255859375, 3.8017578125, 4.23095703125, 4.66015625, 5.08935546875, 5.5185546875, 5.94775390625, 6.376953125, 6.80615234375, 7.2353515625, 7.66455078125, 8.09375, 8.52294921875, 8.9521484375, 9.38134765625, 9.810546875, 10.23974609375, 10.6689453125, 11.09814453125, 11.52734375, 11.95654296875, 12.3857421875, 12.81494140625, 13.244140625, 13.67333984375, 14.1025390625, 14.53173828125, 14.9609375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 10.0, 27.0, 58.0, 290.0, 361.0, 179.0, 45.0, 18.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.83673858642578, -38.67256164550781, -37.508384704589844, -36.34421157836914, -35.18003463745117, -34.0158576965332, -32.8516845703125, -31.68750762939453, -30.523330688476562, -29.359153747558594, -28.194978713989258, -27.030803680419922, -25.866626739501953, -24.702449798583984, -23.53827476501465, -22.374099731445312, -21.209922790527344, -20.045745849609375, -18.88157081604004, -17.717395782470703, -16.553218841552734, -15.389042854309082, -14.22486686706543, -13.060690879821777, -11.896514892578125, -10.732338905334473, -9.56816291809082, -8.403986930847168, -7.239810943603516, -6.075634956359863, -4.911458969116211, -3.7472829818725586, -2.583110809326172, -1.4189348220825195, -0.2547588348388672, 0.9094171524047852, 2.0735931396484375, 3.23776912689209, 4.401945114135742, 5.5661211013793945, 6.730297088623047, 7.894473075866699, 9.058649063110352, 10.222825050354004, 11.387001037597656, 12.551177024841309, 13.715353012084961, 14.879528999328613, 16.043704986572266, 17.207881927490234, 18.37205696105957, 19.536231994628906, 20.700408935546875, 21.864585876464844, 23.02876091003418, 24.192935943603516, 25.357112884521484, 26.521289825439453, 27.68546485900879, 28.849639892578125, 30.013816833496094, 31.177993774414062, 32.34217071533203, 33.506343841552734, 34.6705207824707]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 11.0, 13.0, 10.0, 19.0, 16.0, 39.0, 56.0, 54.0, 71.0, 96.0, 88.0, 103.0, 81.0, 83.0, 62.0, 45.0, 30.0, 33.0, 24.0, 17.0, 11.0, 14.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.75379180908203, -34.51516342163086, -33.27653121948242, -32.03790283203125, -30.799270629882812, -29.56064224243164, -28.322011947631836, -27.08338165283203, -25.844751358032227, -24.606121063232422, -23.367490768432617, -22.128860473632812, -20.89023208618164, -19.651599884033203, -18.41297149658203, -17.174341201782227, -15.935710906982422, -14.697080612182617, -13.458450317382812, -12.219820976257324, -10.98119068145752, -9.742560386657715, -8.503931045532227, -7.265300750732422, -6.026670455932617, -4.7880401611328125, -3.549410343170166, -2.3107802867889404, -1.0721502304077148, 0.16648006439208984, 1.4051098823547363, 2.643739700317383, 3.882373809814453, 5.121004104614258, 6.359633922576904, 7.598263740539551, 8.836894035339355, 10.07552433013916, 11.314153671264648, 12.552783966064453, 13.791414260864258, 15.030044555664062, 16.268674850463867, 17.507305145263672, 18.745933532714844, 19.98456573486328, 21.223194122314453, 22.461824417114258, 23.700454711914062, 24.939085006713867, 26.177715301513672, 27.416345596313477, 28.65497589111328, 29.893604278564453, 31.132234573364258, 32.37086486816406, 33.6094970703125, 34.84812545776367, 36.08675765991211, 37.32538604736328, 38.56401824951172, 39.80264663696289, 41.04127883911133, 42.2799072265625, 43.51853561401367]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 10.0, 20.0, 892.0, 1817.0, 2797.0, 6540.0, 39773.0, 3110763.0, 1000234.0, 25372.0, 3689.0, 1995.0, 295.0, 26.0, 18.0, 10.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.1486968994140625, -0.142730712890625, -0.1367645263671875, -0.13079833984375, -0.1248321533203125, -0.118865966796875, -0.1128997802734375, -0.10693359375, -0.1009674072265625, -0.095001220703125, -0.0890350341796875, -0.08306884765625, -0.0771026611328125, -0.071136474609375, -0.0651702880859375, -0.0592041015625, -0.0532379150390625, -0.047271728515625, -0.0413055419921875, -0.03533935546875, -0.0293731689453125, -0.023406982421875, -0.0174407958984375, -0.011474609375, -0.0055084228515625, 0.000457763671875, 0.0064239501953125, 0.01239013671875, 0.0183563232421875, 0.024322509765625, 0.0302886962890625, 0.0362548828125, 0.0422210693359375, 0.048187255859375, 0.0541534423828125, 0.06011962890625, 0.0660858154296875, 0.072052001953125, 0.0780181884765625, 0.083984375, 0.0899505615234375, 0.095916748046875, 0.1018829345703125, 0.10784912109375, 0.1138153076171875, 0.119781494140625, 0.1257476806640625, 0.1317138671875, 0.1376800537109375, 0.143646240234375, 0.1496124267578125, 0.15557861328125, 0.1615447998046875, 0.167510986328125, 0.1734771728515625, 0.179443359375, 0.1854095458984375, 0.191375732421875, 0.1973419189453125, 0.20330810546875, 0.2092742919921875, 0.215240478515625, 0.2212066650390625, 0.2271728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 9.0, 12.0, 18.0, 35.0, 41.0, 81.0, 147.0, 339.0, 132.0, 71.0, 40.0, 18.0, 16.0, 9.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1600341796875, -0.15440750122070312, -0.14878082275390625, -0.14315414428710938, -0.1375274658203125, -0.13190078735351562, -0.12627410888671875, -0.12064743041992188, -0.115020751953125, -0.10939407348632812, -0.10376739501953125, -0.09814071655273438, -0.0925140380859375, -0.08688735961914062, -0.08126068115234375, -0.07563400268554688, -0.07000732421875, -0.06438064575195312, -0.05875396728515625, -0.053127288818359375, -0.0475006103515625, -0.041873931884765625, -0.03624725341796875, -0.030620574951171875, -0.024993896484375, -0.019367218017578125, -0.01374053955078125, -0.008113861083984375, -0.0024871826171875, 0.003139495849609375, 0.00876617431640625, 0.014392852783203125, 0.02001953125, 0.025646209716796875, 0.03127288818359375, 0.036899566650390625, 0.0425262451171875, 0.048152923583984375, 0.05377960205078125, 0.059406280517578125, 0.065032958984375, 0.07065963745117188, 0.07628631591796875, 0.08191299438476562, 0.0875396728515625, 0.09316635131835938, 0.09879302978515625, 0.10441970825195312, 0.11004638671875, 0.11567306518554688, 0.12129974365234375, 0.12692642211914062, 0.1325531005859375, 0.13817977905273438, 0.14380645751953125, 0.14943313598632812, 0.155059814453125, 0.16068649291992188, 0.16631317138671875, 0.17193984985351562, 0.1775665283203125, 0.18319320678710938, 0.18881988525390625, 0.19444656372070312, 0.2000732421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 23.0, 32.0, 35.0, 48.0, 132.0, 408.0, 3295.0, 4181872.0, 7511.0, 567.0, 160.0, 70.0, 44.0, 22.0, 21.0, 8.0, 6.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31005859375, -0.29569244384765625, -0.2813262939453125, -0.26696014404296875, -0.252593994140625, -0.23822784423828125, -0.2238616943359375, -0.20949554443359375, -0.19512939453125, -0.18076324462890625, -0.1663970947265625, -0.15203094482421875, -0.137664794921875, -0.12329864501953125, -0.1089324951171875, -0.09456634521484375, -0.0802001953125, -0.06583404541015625, -0.0514678955078125, -0.03710174560546875, -0.022735595703125, -0.00836944580078125, 0.0059967041015625, 0.02036285400390625, 0.03472900390625, 0.04909515380859375, 0.0634613037109375, 0.07782745361328125, 0.092193603515625, 0.10655975341796875, 0.1209259033203125, 0.13529205322265625, 0.149658203125, 0.16402435302734375, 0.1783905029296875, 0.19275665283203125, 0.207122802734375, 0.22148895263671875, 0.2358551025390625, 0.25022125244140625, 0.26458740234375, 0.27895355224609375, 0.2933197021484375, 0.30768585205078125, 0.322052001953125, 0.33641815185546875, 0.3507843017578125, 0.36515045166015625, 0.3795166015625, 0.39388275146484375, 0.4082489013671875, 0.42261505126953125, 0.436981201171875, 0.45134735107421875, 0.4657135009765625, 0.48007965087890625, 0.49444580078125, 0.5088119506835938, 0.5231781005859375, 0.5375442504882812, 0.551910400390625, 0.5662765502929688, 0.5806427001953125, 0.5950088500976562, 0.609375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 10.0, 18.0, 28.0, 34.0, 28.0, 102.0, 217.0, 567.0, 1280.0, 960.0, 470.0, 168.0, 69.0, 41.0, 28.0, 23.0, 13.0, 7.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06317138671875, -0.060128211975097656, -0.05708503723144531, -0.05404186248779297, -0.050998687744140625, -0.04795551300048828, -0.04491233825683594, -0.041869163513183594, -0.03882598876953125, -0.035782814025878906, -0.03273963928222656, -0.02969646453857422, -0.026653289794921875, -0.02361011505126953, -0.020566940307617188, -0.017523765563964844, -0.0144805908203125, -0.011437416076660156, -0.008394241333007812, -0.005351066589355469, -0.002307891845703125, 0.0007352828979492188, 0.0037784576416015625, 0.006821632385253906, 0.00986480712890625, 0.012907981872558594, 0.015951156616210938, 0.01899433135986328, 0.022037506103515625, 0.02508068084716797, 0.028123855590820312, 0.031167030334472656, 0.034210205078125, 0.037253379821777344, 0.04029655456542969, 0.04333972930908203, 0.046382904052734375, 0.04942607879638672, 0.05246925354003906, 0.055512428283691406, 0.05855560302734375, 0.061598777770996094, 0.06464195251464844, 0.06768512725830078, 0.07072830200195312, 0.07377147674560547, 0.07681465148925781, 0.07985782623291016, 0.0829010009765625, 0.08594417572021484, 0.08898735046386719, 0.09203052520751953, 0.09507369995117188, 0.09811687469482422, 0.10116004943847656, 0.1042032241821289, 0.10724639892578125, 0.1102895736694336, 0.11333274841308594, 0.11637592315673828, 0.11941909790039062, 0.12246227264404297, 0.1255054473876953, 0.12854862213134766, 0.131591796875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 25.0, 848.0, 142.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.639014720916748, -2.5812911987304688, -2.5235679149627686, -2.4658443927764893, -2.40812087059021, -2.3503975868225098, -2.2926740646362305, -2.234950542449951, -2.177227258682251, -2.1195037364959717, -2.0617804527282715, -2.004056930541992, -1.9463335275650024, -1.8886101245880127, -1.8308866024017334, -1.7731631994247437, -1.7154396772384644, -1.6577162742614746, -1.5999927520751953, -1.5422693490982056, -1.4845459461212158, -1.4268224239349365, -1.3690990209579468, -1.311375617980957, -1.2536520957946777, -1.195928692817688, -1.1382051706314087, -1.080481767654419, -1.0227583646774292, -0.9650349020957947, -0.9073114395141602, -0.8495880365371704, -0.7918646335601807, -0.7341411709785461, -0.6764177680015564, -0.6186943054199219, -0.5609709024429321, -0.5032474398612976, -0.4455239772796631, -0.38780054450035095, -0.3300771117210388, -0.2723536789417267, -0.21463023126125336, -0.15690678358078003, -0.0991833508014679, -0.04145991802215576, 0.01626354455947876, 0.0739869773387909, 0.13171041011810303, 0.18943384289741516, 0.2471572905778885, 0.3048807382583618, 0.36260417103767395, 0.4203276038169861, 0.4780510663986206, 0.5357744693756104, 0.5934979319572449, 0.6512213945388794, 0.7089447975158691, 0.7666682600975037, 0.8243917226791382, 0.8821151256561279, 0.9398385882377625, 0.997562050819397, 1.0552854537963867]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 10.0, 9.0, 12.0, 19.0, 17.0, 24.0, 20.0, 34.0, 28.0, 43.0, 38.0, 39.0, 48.0, 46.0, 41.0, 46.0, 47.0, 53.0, 44.0, 44.0, 46.0, 51.0, 37.0, 23.0, 34.0, 20.0, 20.0, 18.0, 15.0, 14.0, 14.0, 12.0, 12.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1742118000984192, -0.16894155740737915, -0.1636713296175003, -0.15840108692646027, -0.15313085913658142, -0.14786061644554138, -0.14259037375450134, -0.1373201459646225, -0.13204991817474365, -0.1267796754837036, -0.12150944769382477, -0.11623920500278473, -0.11096897721290588, -0.10569873452186584, -0.1004284992814064, -0.09515826404094696, -0.08988802134990692, -0.08461778610944748, -0.07934755086898804, -0.074077308177948, -0.06880708038806915, -0.06353683769702911, -0.05826660245656967, -0.05299636721611023, -0.04772613197565079, -0.042455896735191345, -0.0371856614947319, -0.03191542252898216, -0.02664518728852272, -0.021374952048063278, -0.016104713082313538, -0.010834477841854095, -0.005564242601394653, -0.00029400642961263657, 0.00497622974216938, 0.010246466845273972, 0.015516702085733414, 0.020786937326192856, 0.026057176291942596, 0.03132741153240204, 0.03659764677286148, 0.04186788201332092, 0.047138117253780365, 0.052408356219530106, 0.05767859145998955, 0.06294882297515869, 0.06821906566619873, 0.07348930090665817, 0.07875953614711761, 0.08402977138757706, 0.0893000066280365, 0.09457024931907654, 0.09984047710895538, 0.10511071979999542, 0.11038095504045486, 0.1156511902809143, 0.12092142552137375, 0.1261916607618332, 0.13146190345287323, 0.13673213124275208, 0.14200237393379211, 0.14727260172367096, 0.152542844414711, 0.15781307220458984, 0.16308331489562988]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 20.0, 6.0, 13.0, 13.0, 28.0, 33.0, 42.0, 61.0, 70.0, 110.0, 183.0, 232.0, 443.0, 848.0, 1980.0, 5429.0, 26903.0, 918887.0, 78919.0, 8975.0, 2687.0, 1090.0, 566.0, 355.0, 203.0, 119.0, 91.0, 63.0, 42.0, 26.0, 28.0, 14.0, 15.0, 11.0, 9.0, 8.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.935546875, -0.9029388427734375, -0.870330810546875, -0.8377227783203125, -0.80511474609375, -0.7725067138671875, -0.739898681640625, -0.7072906494140625, -0.6746826171875, -0.6420745849609375, -0.609466552734375, -0.5768585205078125, -0.54425048828125, -0.5116424560546875, -0.479034423828125, -0.4464263916015625, -0.413818359375, -0.3812103271484375, -0.348602294921875, -0.3159942626953125, -0.28338623046875, -0.2507781982421875, -0.218170166015625, -0.1855621337890625, -0.1529541015625, -0.1203460693359375, -0.087738037109375, -0.0551300048828125, -0.02252197265625, 0.0100860595703125, 0.042694091796875, 0.0753021240234375, 0.10791015625, 0.1405181884765625, 0.173126220703125, 0.2057342529296875, 0.23834228515625, 0.2709503173828125, 0.303558349609375, 0.3361663818359375, 0.3687744140625, 0.4013824462890625, 0.433990478515625, 0.4665985107421875, 0.49920654296875, 0.5318145751953125, 0.564422607421875, 0.5970306396484375, 0.629638671875, 0.6622467041015625, 0.694854736328125, 0.7274627685546875, 0.76007080078125, 0.7926788330078125, 0.825286865234375, 0.8578948974609375, 0.8905029296875, 0.9231109619140625, 0.955718994140625, 0.9883270263671875, 1.02093505859375, 1.0535430908203125, 1.086151123046875, 1.1187591552734375, 1.1513671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 6.0, 15.0, 16.0, 33.0, 45.0, 71.0, 148.0, 349.0, 130.0, 74.0, 43.0, 16.0, 13.0, 9.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16455078125, -0.1587677001953125, -0.152984619140625, -0.1472015380859375, -0.14141845703125, -0.1356353759765625, -0.129852294921875, -0.1240692138671875, -0.1182861328125, -0.1125030517578125, -0.106719970703125, -0.1009368896484375, -0.09515380859375, -0.0893707275390625, -0.083587646484375, -0.0778045654296875, -0.072021484375, -0.0662384033203125, -0.060455322265625, -0.0546722412109375, -0.04888916015625, -0.0431060791015625, -0.037322998046875, -0.0315399169921875, -0.0257568359375, -0.0199737548828125, -0.014190673828125, -0.0084075927734375, -0.00262451171875, 0.0031585693359375, 0.008941650390625, 0.0147247314453125, 0.0205078125, 0.0262908935546875, 0.032073974609375, 0.0378570556640625, 0.04364013671875, 0.0494232177734375, 0.055206298828125, 0.0609893798828125, 0.0667724609375, 0.0725555419921875, 0.078338623046875, 0.0841217041015625, 0.08990478515625, 0.0956878662109375, 0.101470947265625, 0.1072540283203125, 0.113037109375, 0.1188201904296875, 0.124603271484375, 0.1303863525390625, 0.13616943359375, 0.1419525146484375, 0.147735595703125, 0.1535186767578125, 0.1593017578125, 0.1650848388671875, 0.170867919921875, 0.1766510009765625, 0.18243408203125, 0.1882171630859375, 0.194000244140625, 0.1997833251953125, 0.20556640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 10.0, 5.0, 9.0, 10.0, 11.0, 19.0, 25.0, 19.0, 24.0, 42.0, 58.0, 60.0, 74.0, 99.0, 129.0, 158.0, 298.0, 502.0, 1082.0, 3567.0, 17496.0, 118066.0, 580559.0, 276644.0, 39093.0, 6949.0, 1672.0, 678.0, 325.0, 215.0, 143.0, 117.0, 79.0, 64.0, 55.0, 32.0, 36.0, 26.0, 23.0, 11.0, 16.0, 7.0, 15.0, 7.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.2249755859375, -0.2176513671875, -0.2103271484375, -0.2030029296875, -0.1956787109375, -0.1883544921875, -0.1810302734375, -0.1737060546875, -0.1663818359375, -0.1590576171875, -0.1517333984375, -0.1444091796875, -0.1370849609375, -0.1297607421875, -0.1224365234375, -0.1151123046875, -0.1077880859375, -0.1004638671875, -0.0931396484375, -0.0858154296875, -0.0784912109375, -0.0711669921875, -0.0638427734375, -0.0565185546875, -0.0491943359375, -0.0418701171875, -0.0345458984375, -0.0272216796875, -0.0198974609375, -0.0125732421875, -0.0052490234375, 0.0020751953125, 0.0093994140625, 0.0167236328125, 0.0240478515625, 0.0313720703125, 0.0386962890625, 0.0460205078125, 0.0533447265625, 0.0606689453125, 0.0679931640625, 0.0753173828125, 0.0826416015625, 0.0899658203125, 0.0972900390625, 0.1046142578125, 0.1119384765625, 0.1192626953125, 0.1265869140625, 0.1339111328125, 0.1412353515625, 0.1485595703125, 0.1558837890625, 0.1632080078125, 0.1705322265625, 0.1778564453125, 0.1851806640625, 0.1925048828125, 0.1998291015625, 0.2071533203125, 0.2144775390625, 0.2218017578125, 0.2291259765625, 0.2364501953125, 0.2437744140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 3.0, 1.0, 7.0, 3.0, 9.0, 15.0, 13.0, 21.0, 20.0, 20.0, 15.0, 34.0, 25.0, 34.0, 28.0, 39.0, 34.0, 41.0, 40.0, 38.0, 28.0, 36.0, 57.0, 38.0, 39.0, 25.0, 37.0, 31.0, 29.0, 38.0, 32.0, 33.0, 25.0, 18.0, 17.0, 11.0, 16.0, 12.0, 7.0, 9.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1937255859375, -0.18821144104003906, -0.18269729614257812, -0.1771831512451172, -0.17166900634765625, -0.1661548614501953, -0.16064071655273438, -0.15512657165527344, -0.1496124267578125, -0.14409828186035156, -0.13858413696289062, -0.1330699920654297, -0.12755584716796875, -0.12204170227050781, -0.11652755737304688, -0.11101341247558594, -0.105499267578125, -0.09998512268066406, -0.09447097778320312, -0.08895683288574219, -0.08344268798828125, -0.07792854309082031, -0.07241439819335938, -0.06690025329589844, -0.0613861083984375, -0.05587196350097656, -0.050357818603515625, -0.04484367370605469, -0.03932952880859375, -0.03381538391113281, -0.028301239013671875, -0.022787094116210938, -0.01727294921875, -0.011758804321289062, -0.006244659423828125, -0.0007305145263671875, 0.00478363037109375, 0.010297775268554688, 0.015811920166015625, 0.021326065063476562, 0.0268402099609375, 0.03235435485839844, 0.037868499755859375, 0.04338264465332031, 0.04889678955078125, 0.05441093444824219, 0.059925079345703125, 0.06543922424316406, 0.070953369140625, 0.07646751403808594, 0.08198165893554688, 0.08749580383300781, 0.09300994873046875, 0.09852409362792969, 0.10403823852539062, 0.10955238342285156, 0.1150665283203125, 0.12058067321777344, 0.12609481811523438, 0.1316089630126953, 0.13712310791015625, 0.1426372528076172, 0.14815139770507812, 0.15366554260253906, 0.1591796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 8.0, 13.0, 12.0, 13.0, 31.0, 31.0, 40.0, 74.0, 95.0, 155.0, 246.0, 317.0, 531.0, 806.0, 1286.0, 2280.0, 4024.0, 7766.0, 16500.0, 40266.0, 116127.0, 370705.0, 320975.0, 99847.0, 35391.0, 14918.0, 7134.0, 3678.0, 1959.0, 1146.0, 740.0, 448.0, 312.0, 202.0, 141.0, 82.0, 56.0, 53.0, 42.0, 34.0, 8.0, 14.0, 11.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.06536865234375, -0.06325531005859375, -0.0611419677734375, -0.05902862548828125, -0.056915283203125, -0.05480194091796875, -0.0526885986328125, -0.05057525634765625, -0.0484619140625, -0.04634857177734375, -0.0442352294921875, -0.04212188720703125, -0.040008544921875, -0.03789520263671875, -0.0357818603515625, -0.03366851806640625, -0.03155517578125, -0.02944183349609375, -0.0273284912109375, -0.02521514892578125, -0.023101806640625, -0.02098846435546875, -0.0188751220703125, -0.01676177978515625, -0.0146484375, -0.01253509521484375, -0.0104217529296875, -0.00830841064453125, -0.006195068359375, -0.00408172607421875, -0.0019683837890625, 0.00014495849609375, 0.00225830078125, 0.00437164306640625, 0.0064849853515625, 0.00859832763671875, 0.010711669921875, 0.01282501220703125, 0.0149383544921875, 0.01705169677734375, 0.0191650390625, 0.02127838134765625, 0.0233917236328125, 0.02550506591796875, 0.027618408203125, 0.02973175048828125, 0.0318450927734375, 0.03395843505859375, 0.03607177734375, 0.03818511962890625, 0.0402984619140625, 0.04241180419921875, 0.044525146484375, 0.04663848876953125, 0.0487518310546875, 0.05086517333984375, 0.052978515625, 0.05509185791015625, 0.0572052001953125, 0.05931854248046875, 0.061431884765625, 0.06354522705078125, 0.0656585693359375, 0.06777191162109375, 0.06988525390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 5.0, 6.0, 8.0, 9.0, 14.0, 24.0, 19.0, 33.0, 37.0, 52.0, 54.0, 63.0, 92.0, 67.0, 110.0, 81.0, 82.0, 54.0, 43.0, 37.0, 14.0, 29.0, 15.0, 10.0, 4.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1622905731201172e-05, -1.1298805475234985e-05, -1.0974705219268799e-05, -1.0650604963302612e-05, -1.0326504707336426e-05, -1.000240445137024e-05, -9.678304195404053e-06, -9.354203939437866e-06, -9.03010368347168e-06, -8.706003427505493e-06, -8.381903171539307e-06, -8.05780291557312e-06, -7.733702659606934e-06, -7.409602403640747e-06, -7.0855021476745605e-06, -6.761401891708374e-06, -6.4373016357421875e-06, -6.113201379776001e-06, -5.7891011238098145e-06, -5.465000867843628e-06, -5.140900611877441e-06, -4.816800355911255e-06, -4.492700099945068e-06, -4.168599843978882e-06, -3.844499588012695e-06, -3.520399332046509e-06, -3.1962990760803223e-06, -2.8721988201141357e-06, -2.5480985641479492e-06, -2.2239983081817627e-06, -1.8998980522155762e-06, -1.5757977962493896e-06, -1.2516975402832031e-06, -9.275972843170166e-07, -6.034970283508301e-07, -2.7939677238464355e-07, 4.470348358154297e-08, 3.688037395477295e-07, 6.92903995513916e-07, 1.0170042514801025e-06, 1.341104507446289e-06, 1.6652047634124756e-06, 1.989305019378662e-06, 2.3134052753448486e-06, 2.637505531311035e-06, 2.9616057872772217e-06, 3.285706043243408e-06, 3.6098062992095947e-06, 3.933906555175781e-06, 4.258006811141968e-06, 4.582107067108154e-06, 4.906207323074341e-06, 5.230307579040527e-06, 5.554407835006714e-06, 5.8785080909729e-06, 6.202608346939087e-06, 6.5267086029052734e-06, 6.85080885887146e-06, 7.1749091148376465e-06, 7.499009370803833e-06, 7.82310962677002e-06, 8.147209882736206e-06, 8.471310138702393e-06, 8.795410394668579e-06, 9.119510650634766e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 11.0, 11.0, 13.0, 26.0, 21.0, 31.0, 55.0, 106.0, 131.0, 220.0, 399.0, 779.0, 1422.0, 2902.0, 6949.0, 20941.0, 82015.0, 404445.0, 410161.0, 83400.0, 21181.0, 7127.0, 2952.0, 1452.0, 725.0, 402.0, 242.0, 154.0, 85.0, 51.0, 45.0, 33.0, 20.0, 12.0, 7.0, 7.0, 7.0, 3.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09063720703125, -0.08804798126220703, -0.08545875549316406, -0.0828695297241211, -0.08028030395507812, -0.07769107818603516, -0.07510185241699219, -0.07251262664794922, -0.06992340087890625, -0.06733417510986328, -0.06474494934082031, -0.062155723571777344, -0.059566497802734375, -0.056977272033691406, -0.05438804626464844, -0.05179882049560547, -0.0492095947265625, -0.04662036895751953, -0.04403114318847656, -0.041441917419433594, -0.038852691650390625, -0.036263465881347656, -0.03367424011230469, -0.03108501434326172, -0.02849578857421875, -0.02590656280517578, -0.023317337036132812, -0.020728111267089844, -0.018138885498046875, -0.015549659729003906, -0.012960433959960938, -0.010371208190917969, -0.007781982421875, -0.005192756652832031, -0.0026035308837890625, -1.430511474609375e-05, 0.002574920654296875, 0.005164146423339844, 0.0077533721923828125, 0.010342597961425781, 0.01293182373046875, 0.015521049499511719, 0.018110275268554688, 0.020699501037597656, 0.023288726806640625, 0.025877952575683594, 0.028467178344726562, 0.03105640411376953, 0.0336456298828125, 0.03623485565185547, 0.03882408142089844, 0.041413307189941406, 0.044002532958984375, 0.046591758728027344, 0.04918098449707031, 0.05177021026611328, 0.05435943603515625, 0.05694866180419922, 0.05953788757324219, 0.062127113342285156, 0.06471633911132812, 0.0673055648803711, 0.06989479064941406, 0.07248401641845703, 0.0750732421875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 11.0, 12.0, 16.0, 21.0, 28.0, 39.0, 35.0, 39.0, 55.0, 54.0, 62.0, 69.0, 88.0, 80.0, 60.0, 50.0, 46.0, 34.0, 38.0, 28.0, 26.0, 19.0, 11.0, 9.0, 7.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0458984375, -0.04403400421142578, -0.04216957092285156, -0.040305137634277344, -0.038440704345703125, -0.036576271057128906, -0.03471183776855469, -0.03284740447998047, -0.03098297119140625, -0.02911853790283203, -0.027254104614257812, -0.025389671325683594, -0.023525238037109375, -0.021660804748535156, -0.019796371459960938, -0.01793193817138672, -0.0160675048828125, -0.014203071594238281, -0.012338638305664062, -0.010474205017089844, -0.008609771728515625, -0.006745338439941406, -0.0048809051513671875, -0.0030164718627929688, -0.00115203857421875, 0.0007123947143554688, 0.0025768280029296875, 0.004441261291503906, 0.006305694580078125, 0.008170127868652344, 0.010034561157226562, 0.011898994445800781, 0.013763427734375, 0.01562786102294922, 0.017492294311523438, 0.019356727600097656, 0.021221160888671875, 0.023085594177246094, 0.024950027465820312, 0.02681446075439453, 0.02867889404296875, 0.03054332733154297, 0.03240776062011719, 0.034272193908691406, 0.036136627197265625, 0.038001060485839844, 0.03986549377441406, 0.04172992706298828, 0.0435943603515625, 0.04545879364013672, 0.04732322692871094, 0.049187660217285156, 0.051052093505859375, 0.052916526794433594, 0.05478096008300781, 0.05664539337158203, 0.05850982666015625, 0.06037425994873047, 0.06223869323730469, 0.0641031265258789, 0.06596755981445312, 0.06783199310302734, 0.06969642639160156, 0.07156085968017578, 0.07342529296875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 10.0, 29.0, 60.0, 167.0, 390.0, 261.0, 68.0, 17.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.976993560791016, -4.872744560241699, -4.768496036529541, -4.664247035980225, -4.559998512268066, -4.45574951171875, -4.351500988006592, -4.247251987457275, -4.143003463745117, -4.038754463195801, -3.9345059394836426, -3.8302571773529053, -3.726008415222168, -3.6217594146728516, -3.5175106525421143, -3.413261890411377, -3.3090128898620605, -3.2047641277313232, -3.100515365600586, -2.9962666034698486, -2.8920178413391113, -2.787768840789795, -2.6835200786590576, -2.5792713165283203, -2.475022554397583, -2.3707737922668457, -2.2665250301361084, -2.162276268005371, -2.0580272674560547, -1.953778624534607, -1.84952974319458, -1.7452809810638428, -1.6410322189331055, -1.5367834568023682, -1.4325346946716309, -1.328285813331604, -1.2240370512008667, -1.1197882890701294, -1.0155394077301025, -0.9112906455993652, -0.8070418834686279, -0.7027931213378906, -0.5985442996025085, -0.49429550766944885, -0.39004671573638916, -0.28579795360565186, -0.18154913187026978, -0.0773003101348877, 0.02694845199584961, 0.1311972439289093, 0.235446035861969, 0.3396948277950287, 0.4439436197280884, 0.5481923818588257, 0.6524412035942078, 0.7566900253295898, 0.8609387874603271, 0.9651875495910645, 1.0694363117218018, 1.1736851930618286, 1.277933955192566, 1.3821827173233032, 1.48643159866333, 1.5906803607940674, 1.6949291229248047]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 7.0, 17.0, 22.0, 26.0, 25.0, 46.0, 32.0, 39.0, 42.0, 48.0, 53.0, 54.0, 62.0, 46.0, 51.0, 56.0, 43.0, 51.0, 42.0, 33.0, 34.0, 34.0, 36.0, 21.0, 25.0, 14.0, 18.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8114482164382935, -1.7571368217468262, -1.7028255462646484, -1.6485141515731812, -1.5942028760910034, -1.5398914813995361, -1.4855802059173584, -1.4312688112258911, -1.3769574165344238, -1.3226460218429565, -1.2683347463607788, -1.2140233516693115, -1.1597120761871338, -1.1054006814956665, -1.0510892868041992, -0.9967780113220215, -0.9424667358398438, -0.8881554007530212, -0.8338440656661987, -0.7795326709747314, -0.7252213954925537, -0.6709100008010864, -0.6165986657142639, -0.5622873306274414, -0.5079759955406189, -0.4536646604537964, -0.3993533253669739, -0.345041960477829, -0.29073062539100647, -0.23641929030418396, -0.18210792541503906, -0.12779659032821655, -0.0734853744506836, -0.019174031913280487, 0.03513731062412262, 0.08944866061210632, 0.14375999569892883, 0.19807133078575134, 0.25238269567489624, 0.30669403076171875, 0.36100536584854126, 0.41531670093536377, 0.4696280360221863, 0.5239393711090088, 0.5782507658004761, 0.6325620412826538, 0.6868734359741211, 0.7411847710609436, 0.7954961061477661, 0.8498074412345886, 0.9041187763214111, 0.9584301710128784, 1.0127414464950562, 1.0670528411865234, 1.1213641166687012, 1.1756755113601685, 1.2299869060516357, 1.284298300743103, 1.3386095762252808, 1.392920970916748, 1.4472322463989258, 1.501543641090393, 1.5558550357818604, 1.610166311264038, 1.6644775867462158]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 7.0, 2.0, 1.0, 8.0, 14.0, 15.0, 22.0, 36.0, 56.0, 164.0, 915.0, 1450033.0, 2741716.0, 927.0, 178.0, 75.0, 44.0, 21.0, 17.0, 9.0, 9.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.908203125, -0.87188720703125, -0.8355712890625, -0.79925537109375, -0.762939453125, -0.72662353515625, -0.6903076171875, -0.65399169921875, -0.61767578125, -0.58135986328125, -0.5450439453125, -0.50872802734375, -0.472412109375, -0.43609619140625, -0.3997802734375, -0.36346435546875, -0.3271484375, -0.29083251953125, -0.2545166015625, -0.21820068359375, -0.181884765625, -0.14556884765625, -0.1092529296875, -0.07293701171875, -0.03662109375, -0.00030517578125, 0.0360107421875, 0.07232666015625, 0.108642578125, 0.14495849609375, 0.1812744140625, 0.21759033203125, 0.25390625, 0.29022216796875, 0.3265380859375, 0.36285400390625, 0.399169921875, 0.43548583984375, 0.4718017578125, 0.50811767578125, 0.54443359375, 0.58074951171875, 0.6170654296875, 0.65338134765625, 0.689697265625, 0.72601318359375, 0.7623291015625, 0.79864501953125, 0.8349609375, 0.87127685546875, 0.9075927734375, 0.94390869140625, 0.980224609375, 1.01654052734375, 1.0528564453125, 1.08917236328125, 1.12548828125, 1.16180419921875, 1.1981201171875, 1.23443603515625, 1.270751953125, 1.30706787109375, 1.3433837890625, 1.37969970703125, 1.416015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 16.0, 24.0, 33.0, 49.0, 105.0, 147.0, 187.0, 160.0, 97.0, 59.0, 37.0, 15.0, 19.0, 6.0, 15.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1231689453125, -0.11816215515136719, -0.11315536499023438, -0.10814857482910156, -0.10314178466796875, -0.09813499450683594, -0.09312820434570312, -0.08812141418457031, -0.0831146240234375, -0.07810783386230469, -0.07310104370117188, -0.06809425354003906, -0.06308746337890625, -0.05808067321777344, -0.053073883056640625, -0.04806709289550781, -0.043060302734375, -0.03805351257324219, -0.033046722412109375, -0.028039932250976562, -0.02303314208984375, -0.018026351928710938, -0.013019561767578125, -0.008012771606445312, -0.0030059814453125, 0.0020008087158203125, 0.007007598876953125, 0.012014389038085938, 0.01702117919921875, 0.022027969360351562, 0.027034759521484375, 0.03204154968261719, 0.03704833984375, 0.04205513000488281, 0.047061920166015625, 0.05206871032714844, 0.05707550048828125, 0.06208229064941406, 0.06708908081054688, 0.07209587097167969, 0.0771026611328125, 0.08210945129394531, 0.08711624145507812, 0.09212303161621094, 0.09712982177734375, 0.10213661193847656, 0.10714340209960938, 0.11215019226074219, 0.117156982421875, 0.12216377258300781, 0.12717056274414062, 0.13217735290527344, 0.13718414306640625, 0.14219093322753906, 0.14719772338867188, 0.1522045135498047, 0.1572113037109375, 0.1622180938720703, 0.16722488403320312, 0.17223167419433594, 0.17723846435546875, 0.18224525451660156, 0.18725204467773438, 0.1922588348388672, 0.197265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 11.0, 13.0, 18.0, 25.0, 30.0, 37.0, 54.0, 75.0, 161.0, 299.0, 1011.0, 4042.0, 24739.0, 423824.0, 3622569.0, 102968.0, 11047.0, 2188.0, 612.0, 235.0, 118.0, 63.0, 27.0, 25.0, 14.0, 11.0, 14.0, 8.0, 3.0, 4.0, 6.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.439453125, -0.42930030822753906, -0.4191474914550781, -0.4089946746826172, -0.39884185791015625, -0.3886890411376953, -0.3785362243652344, -0.36838340759277344, -0.3582305908203125, -0.34807777404785156, -0.3379249572753906, -0.3277721405029297, -0.31761932373046875, -0.3074665069580078, -0.2973136901855469, -0.28716087341308594, -0.277008056640625, -0.26685523986816406, -0.2567024230957031, -0.2465496063232422, -0.23639678955078125, -0.2262439727783203, -0.21609115600585938, -0.20593833923339844, -0.1957855224609375, -0.18563270568847656, -0.17547988891601562, -0.1653270721435547, -0.15517425537109375, -0.1450214385986328, -0.13486862182617188, -0.12471580505371094, -0.11456298828125, -0.10441017150878906, -0.09425735473632812, -0.08410453796386719, -0.07395172119140625, -0.06379890441894531, -0.053646087646484375, -0.04349327087402344, -0.0333404541015625, -0.023187637329101562, -0.013034820556640625, -0.0028820037841796875, 0.00727081298828125, 0.017423629760742188, 0.027576446533203125, 0.03772926330566406, 0.047882080078125, 0.05803489685058594, 0.06818771362304688, 0.07834053039550781, 0.08849334716796875, 0.09864616394042969, 0.10879898071289062, 0.11895179748535156, 0.1291046142578125, 0.13925743103027344, 0.14941024780273438, 0.1595630645751953, 0.16971588134765625, 0.1798686981201172, 0.19002151489257812, 0.20017433166503906, 0.2103271484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 1.0, 5.0, 5.0, 7.0, 8.0, 14.0, 13.0, 11.0, 22.0, 34.0, 21.0, 42.0, 53.0, 62.0, 102.0, 144.0, 209.0, 411.0, 739.0, 946.0, 510.0, 295.0, 165.0, 76.0, 61.0, 33.0, 19.0, 15.0, 10.0, 6.0, 5.0, 8.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1312255859375, -0.1279773712158203, -0.12472915649414062, -0.12148094177246094, -0.11823272705078125, -0.11498451232910156, -0.11173629760742188, -0.10848808288574219, -0.1052398681640625, -0.10199165344238281, -0.09874343872070312, -0.09549522399902344, -0.09224700927734375, -0.08899879455566406, -0.08575057983398438, -0.08250236511230469, -0.079254150390625, -0.07600593566894531, -0.07275772094726562, -0.06950950622558594, -0.06626129150390625, -0.06301307678222656, -0.059764862060546875, -0.05651664733886719, -0.0532684326171875, -0.05002021789550781, -0.046772003173828125, -0.04352378845214844, -0.04027557373046875, -0.03702735900878906, -0.033779144287109375, -0.030530929565429688, -0.02728271484375, -0.024034500122070312, -0.020786285400390625, -0.017538070678710938, -0.01428985595703125, -0.011041641235351562, -0.007793426513671875, -0.0045452117919921875, -0.0012969970703125, 0.0019512176513671875, 0.005199432373046875, 0.008447647094726562, 0.01169586181640625, 0.014944076538085938, 0.018192291259765625, 0.021440505981445312, 0.024688720703125, 0.027936935424804688, 0.031185150146484375, 0.03443336486816406, 0.03768157958984375, 0.04092979431152344, 0.044178009033203125, 0.04742622375488281, 0.0506744384765625, 0.05392265319824219, 0.057170867919921875, 0.06041908264160156, 0.06366729736328125, 0.06691551208496094, 0.07016372680664062, 0.07341194152832031, 0.07666015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 697.0, 310.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.005799770355225, -3.782850980758667, -3.5599021911621094, -3.3369534015655518, -3.114004611968994, -2.8910558223724365, -2.668107032775879, -2.4451582431793213, -2.2222094535827637, -1.999260663986206, -1.7763118743896484, -1.5533630847930908, -1.3304142951965332, -1.1074655055999756, -0.884516716003418, -0.6615679264068604, -0.43861913681030273, -0.21567034721374512, 0.0072784423828125, 0.23022723197937012, 0.45317602157592773, 0.6761248111724854, 0.899073600769043, 1.1220223903656006, 1.3449711799621582, 1.5679199695587158, 1.7908687591552734, 2.013817548751831, 2.2367663383483887, 2.4597151279449463, 2.682663917541504, 2.9056127071380615, 3.1285619735717773, 3.351510763168335, 3.5744595527648926, 3.79740834236145, 4.020357131958008, 4.2433061599731445, 4.466254711151123, 4.689203262329102, 4.912152290344238, 5.135101318359375, 5.3580498695373535, 5.580998420715332, 5.803947448730469, 6.0268964767456055, 6.249845027923584, 6.4727935791015625, 6.695742607116699, 6.918691635131836, 7.1416401863098145, 7.364588737487793, 7.58753776550293, 7.810486793518066, 8.033435821533203, 8.256383895874023, 8.47933292388916, 8.702281951904297, 8.925230026245117, 9.148179054260254, 9.37112808227539, 9.594077110290527, 9.817026138305664, 10.039974212646484, 10.262923240661621]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 8.0, 12.0, 11.0, 15.0, 19.0, 32.0, 45.0, 34.0, 52.0, 55.0, 60.0, 60.0, 64.0, 52.0, 56.0, 53.0, 52.0, 49.0, 42.0, 47.0, 38.0, 37.0, 34.0, 16.0, 15.0, 11.0, 7.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4416899085044861, -0.42432186007499695, -0.4069538116455078, -0.3895857632160187, -0.37221771478652954, -0.3548496663570404, -0.33748161792755127, -0.32011356949806213, -0.302745521068573, -0.28537747263908386, -0.2680094242095947, -0.2506413757801056, -0.23327332735061646, -0.21590527892112732, -0.19853723049163818, -0.18116918206214905, -0.1638011336326599, -0.14643308520317078, -0.12906503677368164, -0.1116969883441925, -0.09432893991470337, -0.07696089148521423, -0.0595928430557251, -0.04222479462623596, -0.024856746196746826, -0.00748869776725769, 0.009879350662231445, 0.02724739909172058, 0.04461544752120972, 0.06198349595069885, 0.07935154438018799, 0.09671959280967712, 0.11408764123916626, 0.1314556896686554, 0.14882373809814453, 0.16619178652763367, 0.1835598349571228, 0.20092788338661194, 0.21829593181610107, 0.2356639802455902, 0.25303202867507935, 0.2704000771045685, 0.2877681255340576, 0.30513617396354675, 0.3225042223930359, 0.339872270822525, 0.35724031925201416, 0.3746083676815033, 0.39197641611099243, 0.40934446454048157, 0.4267125129699707, 0.44408056139945984, 0.461448609828949, 0.4788166582584381, 0.49618470668792725, 0.5135527849197388, 0.5309208035469055, 0.5482888221740723, 0.5656569004058838, 0.5830249786376953, 0.6003929972648621, 0.6177610158920288, 0.6351290941238403, 0.6524971723556519, 0.6698651909828186]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 9.0, 9.0, 12.0, 8.0, 26.0, 26.0, 35.0, 63.0, 78.0, 147.0, 199.0, 373.0, 739.0, 1745.0, 5872.0, 30044.0, 298410.0, 639332.0, 57376.0, 9481.0, 2513.0, 938.0, 424.0, 260.0, 139.0, 103.0, 61.0, 40.0, 29.0, 17.0, 7.0, 12.0, 14.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287841796875, -0.27724456787109375, -0.2666473388671875, -0.25605010986328125, -0.245452880859375, -0.23485565185546875, -0.2242584228515625, -0.21366119384765625, -0.20306396484375, -0.19246673583984375, -0.1818695068359375, -0.17127227783203125, -0.160675048828125, -0.15007781982421875, -0.1394805908203125, -0.12888336181640625, -0.1182861328125, -0.10768890380859375, -0.0970916748046875, -0.08649444580078125, -0.075897216796875, -0.06529998779296875, -0.0547027587890625, -0.04410552978515625, -0.03350830078125, -0.02291107177734375, -0.0123138427734375, -0.00171661376953125, 0.008880615234375, 0.01947784423828125, 0.0300750732421875, 0.04067230224609375, 0.05126953125, 0.06186676025390625, 0.0724639892578125, 0.08306121826171875, 0.093658447265625, 0.10425567626953125, 0.1148529052734375, 0.12545013427734375, 0.13604736328125, 0.14664459228515625, 0.1572418212890625, 0.16783905029296875, 0.178436279296875, 0.18903350830078125, 0.1996307373046875, 0.21022796630859375, 0.2208251953125, 0.23142242431640625, 0.2420196533203125, 0.25261688232421875, 0.263214111328125, 0.27381134033203125, 0.2844085693359375, 0.29500579833984375, 0.30560302734375, 0.31620025634765625, 0.3267974853515625, 0.33739471435546875, 0.347991943359375, 0.35858917236328125, 0.3691864013671875, 0.37978363037109375, 0.390380859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 7.0, 10.0, 7.0, 22.0, 29.0, 29.0, 49.0, 91.0, 119.0, 169.0, 158.0, 117.0, 66.0, 43.0, 21.0, 19.0, 20.0, 9.0, 9.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11322021484375, -0.10846805572509766, -0.10371589660644531, -0.09896373748779297, -0.09421157836914062, -0.08945941925048828, -0.08470726013183594, -0.0799551010131836, -0.07520294189453125, -0.0704507827758789, -0.06569862365722656, -0.06094646453857422, -0.056194305419921875, -0.05144214630126953, -0.04668998718261719, -0.041937828063964844, -0.0371856689453125, -0.032433509826660156, -0.027681350708007812, -0.02292919158935547, -0.018177032470703125, -0.013424873352050781, -0.008672714233398438, -0.003920555114746094, 0.00083160400390625, 0.005583763122558594, 0.010335922241210938, 0.015088081359863281, 0.019840240478515625, 0.02459239959716797, 0.029344558715820312, 0.034096717834472656, 0.038848876953125, 0.043601036071777344, 0.04835319519042969, 0.05310535430908203, 0.057857513427734375, 0.06260967254638672, 0.06736183166503906, 0.0721139907836914, 0.07686614990234375, 0.0816183090209961, 0.08637046813964844, 0.09112262725830078, 0.09587478637695312, 0.10062694549560547, 0.10537910461425781, 0.11013126373291016, 0.1148834228515625, 0.11963558197021484, 0.12438774108886719, 0.12913990020751953, 0.13389205932617188, 0.13864421844482422, 0.14339637756347656, 0.1481485366821289, 0.15290069580078125, 0.1576528549194336, 0.16240501403808594, 0.16715717315673828, 0.17190933227539062, 0.17666149139404297, 0.1814136505126953, 0.18616580963134766, 0.19091796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 7.0, 6.0, 8.0, 18.0, 13.0, 15.0, 14.0, 20.0, 20.0, 29.0, 23.0, 36.0, 34.0, 43.0, 45.0, 55.0, 127.0, 554.0, 9230.0, 890338.0, 145033.0, 2181.0, 295.0, 84.0, 58.0, 43.0, 22.0, 31.0, 33.0, 18.0, 22.0, 22.0, 13.0, 13.0, 11.0, 11.0, 6.0, 5.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8560028076171875, -0.826263427734375, -0.7965240478515625, -0.76678466796875, -0.7370452880859375, -0.707305908203125, -0.6775665283203125, -0.6478271484375, -0.6180877685546875, -0.588348388671875, -0.5586090087890625, -0.52886962890625, -0.4991302490234375, -0.469390869140625, -0.4396514892578125, -0.409912109375, -0.3801727294921875, -0.350433349609375, -0.3206939697265625, -0.29095458984375, -0.2612152099609375, -0.231475830078125, -0.2017364501953125, -0.1719970703125, -0.1422576904296875, -0.112518310546875, -0.0827789306640625, -0.05303955078125, -0.0233001708984375, 0.006439208984375, 0.0361785888671875, 0.06591796875, 0.0956573486328125, 0.125396728515625, 0.1551361083984375, 0.18487548828125, 0.2146148681640625, 0.244354248046875, 0.2740936279296875, 0.3038330078125, 0.3335723876953125, 0.363311767578125, 0.3930511474609375, 0.42279052734375, 0.4525299072265625, 0.482269287109375, 0.5120086669921875, 0.541748046875, 0.5714874267578125, 0.601226806640625, 0.6309661865234375, 0.66070556640625, 0.6904449462890625, 0.720184326171875, 0.7499237060546875, 0.7796630859375, 0.8094024658203125, 0.839141845703125, 0.8688812255859375, 0.89862060546875, 0.9283599853515625, 0.958099365234375, 0.9878387451171875, 1.017578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 12.0, 10.0, 18.0, 14.0, 16.0, 19.0, 23.0, 24.0, 30.0, 41.0, 30.0, 43.0, 38.0, 38.0, 33.0, 46.0, 43.0, 43.0, 48.0, 41.0, 39.0, 36.0, 56.0, 30.0, 26.0, 27.0, 27.0, 28.0, 26.0, 12.0, 12.0, 13.0, 16.0, 7.0, 2.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.160888671875, -0.15545082092285156, -0.15001296997070312, -0.1445751190185547, -0.13913726806640625, -0.1336994171142578, -0.12826156616210938, -0.12282371520996094, -0.1173858642578125, -0.11194801330566406, -0.10651016235351562, -0.10107231140136719, -0.09563446044921875, -0.09019660949707031, -0.08475875854492188, -0.07932090759277344, -0.073883056640625, -0.06844520568847656, -0.06300735473632812, -0.05756950378417969, -0.05213165283203125, -0.04669380187988281, -0.041255950927734375, -0.03581809997558594, -0.0303802490234375, -0.024942398071289062, -0.019504547119140625, -0.014066696166992188, -0.00862884521484375, -0.0031909942626953125, 0.002246856689453125, 0.0076847076416015625, 0.01312255859375, 0.018560409545898438, 0.023998260498046875, 0.029436111450195312, 0.03487396240234375, 0.04031181335449219, 0.045749664306640625, 0.05118751525878906, 0.0566253662109375, 0.06206321716308594, 0.06750106811523438, 0.07293891906738281, 0.07837677001953125, 0.08381462097167969, 0.08925247192382812, 0.09469032287597656, 0.100128173828125, 0.10556602478027344, 0.11100387573242188, 0.11644172668457031, 0.12187957763671875, 0.1273174285888672, 0.13275527954101562, 0.13819313049316406, 0.1436309814453125, 0.14906883239746094, 0.15450668334960938, 0.1599445343017578, 0.16538238525390625, 0.1708202362060547, 0.17625808715820312, 0.18169593811035156, 0.1871337890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 11.0, 12.0, 17.0, 27.0, 32.0, 52.0, 91.0, 163.0, 271.0, 475.0, 923.0, 1896.0, 4327.0, 11128.0, 36516.0, 182085.0, 632592.0, 132465.0, 29001.0, 9235.0, 3681.0, 1720.0, 826.0, 431.0, 205.0, 116.0, 88.0, 40.0, 36.0, 22.0, 22.0, 11.0, 13.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1361083984375, -0.1322650909423828, -0.12842178344726562, -0.12457847595214844, -0.12073516845703125, -0.11689186096191406, -0.11304855346679688, -0.10920524597167969, -0.1053619384765625, -0.10151863098144531, -0.09767532348632812, -0.09383201599121094, -0.08998870849609375, -0.08614540100097656, -0.08230209350585938, -0.07845878601074219, -0.074615478515625, -0.07077217102050781, -0.06692886352539062, -0.06308555603027344, -0.05924224853515625, -0.05539894104003906, -0.051555633544921875, -0.04771232604980469, -0.0438690185546875, -0.04002571105957031, -0.036182403564453125, -0.03233909606933594, -0.02849578857421875, -0.024652481079101562, -0.020809173583984375, -0.016965866088867188, -0.01312255859375, -0.009279251098632812, -0.005435943603515625, -0.0015926361083984375, 0.00225067138671875, 0.0060939788818359375, 0.009937286376953125, 0.013780593872070312, 0.0176239013671875, 0.021467208862304688, 0.025310516357421875, 0.029153823852539062, 0.03299713134765625, 0.03684043884277344, 0.040683746337890625, 0.04452705383300781, 0.048370361328125, 0.05221366882324219, 0.056056976318359375, 0.05990028381347656, 0.06374359130859375, 0.06758689880371094, 0.07143020629882812, 0.07527351379394531, 0.0791168212890625, 0.08296012878417969, 0.08680343627929688, 0.09064674377441406, 0.09449005126953125, 0.09833335876464844, 0.10217666625976562, 0.10601997375488281, 0.10986328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 9.0, 10.0, 9.0, 12.0, 13.0, 11.0, 22.0, 22.0, 36.0, 43.0, 57.0, 48.0, 78.0, 66.0, 86.0, 62.0, 80.0, 83.0, 51.0, 45.0, 27.0, 40.0, 12.0, 13.0, 19.0, 9.0, 10.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.046627044677734e-06, -7.783062756061554e-06, -7.5194984674453735e-06, -7.255934178829193e-06, -6.992369890213013e-06, -6.728805601596832e-06, -6.465241312980652e-06, -6.2016770243644714e-06, -5.938112735748291e-06, -5.674548447132111e-06, -5.41098415851593e-06, -5.14741986989975e-06, -4.883855581283569e-06, -4.620291292667389e-06, -4.3567270040512085e-06, -4.093162715435028e-06, -3.829598426818848e-06, -3.5660341382026672e-06, -3.302469849586487e-06, -3.0389055609703064e-06, -2.775341272354126e-06, -2.5117769837379456e-06, -2.248212695121765e-06, -1.9846484065055847e-06, -1.7210841178894043e-06, -1.4575198292732239e-06, -1.1939555406570435e-06, -9.30391252040863e-07, -6.668269634246826e-07, -4.032626748085022e-07, -1.3969838619232178e-07, 1.2386590242385864e-07, 3.8743019104003906e-07, 6.509944796562195e-07, 9.145587682723999e-07, 1.1781230568885803e-06, 1.4416873455047607e-06, 1.7052516341209412e-06, 1.9688159227371216e-06, 2.232380211353302e-06, 2.4959444999694824e-06, 2.759508788585663e-06, 3.0230730772018433e-06, 3.2866373658180237e-06, 3.550201654434204e-06, 3.8137659430503845e-06, 4.077330231666565e-06, 4.340894520282745e-06, 4.604458808898926e-06, 4.868023097515106e-06, 5.131587386131287e-06, 5.395151674747467e-06, 5.6587159633636475e-06, 5.922280251979828e-06, 6.185844540596008e-06, 6.449408829212189e-06, 6.712973117828369e-06, 6.9765374064445496e-06, 7.24010169506073e-06, 7.50366598367691e-06, 7.76723027229309e-06, 8.030794560909271e-06, 8.294358849525452e-06, 8.557923138141632e-06, 8.821487426757812e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 4.0, 6.0, 8.0, 13.0, 14.0, 15.0, 30.0, 27.0, 41.0, 68.0, 104.0, 264.0, 1770.0, 162067.0, 878428.0, 4883.0, 382.0, 146.0, 62.0, 44.0, 37.0, 28.0, 24.0, 18.0, 18.0, 14.0, 7.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3330078125, -0.3219642639160156, -0.31092071533203125, -0.2998771667480469, -0.2888336181640625, -0.2777900695800781, -0.26674652099609375, -0.2557029724121094, -0.244659423828125, -0.23361587524414062, -0.22257232666015625, -0.21152877807617188, -0.2004852294921875, -0.18944168090820312, -0.17839813232421875, -0.16735458374023438, -0.15631103515625, -0.14526748657226562, -0.13422393798828125, -0.12318038940429688, -0.1121368408203125, -0.10109329223632812, -0.09004974365234375, -0.07900619506835938, -0.067962646484375, -0.056919097900390625, -0.04587554931640625, -0.034832000732421875, -0.0237884521484375, -0.012744903564453125, -0.00170135498046875, 0.009342193603515625, 0.0203857421875, 0.031429290771484375, 0.04247283935546875, 0.053516387939453125, 0.0645599365234375, 0.07560348510742188, 0.08664703369140625, 0.09769058227539062, 0.108734130859375, 0.11977767944335938, 0.13082122802734375, 0.14186477661132812, 0.1529083251953125, 0.16395187377929688, 0.17499542236328125, 0.18603897094726562, 0.19708251953125, 0.20812606811523438, 0.21916961669921875, 0.23021316528320312, 0.2412567138671875, 0.2523002624511719, 0.26334381103515625, 0.2743873596191406, 0.285430908203125, 0.2964744567871094, 0.30751800537109375, 0.3185615539550781, 0.3296051025390625, 0.3406486511230469, 0.35169219970703125, 0.3627357482910156, 0.373779296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 5.0, 10.0, 14.0, 16.0, 19.0, 23.0, 26.0, 36.0, 46.0, 71.0, 59.0, 99.0, 85.0, 86.0, 76.0, 67.0, 46.0, 31.0, 34.0, 23.0, 23.0, 20.0, 16.0, 17.0, 11.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060638427734375, -0.05871772766113281, -0.056797027587890625, -0.05487632751464844, -0.05295562744140625, -0.05103492736816406, -0.049114227294921875, -0.04719352722167969, -0.0452728271484375, -0.04335212707519531, -0.041431427001953125, -0.03951072692871094, -0.03759002685546875, -0.03566932678222656, -0.033748626708984375, -0.03182792663574219, -0.0299072265625, -0.027986526489257812, -0.026065826416015625, -0.024145126342773438, -0.02222442626953125, -0.020303726196289062, -0.018383026123046875, -0.016462326049804688, -0.0145416259765625, -0.012620925903320312, -0.010700225830078125, -0.008779525756835938, -0.00685882568359375, -0.0049381256103515625, -0.003017425537109375, -0.0010967254638671875, 0.000823974609375, 0.0027446746826171875, 0.004665374755859375, 0.0065860748291015625, 0.00850677490234375, 0.010427474975585938, 0.012348175048828125, 0.014268875122070312, 0.0161895751953125, 0.018110275268554688, 0.020030975341796875, 0.021951675415039062, 0.02387237548828125, 0.025793075561523438, 0.027713775634765625, 0.029634475708007812, 0.03155517578125, 0.03347587585449219, 0.035396575927734375, 0.03731727600097656, 0.03923797607421875, 0.04115867614746094, 0.043079376220703125, 0.04500007629394531, 0.0469207763671875, 0.04884147644042969, 0.050762176513671875, 0.05268287658691406, 0.05460357666015625, 0.05652427673339844, 0.058444976806640625, 0.06036567687988281, 0.062286376953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 25.0, 444.0, 489.0, 44.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.230231285095215, -8.071907997131348, -7.913585662841797, -7.755262851715088, -7.596940040588379, -7.438616752624512, -7.280294418334961, -7.121971130371094, -6.963648319244385, -6.805325508117676, -6.647002696990967, -6.488679885864258, -6.330357074737549, -6.17203426361084, -6.013710975646973, -5.855388164520264, -5.697065353393555, -5.538742542266846, -5.380419731140137, -5.222096920013428, -5.063774108886719, -4.905450820922852, -4.747128486633301, -4.588805198669434, -4.430482864379883, -4.272160053253174, -4.113837242126465, -3.955514430999756, -3.7971913814544678, -3.638868570327759, -3.48054575920105, -3.3222227096557617, -3.163900136947632, -3.005577325820923, -2.847254514694214, -2.688931465148926, -2.530608654022217, -2.372285842895508, -2.213963031768799, -2.05564022064209, -1.8973172903060913, -1.7389944791793823, -1.5806715488433838, -1.4223487377166748, -1.2640259265899658, -1.1057029962539673, -0.9473801851272583, -0.7890572547912598, -0.6307344436645508, -0.472411572933197, -0.31408873200416565, -0.15576589107513428, 0.0025569796562194824, 0.16087985038757324, 0.3192026615142822, 0.47752559185028076, 0.6358484029769897, 0.7941712737083435, 0.9524941444396973, 1.1108169555664062, 1.2691397666931152, 1.4274626970291138, 1.5857855081558228, 1.7441084384918213, 1.9024312496185303]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 5.0, 5.0, 5.0, 7.0, 8.0, 12.0, 11.0, 15.0, 11.0, 24.0, 28.0, 16.0, 40.0, 45.0, 43.0, 42.0, 34.0, 35.0, 50.0, 51.0, 39.0, 41.0, 41.0, 45.0, 41.0, 34.0, 29.0, 29.0, 30.0, 30.0, 26.0, 21.0, 20.0, 21.0, 15.0, 15.0, 11.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8964300751686096, -0.8689583539962769, -0.8414866328239441, -0.8140149116516113, -0.7865432500839233, -0.7590715289115906, -0.7315998077392578, -0.704128086566925, -0.6766563653945923, -0.6491846442222595, -0.6217129230499268, -0.5942412614822388, -0.566769540309906, -0.5392978191375732, -0.5118260979652405, -0.4843543767929077, -0.45688268542289734, -0.4294109642505646, -0.4019392728805542, -0.37446755170822144, -0.34699583053588867, -0.3195241093635559, -0.29205241799354553, -0.26458069682121277, -0.2371089905500412, -0.20963728427886963, -0.18216556310653687, -0.1546938568353653, -0.12722215056419373, -0.09975042939186096, -0.07227872312068939, -0.04480700194835663, -0.01733529567718506, 0.010136416181921959, 0.037608128041028976, 0.06507983803749084, 0.09255155175924301, 0.12002326548099518, 0.14749497175216675, 0.1749666929244995, 0.20243839919567108, 0.22991010546684265, 0.2573818266391754, 0.2848535180091858, 0.31232523918151855, 0.3397969603538513, 0.3672686815261841, 0.39474040269851685, 0.4222120940685272, 0.44968381524086, 0.47715550661087036, 0.5046272277832031, 0.5320989489555359, 0.5595706701278687, 0.5870423316955566, 0.6145141124725342, 0.6419857740402222, 0.6694574952125549, 0.6969292163848877, 0.7244008779525757, 0.7518725991249084, 0.7793443202972412, 0.806816041469574, 0.8342877626419067, 0.8617594838142395]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 14.0, 22.0, 27.0, 37.0, 70.0, 90.0, 196.0, 368.0, 915.0, 3181.0, 14448.0, 261187.0, 3862930.0, 43225.0, 4818.0, 1323.0, 565.0, 319.0, 175.0, 115.0, 68.0, 37.0, 32.0, 19.0, 17.0, 15.0, 14.0, 7.0, 6.0, 4.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.27197265625, -0.2616233825683594, -0.25127410888671875, -0.24092483520507812, -0.2305755615234375, -0.22022628784179688, -0.20987701416015625, -0.19952774047851562, -0.189178466796875, -0.17882919311523438, -0.16847991943359375, -0.15813064575195312, -0.1477813720703125, -0.13743209838867188, -0.12708282470703125, -0.11673355102539062, -0.10638427734375, -0.09603500366210938, -0.08568572998046875, -0.07533645629882812, -0.0649871826171875, -0.054637908935546875, -0.04428863525390625, -0.033939361572265625, -0.023590087890625, -0.013240814208984375, -0.00289154052734375, 0.007457733154296875, 0.0178070068359375, 0.028156280517578125, 0.03850555419921875, 0.048854827880859375, 0.0592041015625, 0.06955337524414062, 0.07990264892578125, 0.09025192260742188, 0.1006011962890625, 0.11095046997070312, 0.12129974365234375, 0.13164901733398438, 0.141998291015625, 0.15234756469726562, 0.16269683837890625, 0.17304611206054688, 0.1833953857421875, 0.19374465942382812, 0.20409393310546875, 0.21444320678710938, 0.22479248046875, 0.23514175415039062, 0.24549102783203125, 0.2558403015136719, 0.2661895751953125, 0.2765388488769531, 0.28688812255859375, 0.2972373962402344, 0.307586669921875, 0.3179359436035156, 0.32828521728515625, 0.3386344909667969, 0.3489837646484375, 0.3593330383300781, 0.36968231201171875, 0.3800315856933594, 0.390380859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 14.0, 16.0, 17.0, 22.0, 37.0, 60.0, 98.0, 158.0, 184.0, 155.0, 74.0, 76.0, 24.0, 20.0, 18.0, 16.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11505126953125, -0.11033344268798828, -0.10561561584472656, -0.10089778900146484, -0.09617996215820312, -0.0914621353149414, -0.08674430847167969, -0.08202648162841797, -0.07730865478515625, -0.07259082794189453, -0.06787300109863281, -0.0631551742553711, -0.058437347412109375, -0.053719520568847656, -0.04900169372558594, -0.04428386688232422, -0.0395660400390625, -0.03484821319580078, -0.030130386352539062, -0.025412559509277344, -0.020694732666015625, -0.015976905822753906, -0.011259078979492188, -0.006541252136230469, -0.00182342529296875, 0.0028944015502929688, 0.0076122283935546875, 0.012330055236816406, 0.017047882080078125, 0.021765708923339844, 0.026483535766601562, 0.03120136260986328, 0.035919189453125, 0.04063701629638672, 0.04535484313964844, 0.050072669982910156, 0.054790496826171875, 0.059508323669433594, 0.06422615051269531, 0.06894397735595703, 0.07366180419921875, 0.07837963104248047, 0.08309745788574219, 0.0878152847290039, 0.09253311157226562, 0.09725093841552734, 0.10196876525878906, 0.10668659210205078, 0.1114044189453125, 0.11612224578857422, 0.12084007263183594, 0.12555789947509766, 0.13027572631835938, 0.1349935531616211, 0.1397113800048828, 0.14442920684814453, 0.14914703369140625, 0.15386486053466797, 0.1585826873779297, 0.1633005142211914, 0.16801834106445312, 0.17273616790771484, 0.17745399475097656, 0.18217182159423828, 0.1868896484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 23.0, 50.0, 115.0, 342.0, 1097.0, 11155.0, 1627359.0, 2539088.0, 13303.0, 1140.0, 306.0, 140.0, 58.0, 33.0, 29.0, 6.0, 5.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4560279846191406, -0.43915557861328125, -0.4222831726074219, -0.4054107666015625, -0.3885383605957031, -0.37166595458984375, -0.3547935485839844, -0.337921142578125, -0.3210487365722656, -0.30417633056640625, -0.2873039245605469, -0.2704315185546875, -0.2535591125488281, -0.23668670654296875, -0.21981430053710938, -0.20294189453125, -0.18606948852539062, -0.16919708251953125, -0.15232467651367188, -0.1354522705078125, -0.11857986450195312, -0.10170745849609375, -0.08483505249023438, -0.067962646484375, -0.051090240478515625, -0.03421783447265625, -0.017345428466796875, -0.0004730224609375, 0.016399383544921875, 0.03327178955078125, 0.050144195556640625, 0.0670166015625, 0.08388900756835938, 0.10076141357421875, 0.11763381958007812, 0.1345062255859375, 0.15137863159179688, 0.16825103759765625, 0.18512344360351562, 0.201995849609375, 0.21886825561523438, 0.23574066162109375, 0.2526130676269531, 0.2694854736328125, 0.2863578796386719, 0.30323028564453125, 0.3201026916503906, 0.33697509765625, 0.3538475036621094, 0.37071990966796875, 0.3875923156738281, 0.4044647216796875, 0.4213371276855469, 0.43820953369140625, 0.4550819396972656, 0.471954345703125, 0.4888267517089844, 0.5056991577148438, 0.5225715637207031, 0.5394439697265625, 0.5563163757324219, 0.5731887817382812, 0.5900611877441406, 0.60693359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 12.0, 8.0, 21.0, 41.0, 86.0, 158.0, 406.0, 752.0, 1302.0, 648.0, 283.0, 147.0, 96.0, 47.0, 31.0, 16.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.188446044921875, -0.18243408203125, -0.176422119140625, -0.17041015625, -0.164398193359375, -0.15838623046875, -0.152374267578125, -0.1463623046875, -0.140350341796875, -0.13433837890625, -0.128326416015625, -0.122314453125, -0.116302490234375, -0.11029052734375, -0.104278564453125, -0.0982666015625, -0.092254638671875, -0.08624267578125, -0.080230712890625, -0.07421875, -0.068206787109375, -0.06219482421875, -0.056182861328125, -0.0501708984375, -0.044158935546875, -0.03814697265625, -0.032135009765625, -0.026123046875, -0.020111083984375, -0.01409912109375, -0.008087158203125, -0.0020751953125, 0.003936767578125, 0.00994873046875, 0.015960693359375, 0.02197265625, 0.027984619140625, 0.03399658203125, 0.040008544921875, 0.0460205078125, 0.052032470703125, 0.05804443359375, 0.064056396484375, 0.070068359375, 0.076080322265625, 0.08209228515625, 0.088104248046875, 0.0941162109375, 0.100128173828125, 0.10614013671875, 0.112152099609375, 0.1181640625, 0.124176025390625, 0.13018798828125, 0.136199951171875, 0.1422119140625, 0.148223876953125, 0.15423583984375, 0.160247802734375, 0.166259765625, 0.172271728515625, 0.17828369140625, 0.184295654296875, 0.1903076171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 841.0, 172.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.509147644042969, -13.248595237731934, -12.988042831420898, -12.727490425109863, -12.466938018798828, -12.20638656616211, -11.945834159851074, -11.685281753540039, -11.424729347229004, -11.164176940917969, -10.903624534606934, -10.643072128295898, -10.38252067565918, -10.121968269348145, -9.86141586303711, -9.600863456726074, -9.340311050415039, -9.079758644104004, -8.819206237792969, -8.558653831481934, -8.298101425170898, -8.03754997253418, -7.7769975662231445, -7.516445159912109, -7.255892753601074, -6.995340347290039, -6.734787940979004, -6.474236011505127, -6.213683605194092, -5.953131198883057, -5.69257926940918, -5.4320268630981445, -5.171474933624268, -4.910922527313232, -4.6503705978393555, -4.38981819152832, -4.129265785217285, -3.86871337890625, -3.608161211013794, -3.347609043121338, -3.0870566368103027, -2.8265042304992676, -2.5659520626068115, -2.3053998947143555, -2.0448474884033203, -1.7842952013015747, -1.523742914199829, -1.2631906270980835, -1.002638339996338, -0.7420860528945923, -0.4815337657928467, -0.22098147869110107, 0.03957080841064453, 0.30012309551239014, 0.5606753826141357, 0.8212276697158813, 1.081779956817627, 1.3423322439193726, 1.6028845310211182, 1.8634368181228638, 2.1239891052246094, 2.3845415115356445, 2.6450936794281006, 2.9056458473205566, 3.166198253631592]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 14.0, 11.0, 20.0, 15.0, 24.0, 37.0, 39.0, 52.0, 50.0, 57.0, 70.0, 69.0, 76.0, 51.0, 63.0, 53.0, 55.0, 55.0, 39.0, 31.0, 28.0, 17.0, 16.0, 19.0, 15.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0], "bins": [-0.7734193801879883, -0.7562493681907654, -0.7390792965888977, -0.7219092845916748, -0.7047392725944519, -0.687569260597229, -0.6703991889953613, -0.6532291769981384, -0.6360591650009155, -0.6188891530036926, -0.601719081401825, -0.584549069404602, -0.5673790574073792, -0.5502090454101562, -0.5330389738082886, -0.5158689618110657, -0.498698890209198, -0.4815288484096527, -0.4643588364124298, -0.4471887946128845, -0.4300187826156616, -0.41284874081611633, -0.39567869901657104, -0.37850868701934814, -0.36133864521980286, -0.34416860342025757, -0.32699859142303467, -0.3098285496234894, -0.2926585078239441, -0.2754884958267212, -0.2583184540271759, -0.2411484271287918, -0.2239784598350525, -0.2068084329366684, -0.1896384060382843, -0.172468364238739, -0.15529833734035492, -0.13812831044197083, -0.12095827609300613, -0.10378824174404144, -0.08661821484565735, -0.06944818794727325, -0.05227815359830856, -0.03510812297463417, -0.017938092350959778, -0.0007680654525756836, 0.016401968896389008, 0.0335720032453537, 0.05074203014373779, 0.06791205704212189, 0.08508209139108658, 0.10225212574005127, 0.11942215263843536, 0.13659217953681946, 0.15376222133636475, 0.17093224823474884, 0.18810227513313293, 0.20527230203151703, 0.22244232892990112, 0.2396123707294464, 0.2567824125289917, 0.2739524245262146, 0.2911224663257599, 0.3082925081253052, 0.3254625201225281]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 8.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 8.0, 16.0, 25.0, 31.0, 33.0, 41.0, 70.0, 92.0, 137.0, 169.0, 268.0, 496.0, 953.0, 2153.0, 6210.0, 24996.0, 215567.0, 707223.0, 70408.0, 12782.0, 3628.0, 1432.0, 624.0, 366.0, 217.0, 155.0, 107.0, 66.0, 45.0, 40.0, 32.0, 30.0, 15.0, 18.0, 13.0, 9.0, 7.0, 9.0, 5.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4086418151855469, -0.39418792724609375, -0.3797340393066406, -0.3652801513671875, -0.3508262634277344, -0.33637237548828125, -0.3219184875488281, -0.307464599609375, -0.2930107116699219, -0.27855682373046875, -0.2641029357910156, -0.2496490478515625, -0.23519515991210938, -0.22074127197265625, -0.20628738403320312, -0.19183349609375, -0.17737960815429688, -0.16292572021484375, -0.14847183227539062, -0.1340179443359375, -0.11956405639648438, -0.10511016845703125, -0.09065628051757812, -0.076202392578125, -0.061748504638671875, -0.04729461669921875, -0.032840728759765625, -0.0183868408203125, -0.003932952880859375, 0.01052093505859375, 0.024974822998046875, 0.0394287109375, 0.053882598876953125, 0.06833648681640625, 0.08279037475585938, 0.0972442626953125, 0.11169815063476562, 0.12615203857421875, 0.14060592651367188, 0.155059814453125, 0.16951370239257812, 0.18396759033203125, 0.19842147827148438, 0.2128753662109375, 0.22732925415039062, 0.24178314208984375, 0.2562370300292969, 0.27069091796875, 0.2851448059082031, 0.29959869384765625, 0.3140525817871094, 0.3285064697265625, 0.3429603576660156, 0.35741424560546875, 0.3718681335449219, 0.386322021484375, 0.4007759094238281, 0.41522979736328125, 0.4296836853027344, 0.4441375732421875, 0.4585914611816406, 0.47304534912109375, 0.4874992370605469, 0.501953125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 10.0, 8.0, 14.0, 21.0, 35.0, 39.0, 78.0, 121.0, 188.0, 184.0, 120.0, 72.0, 39.0, 26.0, 18.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.117919921875, -0.11318397521972656, -0.10844802856445312, -0.10371208190917969, -0.09897613525390625, -0.09424018859863281, -0.08950424194335938, -0.08476829528808594, -0.0800323486328125, -0.07529640197753906, -0.07056045532226562, -0.06582450866699219, -0.06108856201171875, -0.05635261535644531, -0.051616668701171875, -0.04688072204589844, -0.042144775390625, -0.03740882873535156, -0.032672882080078125, -0.027936935424804688, -0.02320098876953125, -0.018465042114257812, -0.013729095458984375, -0.008993148803710938, -0.0042572021484375, 0.0004787445068359375, 0.005214691162109375, 0.009950637817382812, 0.01468658447265625, 0.019422531127929688, 0.024158477783203125, 0.028894424438476562, 0.03363037109375, 0.03836631774902344, 0.043102264404296875, 0.04783821105957031, 0.05257415771484375, 0.05731010437011719, 0.062046051025390625, 0.06678199768066406, 0.0715179443359375, 0.07625389099121094, 0.08098983764648438, 0.08572578430175781, 0.09046173095703125, 0.09519767761230469, 0.09993362426757812, 0.10466957092285156, 0.109405517578125, 0.11414146423339844, 0.11887741088867188, 0.12361335754394531, 0.12834930419921875, 0.1330852508544922, 0.13782119750976562, 0.14255714416503906, 0.1472930908203125, 0.15202903747558594, 0.15676498413085938, 0.1615009307861328, 0.16623687744140625, 0.1709728240966797, 0.17570877075195312, 0.18044471740722656, 0.1851806640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 7.0, 5.0, 2.0, 11.0, 11.0, 10.0, 14.0, 15.0, 21.0, 30.0, 55.0, 48.0, 64.0, 87.0, 108.0, 177.0, 267.0, 580.0, 1453.0, 4693.0, 19233.0, 130061.0, 667440.0, 189855.0, 25072.0, 5812.0, 1739.0, 614.0, 347.0, 201.0, 126.0, 91.0, 83.0, 39.0, 45.0, 35.0, 26.0, 14.0, 14.0, 18.0, 9.0, 4.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.447998046875, -0.4350433349609375, -0.422088623046875, -0.4091339111328125, -0.39617919921875, -0.3832244873046875, -0.370269775390625, -0.3573150634765625, -0.3443603515625, -0.3314056396484375, -0.318450927734375, -0.3054962158203125, -0.29254150390625, -0.2795867919921875, -0.266632080078125, -0.2536773681640625, -0.24072265625, -0.2277679443359375, -0.214813232421875, -0.2018585205078125, -0.18890380859375, -0.1759490966796875, -0.162994384765625, -0.1500396728515625, -0.1370849609375, -0.1241302490234375, -0.111175537109375, -0.0982208251953125, -0.08526611328125, -0.0723114013671875, -0.059356689453125, -0.0464019775390625, -0.033447265625, -0.0204925537109375, -0.007537841796875, 0.0054168701171875, 0.01837158203125, 0.0313262939453125, 0.044281005859375, 0.0572357177734375, 0.0701904296875, 0.0831451416015625, 0.096099853515625, 0.1090545654296875, 0.12200927734375, 0.1349639892578125, 0.147918701171875, 0.1608734130859375, 0.173828125, 0.1867828369140625, 0.199737548828125, 0.2126922607421875, 0.22564697265625, 0.2386016845703125, 0.251556396484375, 0.2645111083984375, 0.2774658203125, 0.2904205322265625, 0.303375244140625, 0.3163299560546875, 0.32928466796875, 0.3422393798828125, 0.355194091796875, 0.3681488037109375, 0.381103515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 5.0, 18.0, 17.0, 14.0, 22.0, 24.0, 29.0, 28.0, 32.0, 46.0, 52.0, 45.0, 41.0, 42.0, 55.0, 47.0, 50.0, 52.0, 44.0, 42.0, 38.0, 39.0, 36.0, 36.0, 16.0, 16.0, 16.0, 12.0, 8.0, 11.0, 5.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.14111328125, -0.13638687133789062, -0.13166046142578125, -0.12693405151367188, -0.1222076416015625, -0.11748123168945312, -0.11275482177734375, -0.10802841186523438, -0.103302001953125, -0.09857559204101562, -0.09384918212890625, -0.08912277221679688, -0.0843963623046875, -0.07966995239257812, -0.07494354248046875, -0.07021713256835938, -0.06549072265625, -0.060764312744140625, -0.05603790283203125, -0.051311492919921875, -0.0465850830078125, -0.041858673095703125, -0.03713226318359375, -0.032405853271484375, -0.027679443359375, -0.022953033447265625, -0.01822662353515625, -0.013500213623046875, -0.0087738037109375, -0.004047393798828125, 0.00067901611328125, 0.005405426025390625, 0.0101318359375, 0.014858245849609375, 0.01958465576171875, 0.024311065673828125, 0.0290374755859375, 0.033763885498046875, 0.03849029541015625, 0.043216705322265625, 0.047943115234375, 0.052669525146484375, 0.05739593505859375, 0.062122344970703125, 0.0668487548828125, 0.07157516479492188, 0.07630157470703125, 0.08102798461914062, 0.08575439453125, 0.09048080444335938, 0.09520721435546875, 0.09993362426757812, 0.1046600341796875, 0.10938644409179688, 0.11411285400390625, 0.11883926391601562, 0.123565673828125, 0.12829208374023438, 0.13301849365234375, 0.13774490356445312, 0.1424713134765625, 0.14719772338867188, 0.15192413330078125, 0.15665054321289062, 0.161376953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 9.0, 7.0, 6.0, 9.0, 15.0, 23.0, 33.0, 41.0, 63.0, 99.0, 137.0, 174.0, 301.0, 422.0, 664.0, 1098.0, 1791.0, 3217.0, 5830.0, 12057.0, 31040.0, 121802.0, 478653.0, 290933.0, 61233.0, 19482.0, 8559.0, 4406.0, 2479.0, 1490.0, 888.0, 504.0, 376.0, 244.0, 128.0, 84.0, 81.0, 41.0, 40.0, 29.0, 16.0, 10.0, 9.0, 9.0, 14.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.1444091796875, -0.1395587921142578, -0.13470840454101562, -0.12985801696777344, -0.12500762939453125, -0.12015724182128906, -0.11530685424804688, -0.11045646667480469, -0.1056060791015625, -0.10075569152832031, -0.09590530395507812, -0.09105491638183594, -0.08620452880859375, -0.08135414123535156, -0.07650375366210938, -0.07165336608886719, -0.066802978515625, -0.06195259094238281, -0.057102203369140625, -0.05225181579589844, -0.04740142822265625, -0.04255104064941406, -0.037700653076171875, -0.03285026550292969, -0.0279998779296875, -0.023149490356445312, -0.018299102783203125, -0.013448715209960938, -0.00859832763671875, -0.0037479400634765625, 0.001102447509765625, 0.0059528350830078125, 0.01080322265625, 0.015653610229492188, 0.020503997802734375, 0.025354385375976562, 0.03020477294921875, 0.03505516052246094, 0.039905548095703125, 0.04475593566894531, 0.0496063232421875, 0.05445671081542969, 0.059307098388671875, 0.06415748596191406, 0.06900787353515625, 0.07385826110839844, 0.07870864868164062, 0.08355903625488281, 0.088409423828125, 0.09325981140136719, 0.09811019897460938, 0.10296058654785156, 0.10781097412109375, 0.11266136169433594, 0.11751174926757812, 0.12236213684082031, 0.1272125244140625, 0.1320629119873047, 0.13691329956054688, 0.14176368713378906, 0.14661407470703125, 0.15146446228027344, 0.15631484985351562, 0.1611652374267578, 0.166015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 12.0, 13.0, 20.0, 40.0, 78.0, 142.0, 215.0, 219.0, 131.0, 55.0, 23.0, 15.0, 11.0, 9.0, 1.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.713369369506836e-05, -3.606826066970825e-05, -3.5002827644348145e-05, -3.393739461898804e-05, -3.287196159362793e-05, -3.180652856826782e-05, -3.0741095542907715e-05, -2.9675662517547607e-05, -2.86102294921875e-05, -2.7544796466827393e-05, -2.6479363441467285e-05, -2.5413930416107178e-05, -2.434849739074707e-05, -2.3283064365386963e-05, -2.2217631340026855e-05, -2.1152198314666748e-05, -2.008676528930664e-05, -1.9021332263946533e-05, -1.7955899238586426e-05, -1.689046621322632e-05, -1.582503318786621e-05, -1.4759600162506104e-05, -1.3694167137145996e-05, -1.2628734111785889e-05, -1.1563301086425781e-05, -1.0497868061065674e-05, -9.432435035705566e-06, -8.367002010345459e-06, -7.3015689849853516e-06, -6.236135959625244e-06, -5.170702934265137e-06, -4.105269908905029e-06, -3.039836883544922e-06, -1.9744038581848145e-06, -9.08970832824707e-07, 1.564621925354004e-07, 1.2218952178955078e-06, 2.2873282432556152e-06, 3.3527612686157227e-06, 4.41819429397583e-06, 5.4836273193359375e-06, 6.549060344696045e-06, 7.614493370056152e-06, 8.67992639541626e-06, 9.745359420776367e-06, 1.0810792446136475e-05, 1.1876225471496582e-05, 1.294165849685669e-05, 1.4007091522216797e-05, 1.5072524547576904e-05, 1.6137957572937012e-05, 1.720339059829712e-05, 1.8268823623657227e-05, 1.9334256649017334e-05, 2.039968967437744e-05, 2.146512269973755e-05, 2.2530555725097656e-05, 2.3595988750457764e-05, 2.466142177581787e-05, 2.572685480117798e-05, 2.6792287826538086e-05, 2.7857720851898193e-05, 2.89231538772583e-05, 2.9988586902618408e-05, 3.1054019927978516e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 10.0, 7.0, 14.0, 13.0, 20.0, 32.0, 39.0, 78.0, 96.0, 174.0, 306.0, 591.0, 1506.0, 4144.0, 16810.0, 118648.0, 670849.0, 201692.0, 24309.0, 5645.0, 1888.0, 749.0, 383.0, 191.0, 118.0, 66.0, 49.0, 32.0, 28.0, 16.0, 9.0, 11.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1845703125, -0.1785411834716797, -0.17251205444335938, -0.16648292541503906, -0.16045379638671875, -0.15442466735839844, -0.14839553833007812, -0.1423664093017578, -0.1363372802734375, -0.1303081512451172, -0.12427902221679688, -0.11824989318847656, -0.11222076416015625, -0.10619163513183594, -0.10016250610351562, -0.09413337707519531, -0.088104248046875, -0.08207511901855469, -0.07604598999023438, -0.07001686096191406, -0.06398773193359375, -0.05795860290527344, -0.051929473876953125, -0.04590034484863281, -0.0398712158203125, -0.03384208679199219, -0.027812957763671875, -0.021783828735351562, -0.01575469970703125, -0.009725570678710938, -0.003696441650390625, 0.0023326873779296875, 0.00836181640625, 0.014390945434570312, 0.020420074462890625, 0.026449203491210938, 0.03247833251953125, 0.03850746154785156, 0.044536590576171875, 0.05056571960449219, 0.0565948486328125, 0.06262397766113281, 0.06865310668945312, 0.07468223571777344, 0.08071136474609375, 0.08674049377441406, 0.09276962280273438, 0.09879875183105469, 0.104827880859375, 0.11085700988769531, 0.11688613891601562, 0.12291526794433594, 0.12894439697265625, 0.13497352600097656, 0.14100265502929688, 0.1470317840576172, 0.1530609130859375, 0.1590900421142578, 0.16511917114257812, 0.17114830017089844, 0.17717742919921875, 0.18320655822753906, 0.18923568725585938, 0.1952648162841797, 0.2012939453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 6.0, 7.0, 14.0, 20.0, 12.0, 21.0, 33.0, 35.0, 56.0, 42.0, 54.0, 69.0, 71.0, 76.0, 80.0, 73.0, 76.0, 40.0, 44.0, 37.0, 27.0, 18.0, 18.0, 13.0, 6.0, 7.0, 5.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06829833984375, -0.06624031066894531, -0.06418228149414062, -0.06212425231933594, -0.06006622314453125, -0.05800819396972656, -0.055950164794921875, -0.05389213562011719, -0.0518341064453125, -0.04977607727050781, -0.047718048095703125, -0.04566001892089844, -0.04360198974609375, -0.04154396057128906, -0.039485931396484375, -0.03742790222167969, -0.035369873046875, -0.03331184387207031, -0.031253814697265625, -0.029195785522460938, -0.02713775634765625, -0.025079727172851562, -0.023021697998046875, -0.020963668823242188, -0.0189056396484375, -0.016847610473632812, -0.014789581298828125, -0.012731552124023438, -0.01067352294921875, -0.008615493774414062, -0.006557464599609375, -0.0044994354248046875, -0.00244140625, -0.0003833770751953125, 0.001674652099609375, 0.0037326812744140625, 0.00579071044921875, 0.007848739624023438, 0.009906768798828125, 0.011964797973632812, 0.0140228271484375, 0.016080856323242188, 0.018138885498046875, 0.020196914672851562, 0.02225494384765625, 0.024312973022460938, 0.026371002197265625, 0.028429031372070312, 0.030487060546875, 0.03254508972167969, 0.034603118896484375, 0.03666114807128906, 0.03871917724609375, 0.04077720642089844, 0.042835235595703125, 0.04489326477050781, 0.0469512939453125, 0.04900932312011719, 0.051067352294921875, 0.05312538146972656, 0.05518341064453125, 0.05724143981933594, 0.059299468994140625, 0.06135749816894531, 0.06341552734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 30.0, 91.0, 225.0, 288.0, 203.0, 98.0, 29.0, 17.0, 7.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.949930191040039, -1.9041064977645874, -1.8582826852798462, -1.8124589920043945, -1.7666351795196533, -1.7208114862442017, -1.67498779296875, -1.6291639804840088, -1.5833401679992676, -1.537516474723816, -1.4916926622390747, -1.445868968963623, -1.4000451564788818, -1.3542214632034302, -1.3083977699279785, -1.2625739574432373, -1.2167502641677856, -1.170926570892334, -1.1251027584075928, -1.0792790651321411, -1.0334552526474, -0.9876315593719482, -0.9418078064918518, -0.8959840536117554, -0.8501603007316589, -0.8043365478515625, -0.7585127949714661, -0.7126890420913696, -0.666865348815918, -0.6210415363311768, -0.5752178430557251, -0.5293940901756287, -0.48357027769088745, -0.437746524810791, -0.3919227719306946, -0.34609904885292053, -0.3002752959728241, -0.25445154309272766, -0.2086278200149536, -0.16280406713485718, -0.11698031425476074, -0.0711565688252449, -0.025332823395729065, 0.020490914583206177, 0.06631466746330261, 0.11213842034339905, 0.1579621434211731, 0.20378589630126953, 0.24960964918136597, 0.2954334020614624, 0.34125715494155884, 0.3870808780193329, 0.4329046308994293, 0.47872838377952576, 0.5245521068572998, 0.5703758597373962, 0.6161996126174927, 0.6620233654975891, 0.7078471183776855, 0.7536708116531372, 0.7994946241378784, 0.8453183174133301, 0.8911420702934265, 0.936965823173523, 0.9827895760536194]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 12.0, 9.0, 14.0, 12.0, 16.0, 21.0, 25.0, 28.0, 41.0, 33.0, 40.0, 36.0, 53.0, 57.0, 51.0, 47.0, 60.0, 43.0, 50.0, 42.0, 51.0, 48.0, 37.0, 31.0, 29.0, 24.0, 24.0, 14.0, 16.0, 10.0, 8.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46683305501937866, -0.4494871497154236, -0.4321412742137909, -0.4147953689098358, -0.3974494934082031, -0.38010358810424805, -0.36275768280029297, -0.3454118072986603, -0.3280659317970276, -0.3107200264930725, -0.2933741509914398, -0.27602824568748474, -0.25868237018585205, -0.24133646488189697, -0.2239905744791031, -0.2066446840763092, -0.18929877877235413, -0.17195288836956024, -0.15460699796676636, -0.13726109266281128, -0.11991520971059799, -0.10256931930780411, -0.08522342145442963, -0.06787753105163574, -0.05053164064884186, -0.033185750246047974, -0.01583985611796379, 0.0015060380101203918, 0.018851928412914276, 0.03619781881570816, 0.05354371666908264, 0.07088960707187653, 0.08823549747467041, 0.1055813878774643, 0.12292727828025818, 0.14027318358421326, 0.15761905908584595, 0.17496496438980103, 0.1923108547925949, 0.2096567451953888, 0.22700263559818268, 0.24434852600097656, 0.26169443130493164, 0.27904030680656433, 0.2963862121105194, 0.3137320876121521, 0.3310779929161072, 0.34842389822006226, 0.36576977372169495, 0.38311567902565, 0.4004615545272827, 0.4178074598312378, 0.4351533353328705, 0.45249924063682556, 0.46984511613845825, 0.48719102144241333, 0.5045369267463684, 0.5218828320503235, 0.5392287373542786, 0.5565745830535889, 0.573920488357544, 0.591266393661499, 0.6086122989654541, 0.6259582042694092, 0.6433040499687195]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 7.0, 11.0, 19.0, 32.0, 48.0, 114.0, 201.0, 434.0, 1074.0, 3338.0, 8619.0, 32320.0, 686462.0, 3356012.0, 89788.0, 10549.0, 2668.0, 990.0, 542.0, 350.0, 182.0, 128.0, 96.0, 69.0, 52.0, 38.0, 34.0, 18.0, 11.0, 15.0, 13.0, 5.0, 6.0, 9.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.1614990234375, -0.1548328399658203, -0.14816665649414062, -0.14150047302246094, -0.13483428955078125, -0.12816810607910156, -0.12150192260742188, -0.11483573913574219, -0.1081695556640625, -0.10150337219238281, -0.09483718872070312, -0.08817100524902344, -0.08150482177734375, -0.07483863830566406, -0.06817245483398438, -0.06150627136230469, -0.054840087890625, -0.04817390441894531, -0.041507720947265625, -0.03484153747558594, -0.02817535400390625, -0.021509170532226562, -0.014842987060546875, -0.008176803588867188, -0.0015106201171875, 0.0051555633544921875, 0.011821746826171875, 0.018487930297851562, 0.02515411376953125, 0.03182029724121094, 0.038486480712890625, 0.04515266418457031, 0.05181884765625, 0.05848503112792969, 0.06515121459960938, 0.07181739807128906, 0.07848358154296875, 0.08514976501464844, 0.09181594848632812, 0.09848213195800781, 0.1051483154296875, 0.11181449890136719, 0.11848068237304688, 0.12514686584472656, 0.13181304931640625, 0.13847923278808594, 0.14514541625976562, 0.1518115997314453, 0.158477783203125, 0.1651439666748047, 0.17181015014648438, 0.17847633361816406, 0.18514251708984375, 0.19180870056152344, 0.19847488403320312, 0.2051410675048828, 0.2118072509765625, 0.2184734344482422, 0.22513961791992188, 0.23180580139160156, 0.23847198486328125, 0.24513816833496094, 0.2518043518066406, 0.2584705352783203, 0.26513671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 20.0, 5.0, 31.0, 33.0, 44.0, 103.0, 148.0, 164.0, 174.0, 99.0, 69.0, 39.0, 21.0, 18.0, 8.0, 7.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1083984375, -0.10380744934082031, -0.09921646118164062, -0.09462547302246094, -0.09003448486328125, -0.08544349670410156, -0.08085250854492188, -0.07626152038574219, -0.0716705322265625, -0.06707954406738281, -0.062488555908203125, -0.05789756774902344, -0.05330657958984375, -0.04871559143066406, -0.044124603271484375, -0.03953361511230469, -0.034942626953125, -0.030351638793945312, -0.025760650634765625, -0.021169662475585938, -0.01657867431640625, -0.011987686157226562, -0.007396697998046875, -0.0028057098388671875, 0.0017852783203125, 0.0063762664794921875, 0.010967254638671875, 0.015558242797851562, 0.02014923095703125, 0.024740219116210938, 0.029331207275390625, 0.03392219543457031, 0.03851318359375, 0.04310417175292969, 0.047695159912109375, 0.05228614807128906, 0.05687713623046875, 0.06146812438964844, 0.06605911254882812, 0.07065010070800781, 0.0752410888671875, 0.07983207702636719, 0.08442306518554688, 0.08901405334472656, 0.09360504150390625, 0.09819602966308594, 0.10278701782226562, 0.10737800598144531, 0.111968994140625, 0.11655998229980469, 0.12115097045898438, 0.12574195861816406, 0.13033294677734375, 0.13492393493652344, 0.13951492309570312, 0.1441059112548828, 0.1486968994140625, 0.1532878875732422, 0.15787887573242188, 0.16246986389160156, 0.16706085205078125, 0.17165184020996094, 0.17624282836914062, 0.1808338165283203, 0.1854248046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 9.0, 22.0, 15.0, 50.0, 41.0, 80.0, 127.0, 198.0, 339.0, 659.0, 1361.0, 3634.0, 12804.0, 64373.0, 485962.0, 2799461.0, 713415.0, 87696.0, 16391.0, 4299.0, 1605.0, 754.0, 358.0, 204.0, 145.0, 86.0, 50.0, 32.0, 34.0, 12.0, 12.0, 11.0, 9.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13652992248535156, -0.13158035278320312, -0.1266307830810547, -0.12168121337890625, -0.11673164367675781, -0.11178207397460938, -0.10683250427246094, -0.1018829345703125, -0.09693336486816406, -0.09198379516601562, -0.08703422546386719, -0.08208465576171875, -0.07713508605957031, -0.07218551635742188, -0.06723594665527344, -0.062286376953125, -0.05733680725097656, -0.052387237548828125, -0.04743766784667969, -0.04248809814453125, -0.03753852844238281, -0.032588958740234375, -0.027639389038085938, -0.0226898193359375, -0.017740249633789062, -0.012790679931640625, -0.007841110229492188, -0.00289154052734375, 0.0020580291748046875, 0.007007598876953125, 0.011957168579101562, 0.01690673828125, 0.021856307983398438, 0.026805877685546875, 0.03175544738769531, 0.03670501708984375, 0.04165458679199219, 0.046604156494140625, 0.05155372619628906, 0.0565032958984375, 0.06145286560058594, 0.06640243530273438, 0.07135200500488281, 0.07630157470703125, 0.08125114440917969, 0.08620071411132812, 0.09115028381347656, 0.096099853515625, 0.10104942321777344, 0.10599899291992188, 0.11094856262207031, 0.11589813232421875, 0.12084770202636719, 0.12579727172851562, 0.13074684143066406, 0.1356964111328125, 0.14064598083496094, 0.14559555053710938, 0.1505451202392578, 0.15549468994140625, 0.1604442596435547, 0.16539382934570312, 0.17034339904785156, 0.17529296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 12.0, 5.0, 14.0, 12.0, 22.0, 49.0, 43.0, 80.0, 111.0, 134.0, 161.0, 251.0, 304.0, 396.0, 424.0, 461.0, 406.0, 299.0, 215.0, 155.0, 138.0, 109.0, 56.0, 46.0, 38.0, 29.0, 21.0, 24.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.1123046875, -0.10935401916503906, -0.10640335083007812, -0.10345268249511719, -0.10050201416015625, -0.09755134582519531, -0.09460067749023438, -0.09165000915527344, -0.0886993408203125, -0.08574867248535156, -0.08279800415039062, -0.07984733581542969, -0.07689666748046875, -0.07394599914550781, -0.07099533081054688, -0.06804466247558594, -0.065093994140625, -0.06214332580566406, -0.059192657470703125, -0.05624198913574219, -0.05329132080078125, -0.05034065246582031, -0.047389984130859375, -0.04443931579589844, -0.0414886474609375, -0.03853797912597656, -0.035587310791015625, -0.03263664245605469, -0.02968597412109375, -0.026735305786132812, -0.023784637451171875, -0.020833969116210938, -0.01788330078125, -0.014932632446289062, -0.011981964111328125, -0.009031295776367188, -0.00608062744140625, -0.0031299591064453125, -0.000179290771484375, 0.0027713775634765625, 0.0057220458984375, 0.008672714233398438, 0.011623382568359375, 0.014574050903320312, 0.01752471923828125, 0.020475387573242188, 0.023426055908203125, 0.026376724243164062, 0.029327392578125, 0.03227806091308594, 0.035228729248046875, 0.03817939758300781, 0.04113006591796875, 0.04408073425292969, 0.047031402587890625, 0.04998207092285156, 0.0529327392578125, 0.05588340759277344, 0.058834075927734375, 0.06178474426269531, 0.06473541259765625, 0.06768608093261719, 0.07063674926757812, 0.07358741760253906, 0.0765380859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 23.0, 52.0, 147.0, 253.0, 249.0, 147.0, 65.0, 42.0, 13.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4258193373680115, -0.393331378698349, -0.36084339022636414, -0.32835543155670166, -0.2958674430847168, -0.2633794844150543, -0.23089152574539185, -0.19840355217456818, -0.1659155786037445, -0.13342760503292084, -0.10093963891267776, -0.06845167279243469, -0.03596369922161102, -0.0034757256507873535, 0.029012233018875122, 0.06150020658969879, 0.09398818016052246, 0.12647615373134613, 0.1589641273021698, 0.19145208597183228, 0.22394005954265594, 0.2564280331134796, 0.2889159917831421, 0.32140398025512695, 0.35389193892478943, 0.3863798975944519, 0.41886788606643677, 0.45135584473609924, 0.4838438034057617, 0.5163317918777466, 0.5488197803497314, 0.5813077092170715, 0.6137956380844116, 0.6462836265563965, 0.6787715554237366, 0.7112595438957214, 0.7437475323677063, 0.7762354612350464, 0.8087234497070312, 0.8412114381790161, 0.873699426651001, 0.9061874151229858, 0.9386753439903259, 0.9711633324623108, 1.0036512613296509, 1.0361392498016357, 1.0686272382736206, 1.1011152267456055, 1.1336030960083008, 1.1660910844802856, 1.1985790729522705, 1.2310669422149658, 1.2635549306869507, 1.2960429191589355, 1.3285309076309204, 1.3610188961029053, 1.3935068845748901, 1.425994873046875, 1.4584828615188599, 1.4909708499908447, 1.52345871925354, 1.555946707725525, 1.5884346961975098, 1.6209226846694946, 1.6534106731414795]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 11.0, 8.0, 13.0, 14.0, 14.0, 16.0, 23.0, 25.0, 26.0, 40.0, 33.0, 29.0, 41.0, 33.0, 45.0, 45.0, 60.0, 48.0, 44.0, 34.0, 43.0, 32.0, 39.0, 33.0, 31.0, 24.0, 31.0, 21.0, 18.0, 16.0, 18.0, 12.0, 16.0, 15.0, 6.0, 10.0, 7.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31851905584335327, -0.30708131194114685, -0.29564356803894043, -0.284205824136734, -0.2727680802345276, -0.26133033633232117, -0.24989260733127594, -0.23845486342906952, -0.2270171195268631, -0.21557937562465668, -0.20414163172245026, -0.19270390272140503, -0.1812661588191986, -0.1698284149169922, -0.15839067101478577, -0.14695292711257935, -0.13551518321037292, -0.1240774393081665, -0.11263969540596008, -0.10120195895433426, -0.08976421505212784, -0.07832647114992142, -0.0668887346982956, -0.05545099079608917, -0.04401324689388275, -0.03257550299167633, -0.021137762814760208, -0.009700022637844086, 0.0017377212643623352, 0.013175465166568756, 0.02461320161819458, 0.036050945520401, 0.04748868942260742, 0.05892643332481384, 0.07036417722702026, 0.08180191367864609, 0.09323965758085251, 0.10467740148305893, 0.11611513793468475, 0.12755288183689117, 0.1389906257390976, 0.15042836964130402, 0.16186611354351044, 0.17330384254455566, 0.18474158644676208, 0.1961793303489685, 0.20761707425117493, 0.21905481815338135, 0.23049256205558777, 0.2419303059577942, 0.2533680498600006, 0.26480579376220703, 0.27624353766441345, 0.2876812815666199, 0.2991189956665039, 0.3105567693710327, 0.32199448347091675, 0.33343222737312317, 0.3448699712753296, 0.356307715177536, 0.36774545907974243, 0.37918320298194885, 0.3906209468841553, 0.4020586609840393, 0.4134964346885681]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 4.0, 9.0, 10.0, 8.0, 23.0, 14.0, 26.0, 43.0, 66.0, 80.0, 125.0, 211.0, 361.0, 665.0, 1801.0, 6431.0, 42057.0, 555519.0, 401795.0, 30946.0, 5328.0, 1447.0, 589.0, 349.0, 192.0, 134.0, 92.0, 56.0, 56.0, 34.0, 19.0, 11.0, 14.0, 13.0, 7.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.49462127685546875, -0.4775238037109375, -0.46042633056640625, -0.443328857421875, -0.42623138427734375, -0.4091339111328125, -0.39203643798828125, -0.37493896484375, -0.35784149169921875, -0.3407440185546875, -0.32364654541015625, -0.306549072265625, -0.28945159912109375, -0.2723541259765625, -0.25525665283203125, -0.2381591796875, -0.22106170654296875, -0.2039642333984375, -0.18686676025390625, -0.169769287109375, -0.15267181396484375, -0.1355743408203125, -0.11847686767578125, -0.10137939453125, -0.08428192138671875, -0.0671844482421875, -0.05008697509765625, -0.032989501953125, -0.01589202880859375, 0.0012054443359375, 0.01830291748046875, 0.035400390625, 0.05249786376953125, 0.0695953369140625, 0.08669281005859375, 0.103790283203125, 0.12088775634765625, 0.1379852294921875, 0.15508270263671875, 0.17218017578125, 0.18927764892578125, 0.2063751220703125, 0.22347259521484375, 0.240570068359375, 0.25766754150390625, 0.2747650146484375, 0.29186248779296875, 0.3089599609375, 0.32605743408203125, 0.3431549072265625, 0.36025238037109375, 0.377349853515625, 0.39444732666015625, 0.4115447998046875, 0.42864227294921875, 0.44573974609375, 0.46283721923828125, 0.4799346923828125, 0.49703216552734375, 0.514129638671875, 0.5312271118164062, 0.5483245849609375, 0.5654220581054688, 0.58251953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 10.0, 12.0, 13.0, 21.0, 37.0, 55.0, 112.0, 126.0, 202.0, 155.0, 99.0, 72.0, 39.0, 20.0, 12.0, 6.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10528564453125, -0.10060787200927734, -0.09593009948730469, -0.09125232696533203, -0.08657455444335938, -0.08189678192138672, -0.07721900939941406, -0.0725412368774414, -0.06786346435546875, -0.0631856918334961, -0.05850791931152344, -0.05383014678955078, -0.049152374267578125, -0.04447460174560547, -0.03979682922363281, -0.035119056701660156, -0.0304412841796875, -0.025763511657714844, -0.021085739135742188, -0.01640796661376953, -0.011730194091796875, -0.007052421569824219, -0.0023746490478515625, 0.0023031234741210938, 0.00698089599609375, 0.011658668518066406, 0.016336441040039062, 0.02101421356201172, 0.025691986083984375, 0.03036975860595703, 0.03504753112792969, 0.039725303649902344, 0.044403076171875, 0.049080848693847656, 0.05375862121582031, 0.05843639373779297, 0.06311416625976562, 0.06779193878173828, 0.07246971130371094, 0.0771474838256836, 0.08182525634765625, 0.0865030288696289, 0.09118080139160156, 0.09585857391357422, 0.10053634643554688, 0.10521411895751953, 0.10989189147949219, 0.11456966400146484, 0.1192474365234375, 0.12392520904541016, 0.1286029815673828, 0.13328075408935547, 0.13795852661132812, 0.14263629913330078, 0.14731407165527344, 0.1519918441772461, 0.15666961669921875, 0.1613473892211914, 0.16602516174316406, 0.17070293426513672, 0.17538070678710938, 0.18005847930908203, 0.1847362518310547, 0.18941402435302734, 0.194091796875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 8.0, 5.0, 11.0, 19.0, 12.0, 21.0, 35.0, 62.0, 59.0, 163.0, 284.0, 807.0, 2726.0, 12499.0, 78452.0, 454383.0, 414094.0, 69446.0, 11419.0, 2416.0, 813.0, 365.0, 144.0, 96.0, 57.0, 50.0, 19.0, 18.0, 16.0, 9.0, 10.0, 7.0, 6.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.467041015625, -0.45195770263671875, -0.4368743896484375, -0.42179107666015625, -0.406707763671875, -0.39162445068359375, -0.3765411376953125, -0.36145782470703125, -0.34637451171875, -0.33129119873046875, -0.3162078857421875, -0.30112457275390625, -0.286041259765625, -0.27095794677734375, -0.2558746337890625, -0.24079132080078125, -0.2257080078125, -0.21062469482421875, -0.1955413818359375, -0.18045806884765625, -0.165374755859375, -0.15029144287109375, -0.1352081298828125, -0.12012481689453125, -0.10504150390625, -0.08995819091796875, -0.0748748779296875, -0.05979156494140625, -0.044708251953125, -0.02962493896484375, -0.0145416259765625, 0.00054168701171875, 0.015625, 0.03070831298828125, 0.0457916259765625, 0.06087493896484375, 0.075958251953125, 0.09104156494140625, 0.1061248779296875, 0.12120819091796875, 0.13629150390625, 0.15137481689453125, 0.1664581298828125, 0.18154144287109375, 0.196624755859375, 0.21170806884765625, 0.2267913818359375, 0.24187469482421875, 0.2569580078125, 0.27204132080078125, 0.2871246337890625, 0.30220794677734375, 0.317291259765625, 0.33237457275390625, 0.3474578857421875, 0.36254119873046875, 0.37762451171875, 0.39270782470703125, 0.4077911376953125, 0.42287445068359375, 0.437957763671875, 0.45304107666015625, 0.4681243896484375, 0.48320770263671875, 0.498291015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 6.0, 11.0, 14.0, 23.0, 21.0, 28.0, 29.0, 29.0, 30.0, 38.0, 60.0, 38.0, 56.0, 57.0, 43.0, 61.0, 42.0, 63.0, 56.0, 50.0, 43.0, 40.0, 32.0, 29.0, 17.0, 13.0, 10.0, 7.0, 5.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2274169921875, -0.2210540771484375, -0.214691162109375, -0.2083282470703125, -0.20196533203125, -0.1956024169921875, -0.189239501953125, -0.1828765869140625, -0.176513671875, -0.1701507568359375, -0.163787841796875, -0.1574249267578125, -0.15106201171875, -0.1446990966796875, -0.138336181640625, -0.1319732666015625, -0.1256103515625, -0.1192474365234375, -0.112884521484375, -0.1065216064453125, -0.10015869140625, -0.0937957763671875, -0.087432861328125, -0.0810699462890625, -0.07470703125, -0.0683441162109375, -0.061981201171875, -0.0556182861328125, -0.04925537109375, -0.0428924560546875, -0.036529541015625, -0.0301666259765625, -0.0238037109375, -0.0174407958984375, -0.011077880859375, -0.0047149658203125, 0.00164794921875, 0.0080108642578125, 0.014373779296875, 0.0207366943359375, 0.027099609375, 0.0334625244140625, 0.039825439453125, 0.0461883544921875, 0.05255126953125, 0.0589141845703125, 0.065277099609375, 0.0716400146484375, 0.0780029296875, 0.0843658447265625, 0.090728759765625, 0.0970916748046875, 0.10345458984375, 0.1098175048828125, 0.116180419921875, 0.1225433349609375, 0.12890625, 0.1352691650390625, 0.141632080078125, 0.1479949951171875, 0.15435791015625, 0.1607208251953125, 0.167083740234375, 0.1734466552734375, 0.1798095703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 6.0, 4.0, 10.0, 9.0, 11.0, 24.0, 46.0, 52.0, 77.0, 135.0, 154.0, 268.0, 432.0, 786.0, 1602.0, 3421.0, 8504.0, 25990.0, 100697.0, 374362.0, 383738.0, 105080.0, 27347.0, 8659.0, 3482.0, 1599.0, 808.0, 449.0, 292.0, 167.0, 126.0, 56.0, 52.0, 36.0, 24.0, 14.0, 11.0, 1.0, 8.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1605224609375, -0.15517425537109375, -0.1498260498046875, -0.14447784423828125, -0.139129638671875, -0.13378143310546875, -0.1284332275390625, -0.12308502197265625, -0.11773681640625, -0.11238861083984375, -0.1070404052734375, -0.10169219970703125, -0.096343994140625, -0.09099578857421875, -0.0856475830078125, -0.08029937744140625, -0.074951171875, -0.06960296630859375, -0.0642547607421875, -0.05890655517578125, -0.053558349609375, -0.04821014404296875, -0.0428619384765625, -0.03751373291015625, -0.03216552734375, -0.02681732177734375, -0.0214691162109375, -0.01612091064453125, -0.010772705078125, -0.00542449951171875, -7.62939453125e-05, 0.00527191162109375, 0.0106201171875, 0.01596832275390625, 0.0213165283203125, 0.02666473388671875, 0.032012939453125, 0.03736114501953125, 0.0427093505859375, 0.04805755615234375, 0.05340576171875, 0.05875396728515625, 0.0641021728515625, 0.06945037841796875, 0.074798583984375, 0.08014678955078125, 0.0854949951171875, 0.09084320068359375, 0.09619140625, 0.10153961181640625, 0.1068878173828125, 0.11223602294921875, 0.117584228515625, 0.12293243408203125, 0.1282806396484375, 0.13362884521484375, 0.13897705078125, 0.14432525634765625, 0.1496734619140625, 0.15502166748046875, 0.160369873046875, 0.16571807861328125, 0.1710662841796875, 0.17641448974609375, 0.1817626953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 9.0, 4.0, 11.0, 13.0, 20.0, 24.0, 29.0, 58.0, 85.0, 116.0, 166.0, 120.0, 98.0, 66.0, 54.0, 37.0, 29.0, 19.0, 13.0, 15.0, 4.0, 3.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.248453140258789e-05, -3.15522775053978e-05, -3.06200236082077e-05, -2.968776971101761e-05, -2.8755515813827515e-05, -2.782326191663742e-05, -2.6891008019447327e-05, -2.5958754122257233e-05, -2.502650022506714e-05, -2.4094246327877045e-05, -2.316199243068695e-05, -2.2229738533496857e-05, -2.1297484636306763e-05, -2.036523073911667e-05, -1.9432976841926575e-05, -1.850072294473648e-05, -1.7568469047546387e-05, -1.6636215150356293e-05, -1.57039612531662e-05, -1.4771707355976105e-05, -1.383945345878601e-05, -1.2907199561595917e-05, -1.1974945664405823e-05, -1.1042691767215729e-05, -1.0110437870025635e-05, -9.17818397283554e-06, -8.245930075645447e-06, -7.313676178455353e-06, -6.381422281265259e-06, -5.449168384075165e-06, -4.516914486885071e-06, -3.584660589694977e-06, -2.652406692504883e-06, -1.7201527953147888e-06, -7.878988981246948e-07, 1.4435499906539917e-07, 1.0766088962554932e-06, 2.008862793445587e-06, 2.941116690635681e-06, 3.873370587825775e-06, 4.805624485015869e-06, 5.737878382205963e-06, 6.670132279396057e-06, 7.602386176586151e-06, 8.534640073776245e-06, 9.466893970966339e-06, 1.0399147868156433e-05, 1.1331401765346527e-05, 1.2263655662536621e-05, 1.3195909559726715e-05, 1.4128163456916809e-05, 1.5060417354106903e-05, 1.5992671251296997e-05, 1.692492514848709e-05, 1.7857179045677185e-05, 1.878943294286728e-05, 1.9721686840057373e-05, 2.0653940737247467e-05, 2.158619463443756e-05, 2.2518448531627655e-05, 2.345070242881775e-05, 2.4382956326007843e-05, 2.5315210223197937e-05, 2.624746412038803e-05, 2.7179718017578125e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 8.0, 8.0, 14.0, 15.0, 23.0, 32.0, 51.0, 84.0, 149.0, 328.0, 1174.0, 5718.0, 60304.0, 786295.0, 179703.0, 11739.0, 1875.0, 517.0, 204.0, 107.0, 57.0, 47.0, 23.0, 10.0, 16.0, 7.0, 10.0, 7.0, 7.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.390380859375, -0.3794364929199219, -0.36849212646484375, -0.3575477600097656, -0.3466033935546875, -0.3356590270996094, -0.32471466064453125, -0.3137702941894531, -0.302825927734375, -0.2918815612792969, -0.28093719482421875, -0.2699928283691406, -0.2590484619140625, -0.24810409545898438, -0.23715972900390625, -0.22621536254882812, -0.21527099609375, -0.20432662963867188, -0.19338226318359375, -0.18243789672851562, -0.1714935302734375, -0.16054916381835938, -0.14960479736328125, -0.13866043090820312, -0.127716064453125, -0.11677169799804688, -0.10582733154296875, -0.09488296508789062, -0.0839385986328125, -0.07299423217773438, -0.06204986572265625, -0.051105499267578125, -0.0401611328125, -0.029216766357421875, -0.01827239990234375, -0.007328033447265625, 0.0036163330078125, 0.014560699462890625, 0.02550506591796875, 0.036449432373046875, 0.047393798828125, 0.058338165283203125, 0.06928253173828125, 0.08022689819335938, 0.0911712646484375, 0.10211563110351562, 0.11305999755859375, 0.12400436401367188, 0.13494873046875, 0.14589309692382812, 0.15683746337890625, 0.16778182983398438, 0.1787261962890625, 0.18967056274414062, 0.20061492919921875, 0.21155929565429688, 0.222503662109375, 0.23344802856445312, 0.24439239501953125, 0.2553367614746094, 0.2662811279296875, 0.2772254943847656, 0.28816986083984375, 0.2991142272949219, 0.31005859375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 13.0, 13.0, 25.0, 25.0, 34.0, 53.0, 74.0, 110.0, 124.0, 125.0, 102.0, 76.0, 65.0, 52.0, 29.0, 21.0, 13.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13134765625, -0.1266918182373047, -0.12203598022460938, -0.11738014221191406, -0.11272430419921875, -0.10806846618652344, -0.10341262817382812, -0.09875679016113281, -0.0941009521484375, -0.08944511413574219, -0.08478927612304688, -0.08013343811035156, -0.07547760009765625, -0.07082176208496094, -0.06616592407226562, -0.06151008605957031, -0.056854248046875, -0.05219841003417969, -0.047542572021484375, -0.04288673400878906, -0.03823089599609375, -0.03357505798339844, -0.028919219970703125, -0.024263381958007812, -0.0196075439453125, -0.014951705932617188, -0.010295867919921875, -0.0056400299072265625, -0.00098419189453125, 0.0036716461181640625, 0.008327484130859375, 0.012983322143554688, 0.01763916015625, 0.022294998168945312, 0.026950836181640625, 0.03160667419433594, 0.03626251220703125, 0.04091835021972656, 0.045574188232421875, 0.05023002624511719, 0.0548858642578125, 0.05954170227050781, 0.06419754028320312, 0.06885337829589844, 0.07350921630859375, 0.07816505432128906, 0.08282089233398438, 0.08747673034667969, 0.092132568359375, 0.09678840637207031, 0.10144424438476562, 0.10610008239746094, 0.11075592041015625, 0.11541175842285156, 0.12006759643554688, 0.12472343444824219, 0.1293792724609375, 0.1340351104736328, 0.13869094848632812, 0.14334678649902344, 0.14800262451171875, 0.15265846252441406, 0.15731430053710938, 0.1619701385498047, 0.1666259765625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 11.0, 68.0, 278.0, 428.0, 179.0, 36.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.753924369812012, -4.651325702667236, -4.548727512359619, -4.446128845214844, -4.343530178070068, -4.240931510925293, -4.138333320617676, -4.0357346534729, -3.933135986328125, -3.8305375576019287, -3.7279388904571533, -3.625340461730957, -3.5227417945861816, -3.4201433658599854, -3.317544937133789, -3.2149462699890137, -3.1123478412628174, -3.009749412536621, -2.9071507453918457, -2.8045523166656494, -2.701953649520874, -2.5993552207946777, -2.4967565536499023, -2.394158124923706, -2.2915596961975098, -2.1889612674713135, -2.086362600326538, -1.9837641716003418, -1.8811655044555664, -1.7785670757293701, -1.6759685277938843, -1.5733699798583984, -1.4707715511322021, -1.3681730031967163, -1.2655744552612305, -1.1629760265350342, -1.0603773593902588, -0.9577788710594177, -0.8551803827285767, -0.7525818347930908, -0.649983286857605, -0.5473847389221191, -0.4447862207889557, -0.34218770265579224, -0.2395891547203064, -0.13699060678482056, -0.03439211845397949, 0.06820642948150635, 0.1708049774169922, 0.273403525352478, 0.3760020434856415, 0.47860056161880493, 0.5811991095542908, 0.6837976574897766, 0.7863961458206177, 0.8889946937561035, 0.9915932416915894, 1.0941917896270752, 1.196790337562561, 1.2993888854980469, 1.4019873142242432, 1.5045859813690186, 1.6071844100952148, 1.7097829580307007, 1.8123815059661865]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 2.0, 6.0, 14.0, 22.0, 25.0, 29.0, 32.0, 45.0, 55.0, 59.0, 67.0, 84.0, 71.0, 60.0, 66.0, 59.0, 56.0, 54.0, 39.0, 33.0, 27.0, 15.0, 23.0, 13.0, 8.0, 7.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8294411301612854, -0.7996581196784973, -0.7698750495910645, -0.7400920391082764, -0.7103090286254883, -0.6805259585380554, -0.6507429480552673, -0.6209598779678345, -0.5911768674850464, -0.5613938570022583, -0.5316107869148254, -0.5018277764320374, -0.4720447361469269, -0.4422616958618164, -0.4124786853790283, -0.38269564509391785, -0.3529126048088074, -0.3231295645236969, -0.2933465242385864, -0.26356351375579834, -0.23378047347068787, -0.2039974331855774, -0.1742144078016281, -0.14443138241767883, -0.11464834213256836, -0.08486530929803848, -0.055082276463508606, -0.02529924362897873, 0.0044837892055511475, 0.03426682949066162, 0.0640498548746109, 0.09383288025856018, 0.12361598014831543, 0.1533990204334259, 0.18318204581737518, 0.21296507120132446, 0.24274811148643494, 0.2725311517715454, 0.3023141622543335, 0.33209720253944397, 0.36188024282455444, 0.3916632831096649, 0.4214463233947754, 0.4512293338775635, 0.48101237416267395, 0.5107954144477844, 0.5405784249305725, 0.5703614950180054, 0.6001445055007935, 0.6299275159835815, 0.6597105860710144, 0.6894935965538025, 0.7192766666412354, 0.7490596771240234, 0.7788426876068115, 0.8086256980895996, 0.8384087681770325, 0.8681917786598206, 0.8979748487472534, 0.9277578592300415, 0.9575408697128296, 0.9873239398002625, 1.0171070098876953, 1.0468900203704834, 1.0766730308532715]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 12.0, 26.0, 51.0, 82.0, 168.0, 527.0, 3113.0, 31601.0, 3978354.0, 174098.0, 4535.0, 1035.0, 333.0, 169.0, 64.0, 44.0, 26.0, 10.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.2981986999511719, -0.28560638427734375, -0.2730140686035156, -0.2604217529296875, -0.24782943725585938, -0.23523712158203125, -0.22264480590820312, -0.210052490234375, -0.19746017456054688, -0.18486785888671875, -0.17227554321289062, -0.1596832275390625, -0.14709091186523438, -0.13449859619140625, -0.12190628051757812, -0.10931396484375, -0.09672164916992188, -0.08412933349609375, -0.07153701782226562, -0.0589447021484375, -0.046352386474609375, -0.03376007080078125, -0.021167755126953125, -0.008575439453125, 0.004016876220703125, 0.01660919189453125, 0.029201507568359375, 0.0417938232421875, 0.054386138916015625, 0.06697845458984375, 0.07957077026367188, 0.0921630859375, 0.10475540161132812, 0.11734771728515625, 0.12994003295898438, 0.1425323486328125, 0.15512466430664062, 0.16771697998046875, 0.18030929565429688, 0.192901611328125, 0.20549392700195312, 0.21808624267578125, 0.23067855834960938, 0.2432708740234375, 0.2558631896972656, 0.26845550537109375, 0.2810478210449219, 0.29364013671875, 0.3062324523925781, 0.31882476806640625, 0.3314170837402344, 0.3440093994140625, 0.3566017150878906, 0.36919403076171875, 0.3817863464355469, 0.394378662109375, 0.4069709777832031, 0.41956329345703125, 0.4321556091308594, 0.4447479248046875, 0.4573402404785156, 0.46993255615234375, 0.4825248718261719, 0.4951171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 12.0, 10.0, 17.0, 23.0, 32.0, 62.0, 93.0, 107.0, 137.0, 144.0, 123.0, 93.0, 52.0, 40.0, 27.0, 12.0, 6.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08856201171875, -0.08414745330810547, -0.07973289489746094, -0.0753183364868164, -0.07090377807617188, -0.06648921966552734, -0.06207466125488281, -0.05766010284423828, -0.05324554443359375, -0.04883098602294922, -0.04441642761230469, -0.040001869201660156, -0.035587310791015625, -0.031172752380371094, -0.026758193969726562, -0.02234363555908203, -0.0179290771484375, -0.013514518737792969, -0.009099960327148438, -0.004685401916503906, -0.000270843505859375, 0.004143714904785156, 0.008558273315429688, 0.012972831726074219, 0.01738739013671875, 0.02180194854736328, 0.026216506958007812, 0.030631065368652344, 0.035045623779296875, 0.039460182189941406, 0.04387474060058594, 0.04828929901123047, 0.052703857421875, 0.05711841583251953, 0.06153297424316406, 0.0659475326538086, 0.07036209106445312, 0.07477664947509766, 0.07919120788574219, 0.08360576629638672, 0.08802032470703125, 0.09243488311767578, 0.09684944152832031, 0.10126399993896484, 0.10567855834960938, 0.1100931167602539, 0.11450767517089844, 0.11892223358154297, 0.1233367919921875, 0.12775135040283203, 0.13216590881347656, 0.1365804672241211, 0.14099502563476562, 0.14540958404541016, 0.1498241424560547, 0.15423870086669922, 0.15865325927734375, 0.16306781768798828, 0.1674823760986328, 0.17189693450927734, 0.17631149291992188, 0.1807260513305664, 0.18514060974121094, 0.18955516815185547, 0.1939697265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 3.0, 8.0, 9.0, 11.0, 21.0, 30.0, 44.0, 60.0, 82.0, 112.0, 206.0, 377.0, 641.0, 1441.0, 3959.0, 14831.0, 81786.0, 714980.0, 2744558.0, 546899.0, 65702.0, 12191.0, 3436.0, 1285.0, 624.0, 350.0, 216.0, 112.0, 104.0, 59.0, 37.0, 30.0, 25.0, 14.0, 11.0, 6.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1483154296875, -0.14310073852539062, -0.13788604736328125, -0.13267135620117188, -0.1274566650390625, -0.12224197387695312, -0.11702728271484375, -0.11181259155273438, -0.106597900390625, -0.10138320922851562, -0.09616851806640625, -0.09095382690429688, -0.0857391357421875, -0.08052444458007812, -0.07530975341796875, -0.07009506225585938, -0.06488037109375, -0.059665679931640625, -0.05445098876953125, -0.049236297607421875, -0.0440216064453125, -0.038806915283203125, -0.03359222412109375, -0.028377532958984375, -0.023162841796875, -0.017948150634765625, -0.01273345947265625, -0.007518768310546875, -0.0023040771484375, 0.002910614013671875, 0.00812530517578125, 0.013339996337890625, 0.0185546875, 0.023769378662109375, 0.02898406982421875, 0.034198760986328125, 0.0394134521484375, 0.044628143310546875, 0.04984283447265625, 0.055057525634765625, 0.060272216796875, 0.06548690795898438, 0.07070159912109375, 0.07591629028320312, 0.0811309814453125, 0.08634567260742188, 0.09156036376953125, 0.09677505493164062, 0.10198974609375, 0.10720443725585938, 0.11241912841796875, 0.11763381958007812, 0.1228485107421875, 0.12806320190429688, 0.13327789306640625, 0.13849258422851562, 0.143707275390625, 0.14892196655273438, 0.15413665771484375, 0.15935134887695312, 0.1645660400390625, 0.16978073120117188, 0.17499542236328125, 0.18021011352539062, 0.1854248046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 10.0, 17.0, 21.0, 22.0, 38.0, 37.0, 55.0, 71.0, 93.0, 155.0, 181.0, 246.0, 280.0, 359.0, 403.0, 406.0, 403.0, 296.0, 228.0, 213.0, 142.0, 105.0, 76.0, 62.0, 41.0, 27.0, 19.0, 25.0, 11.0, 12.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11114501953125, -0.10807609558105469, -0.10500717163085938, -0.10193824768066406, -0.09886932373046875, -0.09580039978027344, -0.09273147583007812, -0.08966255187988281, -0.0865936279296875, -0.08352470397949219, -0.08045578002929688, -0.07738685607910156, -0.07431793212890625, -0.07124900817871094, -0.06818008422851562, -0.06511116027832031, -0.062042236328125, -0.05897331237792969, -0.055904388427734375, -0.05283546447753906, -0.04976654052734375, -0.04669761657714844, -0.043628692626953125, -0.04055976867675781, -0.0374908447265625, -0.03442192077636719, -0.031352996826171875, -0.028284072875976562, -0.02521514892578125, -0.022146224975585938, -0.019077301025390625, -0.016008377075195312, -0.012939453125, -0.009870529174804688, -0.006801605224609375, -0.0037326812744140625, -0.00066375732421875, 0.0024051666259765625, 0.005474090576171875, 0.008543014526367188, 0.0116119384765625, 0.014680862426757812, 0.017749786376953125, 0.020818710327148438, 0.02388763427734375, 0.026956558227539062, 0.030025482177734375, 0.03309440612792969, 0.036163330078125, 0.03923225402832031, 0.042301177978515625, 0.04537010192871094, 0.04843902587890625, 0.05150794982910156, 0.054576873779296875, 0.05764579772949219, 0.0607147216796875, 0.06378364562988281, 0.06685256958007812, 0.06992149353027344, 0.07299041748046875, 0.07605934143066406, 0.07912826538085938, 0.08219718933105469, 0.08526611328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 33.0, 131.0, 400.0, 327.0, 100.0, 13.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4440441131591797, -1.3808889389038086, -1.3177337646484375, -1.2545785903930664, -1.1914234161376953, -1.1282682418823242, -1.0651129484176636, -1.0019577741622925, -0.9388025999069214, -0.8756474256515503, -0.8124922513961792, -0.7493370175361633, -0.6861818432807922, -0.6230266690254211, -0.5598714351654053, -0.4967162609100342, -0.4335610866546631, -0.370405912399292, -0.3072507083415985, -0.24409551918506622, -0.18094033002853394, -0.11778515577316284, -0.05462995171546936, 0.008525252342224121, 0.07168042659759521, 0.1348356157541275, 0.1979908049106598, 0.26114600896835327, 0.32430118322372437, 0.38745635747909546, 0.45061156153678894, 0.5137667655944824, 0.5769219398498535, 0.6400771141052246, 0.7032322883605957, 0.7663875222206116, 0.8295426964759827, 0.8926978707313538, 0.9558531045913696, 1.0190082788467407, 1.0821634531021118, 1.145318627357483, 1.208473801612854, 1.271628975868225, 1.3347842693328857, 1.3979394435882568, 1.461094617843628, 1.524249792098999, 1.5874049663543701, 1.6505601406097412, 1.7137153148651123, 1.7768704891204834, 1.8400256633758545, 1.9031808376312256, 1.9663361310958862, 2.029491424560547, 2.092646598815918, 2.155801773071289, 2.21895694732666, 2.2821121215820312, 2.3452672958374023, 2.4084224700927734, 2.4715776443481445, 2.5347328186035156, 2.5978879928588867]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 6.0, 8.0, 10.0, 17.0, 22.0, 24.0, 26.0, 26.0, 25.0, 31.0, 35.0, 46.0, 40.0, 38.0, 35.0, 43.0, 50.0, 42.0, 40.0, 57.0, 46.0, 39.0, 28.0, 34.0, 25.0, 27.0, 30.0, 20.0, 17.0, 18.0, 14.0, 18.0, 8.0, 13.0, 8.0, 6.0, 8.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33290839195251465, -0.32202205061912537, -0.31113573908805847, -0.3002493977546692, -0.2893630862236023, -0.278476744890213, -0.26759040355682373, -0.25670409202575684, -0.24581775069236755, -0.23493142426013947, -0.22404509782791138, -0.2131587564945221, -0.202272430062294, -0.19138610363006592, -0.18049977719783783, -0.16961345076560974, -0.15872712433338165, -0.14784079790115356, -0.13695447146892548, -0.1260681450366974, -0.1151818037033081, -0.10429547727108002, -0.09340915083885193, -0.08252281695604324, -0.07163649052381516, -0.06075016036629677, -0.04986383020877838, -0.03897750377655029, -0.028091173619031906, -0.01720484346151352, -0.006318517029285431, 0.004567816853523254, 0.015454143285751343, 0.02634047344326973, 0.037226803600788116, 0.048113130033016205, 0.05899946019053459, 0.06988579034805298, 0.08077211678028107, 0.09165845066308975, 0.10254477709531784, 0.11343110352754593, 0.12431743741035461, 0.1352037638425827, 0.1460900902748108, 0.15697643160820007, 0.16786274313926697, 0.17874908447265625, 0.18963541090488434, 0.20052173733711243, 0.21140806376934052, 0.2222943902015686, 0.23318073153495789, 0.24406705796718597, 0.25495338439941406, 0.26583972573280334, 0.27672603726387024, 0.2876123785972595, 0.2984986901283264, 0.3093850314617157, 0.3202713429927826, 0.3311576843261719, 0.34204399585723877, 0.35293033719062805, 0.36381667852401733]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 6.0, 13.0, 15.0, 23.0, 27.0, 35.0, 51.0, 70.0, 93.0, 145.0, 233.0, 375.0, 696.0, 1471.0, 3641.0, 11696.0, 55979.0, 409135.0, 476497.0, 67381.0, 13377.0, 3994.0, 1632.0, 787.0, 383.0, 255.0, 165.0, 101.0, 76.0, 56.0, 53.0, 17.0, 11.0, 16.0, 5.0, 7.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.373046875, -0.3617591857910156, -0.35047149658203125, -0.3391838073730469, -0.3278961181640625, -0.3166084289550781, -0.30532073974609375, -0.2940330505371094, -0.282745361328125, -0.2714576721191406, -0.26016998291015625, -0.24888229370117188, -0.2375946044921875, -0.22630691528320312, -0.21501922607421875, -0.20373153686523438, -0.19244384765625, -0.18115615844726562, -0.16986846923828125, -0.15858078002929688, -0.1472930908203125, -0.13600540161132812, -0.12471771240234375, -0.11343002319335938, -0.102142333984375, -0.09085464477539062, -0.07956695556640625, -0.06827926635742188, -0.0569915771484375, -0.045703887939453125, -0.03441619873046875, -0.023128509521484375, -0.0118408203125, -0.000553131103515625, 0.01073455810546875, 0.022022247314453125, 0.0333099365234375, 0.044597625732421875, 0.05588531494140625, 0.06717300415039062, 0.078460693359375, 0.08974838256835938, 0.10103607177734375, 0.11232376098632812, 0.1236114501953125, 0.13489913940429688, 0.14618682861328125, 0.15747451782226562, 0.16876220703125, 0.18004989624023438, 0.19133758544921875, 0.20262527465820312, 0.2139129638671875, 0.22520065307617188, 0.23648834228515625, 0.24777603149414062, 0.259063720703125, 0.2703514099121094, 0.28163909912109375, 0.2929267883300781, 0.3042144775390625, 0.3155021667480469, 0.32678985595703125, 0.3380775451660156, 0.349365234375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 18.0, 22.0, 22.0, 56.0, 78.0, 122.0, 121.0, 158.0, 134.0, 92.0, 71.0, 39.0, 25.0, 14.0, 5.0, 9.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09075927734375, -0.08629131317138672, -0.08182334899902344, -0.07735538482666016, -0.07288742065429688, -0.0684194564819336, -0.06395149230957031, -0.05948352813720703, -0.05501556396484375, -0.05054759979248047, -0.04607963562011719, -0.041611671447753906, -0.037143707275390625, -0.032675743103027344, -0.028207778930664062, -0.02373981475830078, -0.0192718505859375, -0.014803886413574219, -0.010335922241210938, -0.005867958068847656, -0.001399993896484375, 0.0030679702758789062, 0.0075359344482421875, 0.012003898620605469, 0.01647186279296875, 0.02093982696533203, 0.025407791137695312, 0.029875755310058594, 0.034343719482421875, 0.038811683654785156, 0.04327964782714844, 0.04774761199951172, 0.052215576171875, 0.05668354034423828, 0.06115150451660156, 0.06561946868896484, 0.07008743286132812, 0.0745553970336914, 0.07902336120605469, 0.08349132537841797, 0.08795928955078125, 0.09242725372314453, 0.09689521789550781, 0.1013631820678711, 0.10583114624023438, 0.11029911041259766, 0.11476707458496094, 0.11923503875732422, 0.1237030029296875, 0.12817096710205078, 0.13263893127441406, 0.13710689544677734, 0.14157485961914062, 0.1460428237915039, 0.1505107879638672, 0.15497875213623047, 0.15944671630859375, 0.16391468048095703, 0.1683826446533203, 0.1728506088256836, 0.17731857299804688, 0.18178653717041016, 0.18625450134277344, 0.19072246551513672, 0.1951904296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 10.0, 10.0, 21.0, 22.0, 27.0, 41.0, 52.0, 91.0, 149.0, 271.0, 472.0, 1161.0, 3772.0, 18512.0, 109749.0, 501297.0, 339513.0, 58777.0, 10344.0, 2403.0, 869.0, 381.0, 188.0, 115.0, 106.0, 59.0, 31.0, 21.0, 24.0, 16.0, 14.0, 10.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.37744140625, -0.3666038513183594, -0.35576629638671875, -0.3449287414550781, -0.3340911865234375, -0.3232536315917969, -0.31241607666015625, -0.3015785217285156, -0.290740966796875, -0.2799034118652344, -0.26906585693359375, -0.2582283020019531, -0.2473907470703125, -0.23655319213867188, -0.22571563720703125, -0.21487808227539062, -0.20404052734375, -0.19320297241210938, -0.18236541748046875, -0.17152786254882812, -0.1606903076171875, -0.14985275268554688, -0.13901519775390625, -0.12817764282226562, -0.117340087890625, -0.10650253295898438, -0.09566497802734375, -0.08482742309570312, -0.0739898681640625, -0.06315231323242188, -0.05231475830078125, -0.041477203369140625, -0.0306396484375, -0.019802093505859375, -0.00896453857421875, 0.001873016357421875, 0.0127105712890625, 0.023548126220703125, 0.03438568115234375, 0.045223236083984375, 0.056060791015625, 0.06689834594726562, 0.07773590087890625, 0.08857345581054688, 0.0994110107421875, 0.11024856567382812, 0.12108612060546875, 0.13192367553710938, 0.14276123046875, 0.15359878540039062, 0.16443634033203125, 0.17527389526367188, 0.1861114501953125, 0.19694900512695312, 0.20778656005859375, 0.21862411499023438, 0.229461669921875, 0.24029922485351562, 0.25113677978515625, 0.2619743347167969, 0.2728118896484375, 0.2836494445800781, 0.29448699951171875, 0.3053245544433594, 0.316162109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 5.0, 3.0, 7.0, 9.0, 8.0, 12.0, 23.0, 19.0, 24.0, 39.0, 22.0, 34.0, 36.0, 33.0, 40.0, 43.0, 40.0, 55.0, 47.0, 34.0, 48.0, 42.0, 44.0, 35.0, 44.0, 33.0, 26.0, 32.0, 23.0, 26.0, 20.0, 10.0, 16.0, 17.0, 15.0, 12.0, 5.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.17919921875, -0.1738739013671875, -0.168548583984375, -0.1632232666015625, -0.15789794921875, -0.1525726318359375, -0.147247314453125, -0.1419219970703125, -0.1365966796875, -0.1312713623046875, -0.125946044921875, -0.1206207275390625, -0.11529541015625, -0.1099700927734375, -0.104644775390625, -0.0993194580078125, -0.093994140625, -0.0886688232421875, -0.083343505859375, -0.0780181884765625, -0.07269287109375, -0.0673675537109375, -0.062042236328125, -0.0567169189453125, -0.0513916015625, -0.0460662841796875, -0.040740966796875, -0.0354156494140625, -0.03009033203125, -0.0247650146484375, -0.019439697265625, -0.0141143798828125, -0.0087890625, -0.0034637451171875, 0.001861572265625, 0.0071868896484375, 0.01251220703125, 0.0178375244140625, 0.023162841796875, 0.0284881591796875, 0.0338134765625, 0.0391387939453125, 0.044464111328125, 0.0497894287109375, 0.05511474609375, 0.0604400634765625, 0.065765380859375, 0.0710906982421875, 0.076416015625, 0.0817413330078125, 0.087066650390625, 0.0923919677734375, 0.09771728515625, 0.1030426025390625, 0.108367919921875, 0.1136932373046875, 0.1190185546875, 0.1243438720703125, 0.129669189453125, 0.1349945068359375, 0.14031982421875, 0.1456451416015625, 0.150970458984375, 0.1562957763671875, 0.16162109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 11.0, 5.0, 13.0, 27.0, 35.0, 46.0, 83.0, 136.0, 212.0, 453.0, 794.0, 1534.0, 3304.0, 7192.0, 16570.0, 41067.0, 106411.0, 245007.0, 318242.0, 183463.0, 73492.0, 28252.0, 11893.0, 5127.0, 2466.0, 1243.0, 591.0, 349.0, 193.0, 136.0, 69.0, 50.0, 25.0, 23.0, 15.0, 7.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07794189453125, -0.07560157775878906, -0.07326126098632812, -0.07092094421386719, -0.06858062744140625, -0.06624031066894531, -0.06389999389648438, -0.06155967712402344, -0.0592193603515625, -0.05687904357910156, -0.054538726806640625, -0.05219841003417969, -0.04985809326171875, -0.04751777648925781, -0.045177459716796875, -0.04283714294433594, -0.040496826171875, -0.03815650939941406, -0.035816192626953125, -0.03347587585449219, -0.03113555908203125, -0.028795242309570312, -0.026454925537109375, -0.024114608764648438, -0.0217742919921875, -0.019433975219726562, -0.017093658447265625, -0.014753341674804688, -0.01241302490234375, -0.010072708129882812, -0.007732391357421875, -0.0053920745849609375, -0.0030517578125, -0.0007114410400390625, 0.001628875732421875, 0.0039691925048828125, 0.00630950927734375, 0.008649826049804688, 0.010990142822265625, 0.013330459594726562, 0.0156707763671875, 0.018011093139648438, 0.020351409912109375, 0.022691726684570312, 0.02503204345703125, 0.027372360229492188, 0.029712677001953125, 0.03205299377441406, 0.034393310546875, 0.03673362731933594, 0.039073944091796875, 0.04141426086425781, 0.04375457763671875, 0.04609489440917969, 0.048435211181640625, 0.05077552795410156, 0.0531158447265625, 0.05545616149902344, 0.057796478271484375, 0.06013679504394531, 0.06247711181640625, 0.06481742858886719, 0.06715774536132812, 0.06949806213378906, 0.07183837890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 10.0, 2.0, 12.0, 8.0, 17.0, 21.0, 26.0, 25.0, 33.0, 46.0, 47.0, 72.0, 68.0, 81.0, 72.0, 81.0, 75.0, 52.0, 52.0, 31.0, 27.0, 23.0, 17.0, 17.0, 17.0, 10.0, 9.0, 7.0, 6.0, 2.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1026859283447266e-05, -1.0662712156772614e-05, -1.0298565030097961e-05, -9.93441790342331e-06, -9.570270776748657e-06, -9.206123650074005e-06, -8.841976523399353e-06, -8.477829396724701e-06, -8.113682270050049e-06, -7.749535143375397e-06, -7.385388016700745e-06, -7.0212408900260925e-06, -6.6570937633514404e-06, -6.292946636676788e-06, -5.928799510002136e-06, -5.564652383327484e-06, -5.200505256652832e-06, -4.83635812997818e-06, -4.472211003303528e-06, -4.108063876628876e-06, -3.7439167499542236e-06, -3.3797696232795715e-06, -3.0156224966049194e-06, -2.6514753699302673e-06, -2.2873282432556152e-06, -1.923181116580963e-06, -1.559033989906311e-06, -1.194886863231659e-06, -8.307397365570068e-07, -4.6659260988235474e-07, -1.0244548320770264e-07, 2.6170164346694946e-07, 6.258487701416016e-07, 9.899958968162537e-07, 1.3541430234909058e-06, 1.7182901501655579e-06, 2.08243727684021e-06, 2.446584403514862e-06, 2.810731530189514e-06, 3.1748786568641663e-06, 3.5390257835388184e-06, 3.9031729102134705e-06, 4.2673200368881226e-06, 4.631467163562775e-06, 4.995614290237427e-06, 5.359761416912079e-06, 5.723908543586731e-06, 6.088055670261383e-06, 6.452202796936035e-06, 6.816349923610687e-06, 7.180497050285339e-06, 7.5446441769599915e-06, 7.908791303634644e-06, 8.272938430309296e-06, 8.637085556983948e-06, 9.0012326836586e-06, 9.365379810333252e-06, 9.729526937007904e-06, 1.0093674063682556e-05, 1.0457821190357208e-05, 1.082196831703186e-05, 1.1186115443706512e-05, 1.1550262570381165e-05, 1.1914409697055817e-05, 1.2278556823730469e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 13.0, 9.0, 15.0, 24.0, 38.0, 62.0, 85.0, 131.0, 203.0, 361.0, 646.0, 1145.0, 2124.0, 4651.0, 10447.0, 26266.0, 69712.0, 187128.0, 340697.0, 246031.0, 96999.0, 35499.0, 14101.0, 6135.0, 2764.0, 1383.0, 754.0, 403.0, 236.0, 161.0, 97.0, 64.0, 31.0, 23.0, 27.0, 20.0, 15.0, 6.0, 9.0, 5.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0728759765625, -0.07033348083496094, -0.06779098510742188, -0.06524848937988281, -0.06270599365234375, -0.06016349792480469, -0.057621002197265625, -0.05507850646972656, -0.0525360107421875, -0.04999351501464844, -0.047451019287109375, -0.04490852355957031, -0.04236602783203125, -0.03982353210449219, -0.037281036376953125, -0.03473854064941406, -0.032196044921875, -0.029653549194335938, -0.027111053466796875, -0.024568557739257812, -0.02202606201171875, -0.019483566284179688, -0.016941070556640625, -0.014398574829101562, -0.0118560791015625, -0.009313583374023438, -0.006771087646484375, -0.0042285919189453125, -0.00168609619140625, 0.0008563995361328125, 0.003398895263671875, 0.0059413909912109375, 0.00848388671875, 0.011026382446289062, 0.013568878173828125, 0.016111373901367188, 0.01865386962890625, 0.021196365356445312, 0.023738861083984375, 0.026281356811523438, 0.0288238525390625, 0.03136634826660156, 0.033908843994140625, 0.03645133972167969, 0.03899383544921875, 0.04153633117675781, 0.044078826904296875, 0.04662132263183594, 0.049163818359375, 0.05170631408691406, 0.054248809814453125, 0.05679130554199219, 0.05933380126953125, 0.06187629699707031, 0.06441879272460938, 0.06696128845214844, 0.0695037841796875, 0.07204627990722656, 0.07458877563476562, 0.07713127136230469, 0.07967376708984375, 0.08221626281738281, 0.08475875854492188, 0.08730125427246094, 0.08984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 13.0, 8.0, 9.0, 12.0, 12.0, 14.0, 19.0, 28.0, 21.0, 31.0, 56.0, 45.0, 64.0, 62.0, 51.0, 56.0, 59.0, 62.0, 49.0, 54.0, 40.0, 40.0, 40.0, 31.0, 25.0, 15.0, 9.0, 17.0, 18.0, 7.0, 8.0, 5.0, 8.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.0625448226928711, -0.06075859069824219, -0.05897235870361328, -0.057186126708984375, -0.05539989471435547, -0.05361366271972656, -0.051827430725097656, -0.05004119873046875, -0.048254966735839844, -0.04646873474121094, -0.04468250274658203, -0.042896270751953125, -0.04111003875732422, -0.03932380676269531, -0.037537574768066406, -0.0357513427734375, -0.033965110778808594, -0.03217887878417969, -0.03039264678955078, -0.028606414794921875, -0.02682018280029297, -0.025033950805664062, -0.023247718811035156, -0.02146148681640625, -0.019675254821777344, -0.017889022827148438, -0.01610279083251953, -0.014316558837890625, -0.012530326843261719, -0.010744094848632812, -0.008957862854003906, -0.007171630859375, -0.005385398864746094, -0.0035991668701171875, -0.0018129348754882812, -2.6702880859375e-05, 0.0017595291137695312, 0.0035457611083984375, 0.005331993103027344, 0.00711822509765625, 0.008904457092285156, 0.010690689086914062, 0.012476921081542969, 0.014263153076171875, 0.01604938507080078, 0.017835617065429688, 0.019621849060058594, 0.0214080810546875, 0.023194313049316406, 0.024980545043945312, 0.02676677703857422, 0.028553009033203125, 0.03033924102783203, 0.03212547302246094, 0.033911705017089844, 0.03569793701171875, 0.037484169006347656, 0.03927040100097656, 0.04105663299560547, 0.042842864990234375, 0.04462909698486328, 0.04641532897949219, 0.048201560974121094, 0.04998779296875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 43.0, 357.0, 504.0, 93.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.004016399383545, -3.883042097091675, -3.762068033218384, -3.6410937309265137, -3.5201194286346436, -3.3991451263427734, -3.2781710624694824, -3.1571967601776123, -3.036222457885742, -2.915248155593872, -2.794274091720581, -2.673299789428711, -2.552325487136841, -2.4313511848449707, -2.3103771209716797, -2.1894028186798096, -2.0684285163879395, -1.9474543333053589, -1.8264800310134888, -1.7055058479309082, -1.584531545639038, -1.4635573625564575, -1.342583179473877, -1.2216088771820068, -1.1006348133087158, -0.9796605706214905, -0.8586863279342651, -0.7377121448516846, -0.6167378425598145, -0.4957636594772339, -0.37478941679000854, -0.2538151741027832, -0.13284087181091309, -0.011866636574268341, 0.1091075986623764, 0.23008182644844055, 0.3510560691356659, 0.47203028202056885, 0.5930045247077942, 0.7139787673950195, 0.8349530100822449, 0.9559272527694702, 1.0769014358520508, 1.197875738143921, 1.3188499212265015, 1.439824104309082, 1.5607984066009521, 1.6817727088928223, 1.8027468919754028, 1.9237210750579834, 2.0446953773498535, 2.1656696796417236, 2.2866437435150146, 2.4076180458068848, 2.528592348098755, 2.649566650390625, 2.770540714263916, 2.891515016555786, 3.012489080429077, 3.1334633827209473, 3.2544376850128174, 3.3754119873046875, 3.4963860511779785, 3.6173603534698486, 3.7383346557617188]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 13.0, 12.0, 16.0, 15.0, 30.0, 18.0, 35.0, 39.0, 41.0, 44.0, 45.0, 55.0, 56.0, 52.0, 64.0, 51.0, 51.0, 53.0, 56.0, 41.0, 36.0, 38.0, 27.0, 23.0, 15.0, 16.0, 11.0, 9.0, 8.0, 2.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.7837508320808411, -0.7629237771034241, -0.7420967221260071, -0.7212697267532349, -0.7004426717758179, -0.6796156167984009, -0.6587885618209839, -0.6379615068435669, -0.6171344518661499, -0.5963073968887329, -0.5754803419113159, -0.5546533465385437, -0.5338262915611267, -0.5129992365837097, -0.4921721816062927, -0.47134512662887573, -0.4505181312561035, -0.4296910762786865, -0.4088640511035919, -0.3880369961261749, -0.3672099709510803, -0.34638291597366333, -0.32555586099624634, -0.30472880601882935, -0.28390178084373474, -0.26307472586631775, -0.24224770069122314, -0.22142064571380615, -0.20059360563755035, -0.17976656556129456, -0.15893951058387756, -0.13811247050762177, -0.11728537082672119, -0.0964583307504654, -0.075631283223629, -0.0548042394220829, -0.033977195620536804, -0.013150155544281006, 0.007676891982555389, 0.028503939509391785, 0.04933097958564758, 0.07015801966190338, 0.09098506718873978, 0.11181211471557617, 0.13263915479183197, 0.15346619486808777, 0.17429324984550476, 0.19512028992176056, 0.21594732999801636, 0.23677437007427216, 0.25760141015052795, 0.27842846512794495, 0.29925549030303955, 0.32008254528045654, 0.34090960025787354, 0.3617366552352905, 0.38256368041038513, 0.4033907353878021, 0.42421776056289673, 0.4450448155403137, 0.4658718705177307, 0.4866988956928253, 0.5075259208679199, 0.5283529758453369, 0.5491800308227539]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 14.0, 33.0, 54.0, 99.0, 192.0, 416.0, 1143.0, 3229.0, 9828.0, 46373.0, 1173593.0, 2859380.0, 83436.0, 10671.0, 3096.0, 1195.0, 578.0, 305.0, 179.0, 144.0, 90.0, 74.0, 48.0, 25.0, 17.0, 18.0, 12.0, 5.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15703201293945312, -0.15024566650390625, -0.14345932006835938, -0.1366729736328125, -0.12988662719726562, -0.12310028076171875, -0.11631393432617188, -0.109527587890625, -0.10274124145507812, -0.09595489501953125, -0.08916854858398438, -0.0823822021484375, -0.07559585571289062, -0.06880950927734375, -0.062023162841796875, -0.05523681640625, -0.048450469970703125, -0.04166412353515625, -0.034877777099609375, -0.0280914306640625, -0.021305084228515625, -0.01451873779296875, -0.007732391357421875, -0.000946044921875, 0.005840301513671875, 0.01262664794921875, 0.019412994384765625, 0.0261993408203125, 0.032985687255859375, 0.03977203369140625, 0.046558380126953125, 0.0533447265625, 0.060131072998046875, 0.06691741943359375, 0.07370376586914062, 0.0804901123046875, 0.08727645874023438, 0.09406280517578125, 0.10084915161132812, 0.107635498046875, 0.11442184448242188, 0.12120819091796875, 0.12799453735351562, 0.1347808837890625, 0.14156723022460938, 0.14835357666015625, 0.15513992309570312, 0.16192626953125, 0.16871261596679688, 0.17549896240234375, 0.18228530883789062, 0.1890716552734375, 0.19585800170898438, 0.20264434814453125, 0.20943069458007812, 0.216217041015625, 0.22300338745117188, 0.22978973388671875, 0.23657608032226562, 0.2433624267578125, 0.2501487731933594, 0.25693511962890625, 0.2637214660644531, 0.2705078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 6.0, 9.0, 28.0, 26.0, 42.0, 80.0, 113.0, 109.0, 130.0, 134.0, 112.0, 84.0, 52.0, 31.0, 20.0, 12.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0772705078125, -0.07289886474609375, -0.0685272216796875, -0.06415557861328125, -0.059783935546875, -0.05541229248046875, -0.0510406494140625, -0.04666900634765625, -0.04229736328125, -0.03792572021484375, -0.0335540771484375, -0.02918243408203125, -0.024810791015625, -0.02043914794921875, -0.0160675048828125, -0.01169586181640625, -0.00732421875, -0.00295257568359375, 0.0014190673828125, 0.00579071044921875, 0.010162353515625, 0.01453399658203125, 0.0189056396484375, 0.02327728271484375, 0.02764892578125, 0.03202056884765625, 0.0363922119140625, 0.04076385498046875, 0.045135498046875, 0.04950714111328125, 0.0538787841796875, 0.05825042724609375, 0.0626220703125, 0.06699371337890625, 0.0713653564453125, 0.07573699951171875, 0.080108642578125, 0.08448028564453125, 0.0888519287109375, 0.09322357177734375, 0.09759521484375, 0.10196685791015625, 0.1063385009765625, 0.11071014404296875, 0.115081787109375, 0.11945343017578125, 0.1238250732421875, 0.12819671630859375, 0.132568359375, 0.13694000244140625, 0.1413116455078125, 0.14568328857421875, 0.150054931640625, 0.15442657470703125, 0.1587982177734375, 0.16316986083984375, 0.16754150390625, 0.17191314697265625, 0.1762847900390625, 0.18065643310546875, 0.185028076171875, 0.18939971923828125, 0.1937713623046875, 0.19814300537109375, 0.2025146484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 12.0, 10.0, 11.0, 28.0, 21.0, 29.0, 52.0, 73.0, 102.0, 241.0, 472.0, 1287.0, 5757.0, 41387.0, 566595.0, 3230046.0, 314735.0, 27281.0, 4104.0, 1038.0, 388.0, 223.0, 121.0, 81.0, 50.0, 42.0, 29.0, 14.0, 11.0, 11.0, 5.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.22705078125, -0.22004318237304688, -0.21303558349609375, -0.20602798461914062, -0.1990203857421875, -0.19201278686523438, -0.18500518798828125, -0.17799758911132812, -0.170989990234375, -0.16398239135742188, -0.15697479248046875, -0.14996719360351562, -0.1429595947265625, -0.13595199584960938, -0.12894439697265625, -0.12193679809570312, -0.11492919921875, -0.10792160034179688, -0.10091400146484375, -0.09390640258789062, -0.0868988037109375, -0.07989120483398438, -0.07288360595703125, -0.06587600708007812, -0.058868408203125, -0.051860809326171875, -0.04485321044921875, -0.037845611572265625, -0.0308380126953125, -0.023830413818359375, -0.01682281494140625, -0.009815216064453125, -0.0028076171875, 0.004199981689453125, 0.01120758056640625, 0.018215179443359375, 0.0252227783203125, 0.032230377197265625, 0.03923797607421875, 0.046245574951171875, 0.053253173828125, 0.060260772705078125, 0.06726837158203125, 0.07427597045898438, 0.0812835693359375, 0.08829116821289062, 0.09529876708984375, 0.10230636596679688, 0.10931396484375, 0.11632156372070312, 0.12332916259765625, 0.13033676147460938, 0.1373443603515625, 0.14435195922851562, 0.15135955810546875, 0.15836715698242188, 0.165374755859375, 0.17238235473632812, 0.17938995361328125, 0.18639755249023438, 0.1934051513671875, 0.20041275024414062, 0.20742034912109375, 0.21442794799804688, 0.221435546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 14.0, 10.0, 22.0, 17.0, 32.0, 46.0, 55.0, 76.0, 115.0, 167.0, 205.0, 280.0, 389.0, 540.0, 496.0, 449.0, 340.0, 244.0, 172.0, 117.0, 88.0, 58.0, 43.0, 30.0, 22.0, 11.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11712646484375, -0.11379051208496094, -0.11045455932617188, -0.10711860656738281, -0.10378265380859375, -0.10044670104980469, -0.09711074829101562, -0.09377479553222656, -0.0904388427734375, -0.08710289001464844, -0.08376693725585938, -0.08043098449707031, -0.07709503173828125, -0.07375907897949219, -0.07042312622070312, -0.06708717346191406, -0.063751220703125, -0.06041526794433594, -0.057079315185546875, -0.05374336242675781, -0.05040740966796875, -0.04707145690917969, -0.043735504150390625, -0.04039955139160156, -0.0370635986328125, -0.03372764587402344, -0.030391693115234375, -0.027055740356445312, -0.02371978759765625, -0.020383834838867188, -0.017047882080078125, -0.013711929321289062, -0.0103759765625, -0.0070400238037109375, -0.003704071044921875, -0.0003681182861328125, 0.00296783447265625, 0.0063037872314453125, 0.009639739990234375, 0.012975692749023438, 0.0163116455078125, 0.019647598266601562, 0.022983551025390625, 0.026319503784179688, 0.02965545654296875, 0.03299140930175781, 0.036327362060546875, 0.03966331481933594, 0.042999267578125, 0.04633522033691406, 0.049671173095703125, 0.05300712585449219, 0.05634307861328125, 0.05967903137207031, 0.06301498413085938, 0.06635093688964844, 0.0696868896484375, 0.07302284240722656, 0.07635879516601562, 0.07969474792480469, 0.08303070068359375, 0.08636665344238281, 0.08970260620117188, 0.09303855895996094, 0.09637451171875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 9.0, 33.0, 93.0, 195.0, 256.0, 219.0, 122.0, 57.0, 16.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2261666059494019, -1.187685251235962, -1.1492037773132324, -1.1107224225997925, -1.0722410678863525, -1.033759593963623, -0.9952782392501831, -0.9567968249320984, -0.9183154106140137, -0.879833996295929, -0.8413525819778442, -0.8028712272644043, -0.7643898129463196, -0.7259083986282349, -0.6874270439147949, -0.6489456295967102, -0.6104642152786255, -0.5719828009605408, -0.533501386642456, -0.4950200319290161, -0.4565386176109314, -0.4180572032928467, -0.37957581877708435, -0.341094434261322, -0.3026130199432373, -0.2641316056251526, -0.22565022110939026, -0.18716882169246674, -0.1486874222755432, -0.11020602285861969, -0.07172462344169617, -0.03324323892593384, 0.00523829460144043, 0.04371969401836395, 0.08220109343528748, 0.120682492852211, 0.15916389226913452, 0.19764529168605804, 0.23612669110298157, 0.2746080756187439, 0.3130894899368286, 0.35157090425491333, 0.39005228877067566, 0.428533673286438, 0.4670150876045227, 0.5054965019226074, 0.5439778566360474, 0.5824592709541321, 0.6209406852722168, 0.6594220995903015, 0.6979035139083862, 0.7363848686218262, 0.7748662829399109, 0.8133476972579956, 0.8518290519714355, 0.8903104662895203, 0.928791880607605, 0.9672732949256897, 1.0057547092437744, 1.0442360639572144, 1.0827174186706543, 1.1211988925933838, 1.1596802473068237, 1.1981616020202637, 1.2366430759429932]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 9.0, 15.0, 8.0, 16.0, 20.0, 18.0, 32.0, 29.0, 30.0, 42.0, 42.0, 35.0, 52.0, 49.0, 42.0, 41.0, 48.0, 44.0, 40.0, 42.0, 37.0, 47.0, 35.0, 30.0, 19.0, 19.0, 19.0, 18.0, 15.0, 14.0, 12.0, 12.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3093070983886719, -0.2985919117927551, -0.287876695394516, -0.27716150879859924, -0.2664463222026825, -0.25573110580444336, -0.2450159192085266, -0.23430071771144867, -0.22358551621437073, -0.21287031471729279, -0.20215512812137604, -0.1914399266242981, -0.18072472512722015, -0.1700095236301422, -0.15929433703422546, -0.14857913553714752, -0.13786394894123077, -0.12714874744415283, -0.11643355339765549, -0.10571835935115814, -0.0950031578540802, -0.08428796380758286, -0.07357276976108551, -0.06285756826400757, -0.05214237421751022, -0.04142717644572258, -0.030711980536580086, -0.01999678462743759, -0.009281586855649948, 0.0014336109161376953, 0.01214880496263504, 0.022864006459712982, 0.03357920050621033, 0.04429439827799797, 0.055009596049785614, 0.06572479009628296, 0.0764399915933609, 0.08715518563985825, 0.09787037968635559, 0.10858558118343353, 0.11930077522993088, 0.13001596927642822, 0.14073117077350616, 0.1514463722705841, 0.16216155886650085, 0.1728767603635788, 0.18359196186065674, 0.1943071484565735, 0.20502234995365143, 0.21573755145072937, 0.22645273804664612, 0.23716793954372406, 0.247883141040802, 0.25859832763671875, 0.2693135142326355, 0.28002873063087463, 0.2907439172267914, 0.30145910382270813, 0.31217432022094727, 0.322889506816864, 0.33360469341278076, 0.3443199098110199, 0.35503509640693665, 0.3657503128051758, 0.37646549940109253]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 11.0, 9.0, 17.0, 13.0, 25.0, 22.0, 37.0, 36.0, 66.0, 69.0, 120.0, 169.0, 238.0, 301.0, 555.0, 1005.0, 2229.0, 6175.0, 21780.0, 99264.0, 474266.0, 350124.0, 67401.0, 15609.0, 4646.0, 1879.0, 893.0, 491.0, 288.0, 218.0, 154.0, 94.0, 91.0, 61.0, 41.0, 42.0, 25.0, 19.0, 14.0, 14.0, 11.0, 8.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28271484375, -0.2735595703125, -0.264404296875, -0.2552490234375, -0.24609375, -0.2369384765625, -0.227783203125, -0.2186279296875, -0.20947265625, -0.2003173828125, -0.191162109375, -0.1820068359375, -0.1728515625, -0.1636962890625, -0.154541015625, -0.1453857421875, -0.13623046875, -0.1270751953125, -0.117919921875, -0.1087646484375, -0.099609375, -0.0904541015625, -0.081298828125, -0.0721435546875, -0.06298828125, -0.0538330078125, -0.044677734375, -0.0355224609375, -0.0263671875, -0.0172119140625, -0.008056640625, 0.0010986328125, 0.01025390625, 0.0194091796875, 0.028564453125, 0.0377197265625, 0.046875, 0.0560302734375, 0.065185546875, 0.0743408203125, 0.08349609375, 0.0926513671875, 0.101806640625, 0.1109619140625, 0.1201171875, 0.1292724609375, 0.138427734375, 0.1475830078125, 0.15673828125, 0.1658935546875, 0.175048828125, 0.1842041015625, 0.193359375, 0.2025146484375, 0.211669921875, 0.2208251953125, 0.22998046875, 0.2391357421875, 0.248291015625, 0.2574462890625, 0.2666015625, 0.2757568359375, 0.284912109375, 0.2940673828125, 0.30322265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 8.0, 16.0, 19.0, 39.0, 58.0, 92.0, 104.0, 124.0, 115.0, 134.0, 100.0, 80.0, 38.0, 32.0, 20.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06597900390625, -0.06169414520263672, -0.05740928649902344, -0.053124427795410156, -0.048839569091796875, -0.044554710388183594, -0.04026985168457031, -0.03598499298095703, -0.03170013427734375, -0.02741527557373047, -0.023130416870117188, -0.018845558166503906, -0.014560699462890625, -0.010275840759277344, -0.0059909820556640625, -0.0017061233520507812, 0.0025787353515625, 0.006863594055175781, 0.011148452758789062, 0.015433311462402344, 0.019718170166015625, 0.024003028869628906, 0.028287887573242188, 0.03257274627685547, 0.03685760498046875, 0.04114246368408203, 0.04542732238769531, 0.049712181091308594, 0.053997039794921875, 0.058281898498535156, 0.06256675720214844, 0.06685161590576172, 0.071136474609375, 0.07542133331298828, 0.07970619201660156, 0.08399105072021484, 0.08827590942382812, 0.0925607681274414, 0.09684562683105469, 0.10113048553466797, 0.10541534423828125, 0.10970020294189453, 0.11398506164550781, 0.1182699203491211, 0.12255477905273438, 0.12683963775634766, 0.13112449645996094, 0.13540935516357422, 0.1396942138671875, 0.14397907257080078, 0.14826393127441406, 0.15254878997802734, 0.15683364868164062, 0.1611185073852539, 0.1654033660888672, 0.16968822479248047, 0.17397308349609375, 0.17825794219970703, 0.1825428009033203, 0.1868276596069336, 0.19111251831054688, 0.19539737701416016, 0.19968223571777344, 0.20396709442138672, 0.208251953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 14.0, 13.0, 10.0, 20.0, 28.0, 45.0, 54.0, 85.0, 163.0, 318.0, 614.0, 1283.0, 2821.0, 6644.0, 14733.0, 33626.0, 77522.0, 175133.0, 301757.0, 236427.0, 110328.0, 48714.0, 21112.0, 9239.0, 4200.0, 1867.0, 827.0, 394.0, 204.0, 110.0, 73.0, 50.0, 29.0, 21.0, 18.0, 12.0, 13.0, 11.0, 5.0, 9.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.156005859375, -0.15108680725097656, -0.14616775512695312, -0.1412487030029297, -0.13632965087890625, -0.1314105987548828, -0.12649154663085938, -0.12157249450683594, -0.1166534423828125, -0.11173439025878906, -0.10681533813476562, -0.10189628601074219, -0.09697723388671875, -0.09205818176269531, -0.08713912963867188, -0.08222007751464844, -0.077301025390625, -0.07238197326660156, -0.06746292114257812, -0.06254386901855469, -0.05762481689453125, -0.05270576477050781, -0.047786712646484375, -0.04286766052246094, -0.0379486083984375, -0.03302955627441406, -0.028110504150390625, -0.023191452026367188, -0.01827239990234375, -0.013353347778320312, -0.008434295654296875, -0.0035152435302734375, 0.00140380859375, 0.0063228607177734375, 0.011241912841796875, 0.016160964965820312, 0.02108001708984375, 0.025999069213867188, 0.030918121337890625, 0.03583717346191406, 0.0407562255859375, 0.04567527770996094, 0.050594329833984375, 0.05551338195800781, 0.06043243408203125, 0.06535148620605469, 0.07027053833007812, 0.07518959045410156, 0.080108642578125, 0.08502769470214844, 0.08994674682617188, 0.09486579895019531, 0.09978485107421875, 0.10470390319824219, 0.10962295532226562, 0.11454200744628906, 0.1194610595703125, 0.12438011169433594, 0.12929916381835938, 0.1342182159423828, 0.13913726806640625, 0.1440563201904297, 0.14897537231445312, 0.15389442443847656, 0.1588134765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 7.0, 8.0, 14.0, 8.0, 10.0, 15.0, 17.0, 21.0, 18.0, 22.0, 20.0, 28.0, 30.0, 30.0, 31.0, 36.0, 35.0, 35.0, 34.0, 37.0, 53.0, 52.0, 38.0, 46.0, 35.0, 27.0, 36.0, 27.0, 30.0, 28.0, 24.0, 18.0, 24.0, 25.0, 14.0, 14.0, 11.0, 10.0, 8.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1485595703125, -0.14398574829101562, -0.13941192626953125, -0.13483810424804688, -0.1302642822265625, -0.12569046020507812, -0.12111663818359375, -0.11654281616210938, -0.111968994140625, -0.10739517211914062, -0.10282135009765625, -0.09824752807617188, -0.0936737060546875, -0.08909988403320312, -0.08452606201171875, -0.07995223999023438, -0.07537841796875, -0.07080459594726562, -0.06623077392578125, -0.061656951904296875, -0.0570831298828125, -0.052509307861328125, -0.04793548583984375, -0.043361663818359375, -0.038787841796875, -0.034214019775390625, -0.02964019775390625, -0.025066375732421875, -0.0204925537109375, -0.015918731689453125, -0.01134490966796875, -0.006771087646484375, -0.002197265625, 0.002376556396484375, 0.00695037841796875, 0.011524200439453125, 0.0160980224609375, 0.020671844482421875, 0.02524566650390625, 0.029819488525390625, 0.034393310546875, 0.038967132568359375, 0.04354095458984375, 0.048114776611328125, 0.0526885986328125, 0.057262420654296875, 0.06183624267578125, 0.06641006469726562, 0.07098388671875, 0.07555770874023438, 0.08013153076171875, 0.08470535278320312, 0.0892791748046875, 0.09385299682617188, 0.09842681884765625, 0.10300064086914062, 0.107574462890625, 0.11214828491210938, 0.11672210693359375, 0.12129592895507812, 0.1258697509765625, 0.13044357299804688, 0.13501739501953125, 0.13959121704101562, 0.1441650390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 9.0, 5.0, 14.0, 15.0, 26.0, 45.0, 52.0, 90.0, 124.0, 193.0, 298.0, 477.0, 797.0, 1338.0, 2209.0, 3813.0, 6872.0, 12364.0, 22535.0, 42138.0, 75914.0, 130672.0, 189900.0, 202611.0, 151155.0, 91252.0, 50881.0, 27751.0, 15182.0, 8377.0, 4614.0, 2644.0, 1586.0, 1010.0, 609.0, 380.0, 197.0, 145.0, 83.0, 59.0, 41.0, 27.0, 18.0, 13.0, 14.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.03803300857543945, -0.036728858947753906, -0.03542470932006836, -0.03412055969238281, -0.032816410064697266, -0.03151226043701172, -0.030208110809326172, -0.028903961181640625, -0.027599811553955078, -0.02629566192626953, -0.024991512298583984, -0.023687362670898438, -0.02238321304321289, -0.021079063415527344, -0.019774913787841797, -0.01847076416015625, -0.017166614532470703, -0.015862464904785156, -0.01455831527709961, -0.013254165649414062, -0.011950016021728516, -0.010645866394042969, -0.009341716766357422, -0.008037567138671875, -0.006733417510986328, -0.005429267883300781, -0.004125118255615234, -0.0028209686279296875, -0.0015168190002441406, -0.00021266937255859375, 0.0010914802551269531, 0.0023956298828125, 0.003699779510498047, 0.005003929138183594, 0.006308078765869141, 0.0076122283935546875, 0.008916378021240234, 0.010220527648925781, 0.011524677276611328, 0.012828826904296875, 0.014132976531982422, 0.015437126159667969, 0.016741275787353516, 0.018045425415039062, 0.01934957504272461, 0.020653724670410156, 0.021957874298095703, 0.02326202392578125, 0.024566173553466797, 0.025870323181152344, 0.02717447280883789, 0.028478622436523438, 0.029782772064208984, 0.03108692169189453, 0.03239107131958008, 0.033695220947265625, 0.03499937057495117, 0.03630352020263672, 0.037607669830322266, 0.03891181945800781, 0.04021596908569336, 0.041520118713378906, 0.04282426834106445, 0.04412841796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 4.0, 2.0, 7.0, 11.0, 13.0, 13.0, 14.0, 16.0, 30.0, 42.0, 30.0, 37.0, 48.0, 71.0, 94.0, 106.0, 88.0, 82.0, 55.0, 51.0, 32.0, 34.0, 21.0, 12.0, 20.0, 12.0, 17.0, 5.0, 6.0, 6.0, 4.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0311603546142578e-05, -9.922310709953308e-06, -9.533017873764038e-06, -9.143725037574768e-06, -8.754432201385498e-06, -8.365139365196228e-06, -7.975846529006958e-06, -7.586553692817688e-06, -7.197260856628418e-06, -6.807968020439148e-06, -6.418675184249878e-06, -6.029382348060608e-06, -5.640089511871338e-06, -5.250796675682068e-06, -4.861503839492798e-06, -4.472211003303528e-06, -4.082918167114258e-06, -3.693625330924988e-06, -3.3043324947357178e-06, -2.9150396585464478e-06, -2.5257468223571777e-06, -2.1364539861679077e-06, -1.7471611499786377e-06, -1.3578683137893677e-06, -9.685754776000977e-07, -5.792826414108276e-07, -1.8998980522155762e-07, 1.993030309677124e-07, 5.885958671569824e-07, 9.778887033462524e-07, 1.3671815395355225e-06, 1.7564743757247925e-06, 2.1457672119140625e-06, 2.5350600481033325e-06, 2.9243528842926025e-06, 3.3136457204818726e-06, 3.7029385566711426e-06, 4.092231392860413e-06, 4.481524229049683e-06, 4.870817065238953e-06, 5.260109901428223e-06, 5.649402737617493e-06, 6.038695573806763e-06, 6.427988409996033e-06, 6.817281246185303e-06, 7.206574082374573e-06, 7.595866918563843e-06, 7.985159754753113e-06, 8.374452590942383e-06, 8.763745427131653e-06, 9.153038263320923e-06, 9.542331099510193e-06, 9.931623935699463e-06, 1.0320916771888733e-05, 1.0710209608078003e-05, 1.1099502444267273e-05, 1.1488795280456543e-05, 1.1878088116645813e-05, 1.2267380952835083e-05, 1.2656673789024353e-05, 1.3045966625213623e-05, 1.3435259461402893e-05, 1.3824552297592163e-05, 1.4213845133781433e-05, 1.4603137969970703e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 6.0, 10.0, 8.0, 11.0, 22.0, 40.0, 57.0, 93.0, 164.0, 275.0, 458.0, 737.0, 1391.0, 2565.0, 4519.0, 8424.0, 16059.0, 29954.0, 56291.0, 101819.0, 168137.0, 215763.0, 184466.0, 116313.0, 65387.0, 35174.0, 18725.0, 9743.0, 5262.0, 2886.0, 1667.0, 945.0, 445.0, 294.0, 186.0, 100.0, 59.0, 29.0, 25.0, 10.0, 8.0, 10.0, 7.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03961181640625, -0.03835916519165039, -0.03710651397705078, -0.03585386276245117, -0.03460121154785156, -0.03334856033325195, -0.032095909118652344, -0.030843257904052734, -0.029590606689453125, -0.028337955474853516, -0.027085304260253906, -0.025832653045654297, -0.024580001831054688, -0.023327350616455078, -0.02207469940185547, -0.02082204818725586, -0.01956939697265625, -0.01831674575805664, -0.01706409454345703, -0.015811443328857422, -0.014558792114257812, -0.013306140899658203, -0.012053489685058594, -0.010800838470458984, -0.009548187255859375, -0.008295536041259766, -0.007042884826660156, -0.005790233612060547, -0.0045375823974609375, -0.003284931182861328, -0.0020322799682617188, -0.0007796287536621094, 0.0004730224609375, 0.0017256736755371094, 0.0029783248901367188, 0.004230976104736328, 0.0054836273193359375, 0.006736278533935547, 0.007988929748535156, 0.009241580963134766, 0.010494232177734375, 0.011746883392333984, 0.012999534606933594, 0.014252185821533203, 0.015504837036132812, 0.016757488250732422, 0.01801013946533203, 0.01926279067993164, 0.02051544189453125, 0.02176809310913086, 0.02302074432373047, 0.024273395538330078, 0.025526046752929688, 0.026778697967529297, 0.028031349182128906, 0.029284000396728516, 0.030536651611328125, 0.031789302825927734, 0.033041954040527344, 0.03429460525512695, 0.03554725646972656, 0.03679990768432617, 0.03805255889892578, 0.03930521011352539, 0.040557861328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 13.0, 16.0, 18.0, 18.0, 23.0, 20.0, 35.0, 35.0, 49.0, 36.0, 48.0, 44.0, 70.0, 64.0, 61.0, 56.0, 49.0, 39.0, 44.0, 42.0, 38.0, 18.0, 20.0, 27.0, 17.0, 16.0, 11.0, 13.0, 10.0, 3.0, 3.0, 2.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.040924072265625, -0.03970623016357422, -0.03848838806152344, -0.037270545959472656, -0.036052703857421875, -0.034834861755371094, -0.03361701965332031, -0.03239917755126953, -0.03118133544921875, -0.02996349334716797, -0.028745651245117188, -0.027527809143066406, -0.026309967041015625, -0.025092124938964844, -0.023874282836914062, -0.02265644073486328, -0.0214385986328125, -0.02022075653076172, -0.019002914428710938, -0.017785072326660156, -0.016567230224609375, -0.015349388122558594, -0.014131546020507812, -0.012913703918457031, -0.01169586181640625, -0.010478019714355469, -0.009260177612304688, -0.008042335510253906, -0.006824493408203125, -0.005606651306152344, -0.0043888092041015625, -0.0031709671020507812, -0.001953125, -0.0007352828979492188, 0.0004825592041015625, 0.0017004013061523438, 0.002918243408203125, 0.004136085510253906, 0.0053539276123046875, 0.006571769714355469, 0.00778961181640625, 0.009007453918457031, 0.010225296020507812, 0.011443138122558594, 0.012660980224609375, 0.013878822326660156, 0.015096664428710938, 0.01631450653076172, 0.0175323486328125, 0.01875019073486328, 0.019968032836914062, 0.021185874938964844, 0.022403717041015625, 0.023621559143066406, 0.024839401245117188, 0.02605724334716797, 0.02727508544921875, 0.02849292755126953, 0.029710769653320312, 0.030928611755371094, 0.032146453857421875, 0.033364295959472656, 0.03458213806152344, 0.03579998016357422, 0.037017822265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 53.0, 159.0, 280.0, 319.0, 130.0, 43.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.192502021789551, -2.1280267238616943, -2.063551187515259, -1.9990758895874023, -1.934600591659546, -1.8701251745224, -1.805649757385254, -1.7411744594573975, -1.6766990423202515, -1.6122236251831055, -1.547748327255249, -1.483272910118103, -1.418797492980957, -1.3543221950531006, -1.2898467779159546, -1.2253713607788086, -1.1608960628509521, -1.0964206457138062, -1.0319453477859497, -0.9674699306488037, -0.9029945731163025, -0.8385192155838013, -0.7740437984466553, -0.709568440914154, -0.6450930833816528, -0.5806177258491516, -0.5161423683166504, -0.4516669511795044, -0.3871915936470032, -0.32271623611450195, -0.25824084877967834, -0.19376546144485474, -0.12928986549377441, -0.064814493060112, -0.00033912062644958496, 0.06413625180721283, 0.12861162424087524, 0.19308698177337646, 0.2575623691082001, 0.3220377564430237, 0.3865131139755249, 0.4509884715080261, 0.5154638290405273, 0.5799392461776733, 0.6444146037101746, 0.7088899612426758, 0.7733653783798218, 0.837840735912323, 0.9023160934448242, 0.9667914509773254, 1.0312668085098267, 1.0957422256469727, 1.160217523574829, 1.224692940711975, 1.289168357849121, 1.3536436557769775, 1.4181190729141235, 1.4825944900512695, 1.547069787979126, 1.611545205116272, 1.676020622253418, 1.7404959201812744, 1.8049713373184204, 1.8694467544555664, 1.9339220523834229]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 3.0, 10.0, 10.0, 7.0, 11.0, 12.0, 18.0, 20.0, 28.0, 29.0, 26.0, 35.0, 44.0, 36.0, 30.0, 49.0, 51.0, 54.0, 43.0, 46.0, 39.0, 65.0, 43.0, 35.0, 35.0, 44.0, 18.0, 28.0, 24.0, 24.0, 24.0, 14.0, 13.0, 6.0, 9.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6124780774116516, -0.5935313701629639, -0.5745847225189209, -0.5556380152702332, -0.5366913080215454, -0.5177446007728577, -0.4987979233264923, -0.47985124588012695, -0.4609045386314392, -0.44195783138275146, -0.4230111539363861, -0.40406447649002075, -0.385117769241333, -0.36617106199264526, -0.3472243845462799, -0.32827770709991455, -0.3093309998512268, -0.29038429260253906, -0.2714376151561737, -0.25249093770980835, -0.2335442304611206, -0.21459753811359406, -0.1956508457660675, -0.17670415341854095, -0.1577574610710144, -0.13881076872348785, -0.1198640763759613, -0.10091738402843475, -0.0819706916809082, -0.06302399933338165, -0.0440773069858551, -0.025130614638328552, -0.006183981895446777, 0.012762710452079773, 0.03170940279960632, 0.050656095147132874, 0.06960278749465942, 0.08854947984218597, 0.10749617218971252, 0.12644286453723907, 0.14538955688476562, 0.16433624923229218, 0.18328294157981873, 0.20222963392734528, 0.22117632627487183, 0.24012301862239838, 0.2590697109699249, 0.2780163884162903, 0.296963095664978, 0.31590980291366577, 0.33485648036003113, 0.3538031578063965, 0.37274986505508423, 0.391696572303772, 0.41064324975013733, 0.4295899271965027, 0.44853663444519043, 0.4674833416938782, 0.48643001914024353, 0.5053766965866089, 0.5243234038352966, 0.5432701110839844, 0.5622167587280273, 0.5811634659767151, 0.6001101732254028]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 14.0, 10.0, 24.0, 35.0, 53.0, 111.0, 183.0, 428.0, 1108.0, 3002.0, 10149.0, 47117.0, 785882.0, 3193055.0, 128576.0, 16213.0, 4401.0, 1731.0, 836.0, 482.0, 299.0, 171.0, 125.0, 88.0, 51.0, 30.0, 29.0, 21.0, 21.0, 14.0, 8.0, 7.0, 0.0, 1.0, 4.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166015625, -0.15855026245117188, -0.15108489990234375, -0.14361953735351562, -0.1361541748046875, -0.12868881225585938, -0.12122344970703125, -0.11375808715820312, -0.106292724609375, -0.09882736206054688, -0.09136199951171875, -0.08389663696289062, -0.0764312744140625, -0.06896591186523438, -0.06150054931640625, -0.054035186767578125, -0.04656982421875, -0.039104461669921875, -0.03163909912109375, -0.024173736572265625, -0.0167083740234375, -0.009243011474609375, -0.00177764892578125, 0.005687713623046875, 0.013153076171875, 0.020618438720703125, 0.02808380126953125, 0.035549163818359375, 0.0430145263671875, 0.050479888916015625, 0.05794525146484375, 0.06541061401367188, 0.0728759765625, 0.08034133911132812, 0.08780670166015625, 0.09527206420898438, 0.1027374267578125, 0.11020278930664062, 0.11766815185546875, 0.12513351440429688, 0.132598876953125, 0.14006423950195312, 0.14752960205078125, 0.15499496459960938, 0.1624603271484375, 0.16992568969726562, 0.17739105224609375, 0.18485641479492188, 0.19232177734375, 0.19978713989257812, 0.20725250244140625, 0.21471786499023438, 0.2221832275390625, 0.22964859008789062, 0.23711395263671875, 0.24457931518554688, 0.252044677734375, 0.2595100402832031, 0.26697540283203125, 0.2744407653808594, 0.2819061279296875, 0.2893714904785156, 0.29683685302734375, 0.3043022155761719, 0.311767578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 10.0, 5.0, 22.0, 36.0, 46.0, 66.0, 95.0, 90.0, 111.0, 125.0, 105.0, 106.0, 61.0, 45.0, 32.0, 16.0, 16.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06329345703125, -0.05913066864013672, -0.05496788024902344, -0.050805091857910156, -0.046642303466796875, -0.042479515075683594, -0.03831672668457031, -0.03415393829345703, -0.02999114990234375, -0.02582836151123047, -0.021665573120117188, -0.017502784729003906, -0.013339996337890625, -0.009177207946777344, -0.0050144195556640625, -0.0008516311645507812, 0.0033111572265625, 0.007473945617675781, 0.011636734008789062, 0.015799522399902344, 0.019962310791015625, 0.024125099182128906, 0.028287887573242188, 0.03245067596435547, 0.03661346435546875, 0.04077625274658203, 0.04493904113769531, 0.049101829528808594, 0.053264617919921875, 0.057427406311035156, 0.06159019470214844, 0.06575298309326172, 0.069915771484375, 0.07407855987548828, 0.07824134826660156, 0.08240413665771484, 0.08656692504882812, 0.0907297134399414, 0.09489250183105469, 0.09905529022216797, 0.10321807861328125, 0.10738086700439453, 0.11154365539550781, 0.1157064437866211, 0.11986923217773438, 0.12403202056884766, 0.12819480895996094, 0.13235759735107422, 0.1365203857421875, 0.14068317413330078, 0.14484596252441406, 0.14900875091552734, 0.15317153930664062, 0.1573343276977539, 0.1614971160888672, 0.16565990447998047, 0.16982269287109375, 0.17398548126220703, 0.1781482696533203, 0.1823110580444336, 0.18647384643554688, 0.19063663482666016, 0.19479942321777344, 0.19896221160888672, 0.203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 8.0, 17.0, 13.0, 21.0, 28.0, 43.0, 57.0, 123.0, 179.0, 367.0, 991.0, 3211.0, 15148.0, 125987.0, 1916748.0, 1980006.0, 130343.0, 15855.0, 3220.0, 957.0, 400.0, 172.0, 113.0, 78.0, 62.0, 38.0, 23.0, 15.0, 19.0, 5.0, 8.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2003173828125, -0.19364166259765625, -0.1869659423828125, -0.18029022216796875, -0.173614501953125, -0.16693878173828125, -0.1602630615234375, -0.15358734130859375, -0.14691162109375, -0.14023590087890625, -0.1335601806640625, -0.12688446044921875, -0.120208740234375, -0.11353302001953125, -0.1068572998046875, -0.10018157958984375, -0.093505859375, -0.08683013916015625, -0.0801544189453125, -0.07347869873046875, -0.066802978515625, -0.06012725830078125, -0.0534515380859375, -0.04677581787109375, -0.04010009765625, -0.03342437744140625, -0.0267486572265625, -0.02007293701171875, -0.013397216796875, -0.00672149658203125, -4.57763671875e-05, 0.00662994384765625, 0.0133056640625, 0.01998138427734375, 0.0266571044921875, 0.03333282470703125, 0.040008544921875, 0.04668426513671875, 0.0533599853515625, 0.06003570556640625, 0.06671142578125, 0.07338714599609375, 0.0800628662109375, 0.08673858642578125, 0.093414306640625, 0.10009002685546875, 0.1067657470703125, 0.11344146728515625, 0.1201171875, 0.12679290771484375, 0.1334686279296875, 0.14014434814453125, 0.146820068359375, 0.15349578857421875, 0.1601715087890625, 0.16684722900390625, 0.17352294921875, 0.18019866943359375, 0.1868743896484375, 0.19355010986328125, 0.200225830078125, 0.20690155029296875, 0.2135772705078125, 0.22025299072265625, 0.2269287109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 9.0, 11.0, 13.0, 18.0, 27.0, 38.0, 46.0, 76.0, 88.0, 145.0, 222.0, 282.0, 401.0, 494.0, 564.0, 484.0, 365.0, 248.0, 170.0, 113.0, 93.0, 56.0, 30.0, 20.0, 18.0, 14.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129638671875, -0.12615394592285156, -0.12266921997070312, -0.11918449401855469, -0.11569976806640625, -0.11221504211425781, -0.10873031616210938, -0.10524559020996094, -0.1017608642578125, -0.09827613830566406, -0.09479141235351562, -0.09130668640136719, -0.08782196044921875, -0.08433723449707031, -0.08085250854492188, -0.07736778259277344, -0.073883056640625, -0.07039833068847656, -0.06691360473632812, -0.06342887878417969, -0.05994415283203125, -0.05645942687988281, -0.052974700927734375, -0.04948997497558594, -0.0460052490234375, -0.04252052307128906, -0.039035797119140625, -0.03555107116699219, -0.03206634521484375, -0.028581619262695312, -0.025096893310546875, -0.021612167358398438, -0.01812744140625, -0.014642715454101562, -0.011157989501953125, -0.0076732635498046875, -0.00418853759765625, -0.0007038116455078125, 0.002780914306640625, 0.0062656402587890625, 0.0097503662109375, 0.013235092163085938, 0.016719818115234375, 0.020204544067382812, 0.02368927001953125, 0.027173995971679688, 0.030658721923828125, 0.03414344787597656, 0.037628173828125, 0.04111289978027344, 0.044597625732421875, 0.04808235168457031, 0.05156707763671875, 0.05505180358886719, 0.058536529541015625, 0.06202125549316406, 0.0655059814453125, 0.06899070739746094, 0.07247543334960938, 0.07596015930175781, 0.07944488525390625, 0.08292961120605469, 0.08641433715820312, 0.08989906311035156, 0.0933837890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 20.0, 38.0, 95.0, 168.0, 215.0, 212.0, 127.0, 80.0, 24.0, 13.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359740138053894, -1.3247348070144653, -1.2897295951843262, -1.2547242641448975, -1.2197190523147583, -1.1847137212753296, -1.1497085094451904, -1.1147031784057617, -1.079697847366333, -1.0446925163269043, -1.0096873044967651, -0.9746820330619812, -0.9396767616271973, -0.9046714305877686, -0.8696661591529846, -0.8346608877182007, -0.7996556758880615, -0.7646504044532776, -0.7296451330184937, -0.6946398615837097, -0.6596345901489258, -0.6246292591094971, -0.5896239876747131, -0.5546187162399292, -0.5196134448051453, -0.48460817337036133, -0.4496029019355774, -0.41459760069847107, -0.37959232926368713, -0.3445870578289032, -0.3095817565917969, -0.27457648515701294, -0.23957133293151855, -0.20456606149673462, -0.1695607751607895, -0.13455548882484436, -0.09955021739006042, -0.06454494595527649, -0.02953965961933136, 0.0054656267166137695, 0.040470898151397705, 0.07547617703676224, 0.11048145592212677, 0.1454867422580719, 0.18049201369285583, 0.21549728512763977, 0.2505025863647461, 0.28550785779953003, 0.32051312923431396, 0.3555184006690979, 0.39052367210388184, 0.42552897334098816, 0.4605342447757721, 0.49553951621055603, 0.5305448174476624, 0.5655500888824463, 0.6005553603172302, 0.6355606317520142, 0.6705659031867981, 0.705571174621582, 0.7405765056610107, 0.7755817174911499, 0.8105870485305786, 0.8455923199653625, 0.8805975914001465]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 11.0, 8.0, 11.0, 18.0, 15.0, 20.0, 23.0, 28.0, 22.0, 25.0, 38.0, 40.0, 60.0, 53.0, 52.0, 48.0, 50.0, 49.0, 40.0, 49.0, 40.0, 40.0, 30.0, 32.0, 41.0, 24.0, 28.0, 17.0, 22.0, 13.0, 11.0, 15.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3257802128791809, -0.31436967849731445, -0.3029591143131256, -0.29154857993125916, -0.2801380157470703, -0.26872748136520386, -0.2573169469833374, -0.24590638279914856, -0.2344958335161209, -0.22308528423309326, -0.2116747349500656, -0.20026418566703796, -0.1888536512851715, -0.17744308710098267, -0.1660325527191162, -0.15462200343608856, -0.1432114541530609, -0.13180090487003326, -0.12039035558700562, -0.10897981375455856, -0.09756926447153091, -0.08615871518850327, -0.07474817335605621, -0.06333762407302856, -0.051927074790000916, -0.04051652550697327, -0.029105979949235916, -0.017695434391498566, -0.006284885108470917, 0.005125664174556732, 0.016536206007003784, 0.027946755290031433, 0.03935730457305908, 0.05076785385608673, 0.06217839941382408, 0.07358894497156143, 0.08499949425458908, 0.09641004353761673, 0.10782058537006378, 0.11923113465309143, 0.13064168393611908, 0.14205223321914673, 0.15346278250217438, 0.16487333178520203, 0.17628386616706848, 0.18769443035125732, 0.19910496473312378, 0.21051551401615143, 0.22192606329917908, 0.23333661258220673, 0.24474716186523438, 0.25615769624710083, 0.2675682604312897, 0.27897879481315613, 0.29038935899734497, 0.3017998933792114, 0.3132104277610779, 0.32462096214294434, 0.3360315263271332, 0.34744206070899963, 0.3588526248931885, 0.37026315927505493, 0.3816736936569214, 0.39308425784111023, 0.4044948220252991]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 17.0, 15.0, 21.0, 32.0, 41.0, 66.0, 95.0, 128.0, 170.0, 258.0, 408.0, 709.0, 1400.0, 3532.0, 10784.0, 45827.0, 246227.0, 546444.0, 150271.0, 29143.0, 7573.0, 2608.0, 1108.0, 602.0, 356.0, 212.0, 138.0, 100.0, 77.0, 48.0, 39.0, 21.0, 21.0, 18.0, 9.0, 8.0, 10.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.470458984375, -0.45676422119140625, -0.4430694580078125, -0.42937469482421875, -0.415679931640625, -0.40198516845703125, -0.3882904052734375, -0.37459564208984375, -0.36090087890625, -0.34720611572265625, -0.3335113525390625, -0.31981658935546875, -0.306121826171875, -0.29242706298828125, -0.2787322998046875, -0.26503753662109375, -0.2513427734375, -0.23764801025390625, -0.2239532470703125, -0.21025848388671875, -0.196563720703125, -0.18286895751953125, -0.1691741943359375, -0.15547943115234375, -0.14178466796875, -0.12808990478515625, -0.1143951416015625, -0.10070037841796875, -0.087005615234375, -0.07331085205078125, -0.0596160888671875, -0.04592132568359375, -0.0322265625, -0.01853179931640625, -0.0048370361328125, 0.00885772705078125, 0.022552490234375, 0.03624725341796875, 0.0499420166015625, 0.06363677978515625, 0.07733154296875, 0.09102630615234375, 0.1047210693359375, 0.11841583251953125, 0.132110595703125, 0.14580535888671875, 0.1595001220703125, 0.17319488525390625, 0.1868896484375, 0.20058441162109375, 0.2142791748046875, 0.22797393798828125, 0.241668701171875, 0.25536346435546875, 0.2690582275390625, 0.28275299072265625, 0.29644775390625, 0.31014251708984375, 0.3238372802734375, 0.33753204345703125, 0.351226806640625, 0.36492156982421875, 0.3786163330078125, 0.39231109619140625, 0.406005859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 7.0, 10.0, 22.0, 30.0, 59.0, 77.0, 105.0, 87.0, 127.0, 129.0, 121.0, 80.0, 56.0, 31.0, 31.0, 7.0, 11.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0634765625, -0.059200286865234375, -0.05492401123046875, -0.050647735595703125, -0.0463714599609375, -0.042095184326171875, -0.03781890869140625, -0.033542633056640625, -0.029266357421875, -0.024990081787109375, -0.02071380615234375, -0.016437530517578125, -0.0121612548828125, -0.007884979248046875, -0.00360870361328125, 0.000667572021484375, 0.00494384765625, 0.009220123291015625, 0.01349639892578125, 0.017772674560546875, 0.0220489501953125, 0.026325225830078125, 0.03060150146484375, 0.034877777099609375, 0.039154052734375, 0.043430328369140625, 0.04770660400390625, 0.051982879638671875, 0.0562591552734375, 0.060535430908203125, 0.06481170654296875, 0.06908798217773438, 0.0733642578125, 0.07764053344726562, 0.08191680908203125, 0.08619308471679688, 0.0904693603515625, 0.09474563598632812, 0.09902191162109375, 0.10329818725585938, 0.107574462890625, 0.11185073852539062, 0.11612701416015625, 0.12040328979492188, 0.1246795654296875, 0.12895584106445312, 0.13323211669921875, 0.13750839233398438, 0.14178466796875, 0.14606094360351562, 0.15033721923828125, 0.15461349487304688, 0.1588897705078125, 0.16316604614257812, 0.16744232177734375, 0.17171859741210938, 0.175994873046875, 0.18027114868164062, 0.18454742431640625, 0.18882369995117188, 0.1930999755859375, 0.19737625122070312, 0.20165252685546875, 0.20592880249023438, 0.210205078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 13.0, 9.0, 10.0, 23.0, 21.0, 27.0, 40.0, 53.0, 103.0, 136.0, 250.0, 408.0, 695.0, 1255.0, 2365.0, 4827.0, 9957.0, 21860.0, 48510.0, 105215.0, 199007.0, 262620.0, 197652.0, 103702.0, 47756.0, 21872.0, 9970.0, 4841.0, 2402.0, 1170.0, 675.0, 408.0, 265.0, 131.0, 91.0, 72.0, 51.0, 20.0, 19.0, 21.0, 15.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.1976318359375, -0.19190216064453125, -0.1861724853515625, -0.18044281005859375, -0.174713134765625, -0.16898345947265625, -0.1632537841796875, -0.15752410888671875, -0.15179443359375, -0.14606475830078125, -0.1403350830078125, -0.13460540771484375, -0.128875732421875, -0.12314605712890625, -0.1174163818359375, -0.11168670654296875, -0.10595703125, -0.10022735595703125, -0.0944976806640625, -0.08876800537109375, -0.083038330078125, -0.07730865478515625, -0.0715789794921875, -0.06584930419921875, -0.06011962890625, -0.05438995361328125, -0.0486602783203125, -0.04293060302734375, -0.037200927734375, -0.03147125244140625, -0.0257415771484375, -0.02001190185546875, -0.0142822265625, -0.00855255126953125, -0.0028228759765625, 0.00290679931640625, 0.008636474609375, 0.01436614990234375, 0.0200958251953125, 0.02582550048828125, 0.03155517578125, 0.03728485107421875, 0.0430145263671875, 0.04874420166015625, 0.054473876953125, 0.06020355224609375, 0.0659332275390625, 0.07166290283203125, 0.077392578125, 0.08312225341796875, 0.0888519287109375, 0.09458160400390625, 0.100311279296875, 0.10604095458984375, 0.1117706298828125, 0.11750030517578125, 0.12322998046875, 0.12895965576171875, 0.1346893310546875, 0.14041900634765625, 0.146148681640625, 0.15187835693359375, 0.1576080322265625, 0.16333770751953125, 0.1690673828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 9.0, 10.0, 10.0, 17.0, 15.0, 22.0, 31.0, 22.0, 32.0, 42.0, 27.0, 39.0, 52.0, 45.0, 67.0, 49.0, 50.0, 52.0, 38.0, 53.0, 37.0, 47.0, 29.0, 30.0, 30.0, 26.0, 23.0, 18.0, 16.0, 18.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1910400390625, -0.1848888397216797, -0.17873764038085938, -0.17258644104003906, -0.16643524169921875, -0.16028404235839844, -0.15413284301757812, -0.1479816436767578, -0.1418304443359375, -0.1356792449951172, -0.12952804565429688, -0.12337684631347656, -0.11722564697265625, -0.11107444763183594, -0.10492324829101562, -0.09877204895019531, -0.092620849609375, -0.08646965026855469, -0.08031845092773438, -0.07416725158691406, -0.06801605224609375, -0.06186485290527344, -0.055713653564453125, -0.04956245422363281, -0.0434112548828125, -0.03726005554199219, -0.031108856201171875, -0.024957656860351562, -0.01880645751953125, -0.012655258178710938, -0.006504058837890625, -0.0003528594970703125, 0.00579833984375, 0.011949539184570312, 0.018100738525390625, 0.024251937866210938, 0.03040313720703125, 0.03655433654785156, 0.042705535888671875, 0.04885673522949219, 0.0550079345703125, 0.06115913391113281, 0.06731033325195312, 0.07346153259277344, 0.07961273193359375, 0.08576393127441406, 0.09191513061523438, 0.09806632995605469, 0.104217529296875, 0.11036872863769531, 0.11651992797851562, 0.12267112731933594, 0.12882232666015625, 0.13497352600097656, 0.14112472534179688, 0.1472759246826172, 0.1534271240234375, 0.1595783233642578, 0.16572952270507812, 0.17188072204589844, 0.17803192138671875, 0.18418312072753906, 0.19033432006835938, 0.1964855194091797, 0.20263671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 6.0, 7.0, 17.0, 22.0, 21.0, 45.0, 54.0, 89.0, 98.0, 147.0, 236.0, 323.0, 435.0, 605.0, 894.0, 1389.0, 2141.0, 3483.0, 5842.0, 10647.0, 22104.0, 48792.0, 113417.0, 231069.0, 282487.0, 175111.0, 78045.0, 34140.0, 15938.0, 8212.0, 4519.0, 2777.0, 1702.0, 1162.0, 805.0, 502.0, 362.0, 278.0, 162.0, 138.0, 91.0, 60.0, 66.0, 37.0, 19.0, 19.0, 14.0, 9.0, 6.0, 4.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.07822704315185547, -0.07564353942871094, -0.0730600357055664, -0.07047653198242188, -0.06789302825927734, -0.06530952453613281, -0.06272602081298828, -0.06014251708984375, -0.05755901336669922, -0.05497550964355469, -0.052392005920410156, -0.049808502197265625, -0.047224998474121094, -0.04464149475097656, -0.04205799102783203, -0.0394744873046875, -0.03689098358154297, -0.03430747985839844, -0.031723976135253906, -0.029140472412109375, -0.026556968688964844, -0.023973464965820312, -0.02138996124267578, -0.01880645751953125, -0.01622295379638672, -0.013639450073242188, -0.011055946350097656, -0.008472442626953125, -0.005888938903808594, -0.0033054351806640625, -0.0007219314575195312, 0.001861572265625, 0.004445075988769531, 0.0070285797119140625, 0.009612083435058594, 0.012195587158203125, 0.014779090881347656, 0.017362594604492188, 0.01994609832763672, 0.02252960205078125, 0.02511310577392578, 0.027696609497070312, 0.030280113220214844, 0.032863616943359375, 0.035447120666503906, 0.03803062438964844, 0.04061412811279297, 0.0431976318359375, 0.04578113555908203, 0.04836463928222656, 0.050948143005371094, 0.053531646728515625, 0.056115150451660156, 0.05869865417480469, 0.06128215789794922, 0.06386566162109375, 0.06644916534423828, 0.06903266906738281, 0.07161617279052734, 0.07419967651367188, 0.0767831802368164, 0.07936668395996094, 0.08195018768310547, 0.08453369140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 5.0, 8.0, 9.0, 12.0, 14.0, 17.0, 23.0, 59.0, 67.0, 87.0, 110.0, 129.0, 130.0, 88.0, 79.0, 44.0, 38.0, 20.0, 14.0, 10.0, 9.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.378225326538086e-05, -2.2814609110355377e-05, -2.1846964955329895e-05, -2.0879320800304413e-05, -1.991167664527893e-05, -1.894403249025345e-05, -1.7976388335227966e-05, -1.7008744180202484e-05, -1.6041100025177002e-05, -1.507345587015152e-05, -1.4105811715126038e-05, -1.3138167560100555e-05, -1.2170523405075073e-05, -1.1202879250049591e-05, -1.0235235095024109e-05, -9.267590939998627e-06, -8.299946784973145e-06, -7.332302629947662e-06, -6.36465847492218e-06, -5.397014319896698e-06, -4.429370164871216e-06, -3.4617260098457336e-06, -2.4940818548202515e-06, -1.5264376997947693e-06, -5.587935447692871e-07, 4.0885061025619507e-07, 1.3764947652816772e-06, 2.3441389203071594e-06, 3.3117830753326416e-06, 4.279427230358124e-06, 5.247071385383606e-06, 6.214715540409088e-06, 7.18235969543457e-06, 8.150003850460052e-06, 9.117648005485535e-06, 1.0085292160511017e-05, 1.1052936315536499e-05, 1.2020580470561981e-05, 1.2988224625587463e-05, 1.3955868780612946e-05, 1.4923512935638428e-05, 1.589115709066391e-05, 1.6858801245689392e-05, 1.7826445400714874e-05, 1.8794089555740356e-05, 1.976173371076584e-05, 2.072937786579132e-05, 2.1697022020816803e-05, 2.2664666175842285e-05, 2.3632310330867767e-05, 2.459995448589325e-05, 2.556759864091873e-05, 2.6535242795944214e-05, 2.7502886950969696e-05, 2.8470531105995178e-05, 2.943817526102066e-05, 3.0405819416046143e-05, 3.1373463571071625e-05, 3.234110772609711e-05, 3.330875188112259e-05, 3.427639603614807e-05, 3.5244040191173553e-05, 3.6211684346199036e-05, 3.717932850122452e-05, 3.814697265625e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 11.0, 12.0, 24.0, 48.0, 95.0, 124.0, 209.0, 320.0, 581.0, 955.0, 1605.0, 2834.0, 5888.0, 12766.0, 34427.0, 118932.0, 365098.0, 341716.0, 107196.0, 31662.0, 11933.0, 5464.0, 2831.0, 1551.0, 935.0, 486.0, 314.0, 194.0, 116.0, 65.0, 55.0, 36.0, 26.0, 11.0, 6.0, 10.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.1267690658569336, -0.12292289733886719, -0.11907672882080078, -0.11523056030273438, -0.11138439178466797, -0.10753822326660156, -0.10369205474853516, -0.09984588623046875, -0.09599971771240234, -0.09215354919433594, -0.08830738067626953, -0.08446121215820312, -0.08061504364013672, -0.07676887512207031, -0.0729227066040039, -0.0690765380859375, -0.0652303695678711, -0.06138420104980469, -0.05753803253173828, -0.053691864013671875, -0.04984569549560547, -0.04599952697753906, -0.042153358459472656, -0.03830718994140625, -0.034461021423339844, -0.030614852905273438, -0.02676868438720703, -0.022922515869140625, -0.01907634735107422, -0.015230178833007812, -0.011384010314941406, -0.007537841796875, -0.0036916732788085938, 0.0001544952392578125, 0.004000663757324219, 0.007846832275390625, 0.011693000793457031, 0.015539169311523438, 0.019385337829589844, 0.02323150634765625, 0.027077674865722656, 0.030923843383789062, 0.03477001190185547, 0.038616180419921875, 0.04246234893798828, 0.04630851745605469, 0.050154685974121094, 0.0540008544921875, 0.057847023010253906, 0.06169319152832031, 0.06553936004638672, 0.06938552856445312, 0.07323169708251953, 0.07707786560058594, 0.08092403411865234, 0.08477020263671875, 0.08861637115478516, 0.09246253967285156, 0.09630870819091797, 0.10015487670898438, 0.10400104522705078, 0.10784721374511719, 0.1116933822631836, 0.11553955078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 7.0, 5.0, 15.0, 21.0, 30.0, 43.0, 49.0, 51.0, 65.0, 83.0, 93.0, 99.0, 105.0, 72.0, 58.0, 48.0, 33.0, 28.0, 12.0, 22.0, 19.0, 6.0, 10.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0870361328125, -0.08404731750488281, -0.08105850219726562, -0.07806968688964844, -0.07508087158203125, -0.07209205627441406, -0.06910324096679688, -0.06611442565917969, -0.0631256103515625, -0.06013679504394531, -0.057147979736328125, -0.05415916442871094, -0.05117034912109375, -0.04818153381347656, -0.045192718505859375, -0.04220390319824219, -0.039215087890625, -0.03622627258300781, -0.033237457275390625, -0.030248641967773438, -0.02725982666015625, -0.024271011352539062, -0.021282196044921875, -0.018293380737304688, -0.0153045654296875, -0.012315750122070312, -0.009326934814453125, -0.0063381195068359375, -0.00334930419921875, -0.0003604888916015625, 0.002628326416015625, 0.0056171417236328125, 0.00860595703125, 0.011594772338867188, 0.014583587646484375, 0.017572402954101562, 0.02056121826171875, 0.023550033569335938, 0.026538848876953125, 0.029527664184570312, 0.0325164794921875, 0.03550529479980469, 0.038494110107421875, 0.04148292541503906, 0.04447174072265625, 0.04746055603027344, 0.050449371337890625, 0.05343818664550781, 0.056427001953125, 0.05941581726074219, 0.062404632568359375, 0.06539344787597656, 0.06838226318359375, 0.07137107849121094, 0.07435989379882812, 0.07734870910644531, 0.0803375244140625, 0.08332633972167969, 0.08631515502929688, 0.08930397033691406, 0.09229278564453125, 0.09528160095214844, 0.09827041625976562, 0.10125923156738281, 0.104248046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 47.0, 176.0, 383.0, 281.0, 101.0, 19.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.578874111175537, -2.454348087310791, -2.329821825027466, -2.2052958011627197, -2.0807695388793945, -1.9562435150146484, -1.8317172527313232, -1.7071912288665771, -1.582664966583252, -1.4581388235092163, -1.3336126804351807, -1.209086537361145, -1.0845603942871094, -0.9600343108177185, -0.8355081677436829, -0.7109820246696472, -0.5864559412002563, -0.4619297981262207, -0.33740365505218506, -0.2128775417804718, -0.08835139870643616, 0.0361747145652771, 0.16070085763931274, 0.2852270007133484, 0.40975314378738403, 0.5342792868614197, 0.6588054299354553, 0.7833315134048462, 0.9078576564788818, 1.0323837995529175, 1.1569099426269531, 1.2814360857009888, 1.4059622287750244, 1.53048837184906, 1.6550145149230957, 1.7795406579971313, 1.904066801071167, 2.028592824935913, 2.1531190872192383, 2.2776451110839844, 2.4021713733673096, 2.5266973972320557, 2.651223659515381, 2.775749683380127, 2.900275945663452, 3.0248019695281982, 3.1493282318115234, 3.2738542556762695, 3.3983802795410156, 3.5229063034057617, 3.647432565689087, 3.771958589553833, 3.896484851837158, 4.021010875701904, 4.14553689956665, 4.270063400268555, 4.394589424133301, 4.519115447998047, 4.643641471862793, 4.768167972564697, 4.892693996429443, 5.0172200202941895, 5.1417460441589355, 5.26627254486084, 5.390798568725586]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 4.0, 5.0, 11.0, 3.0, 7.0, 13.0, 10.0, 19.0, 15.0, 16.0, 22.0, 24.0, 35.0, 36.0, 26.0, 33.0, 37.0, 49.0, 35.0, 40.0, 42.0, 35.0, 33.0, 33.0, 43.0, 40.0, 38.0, 35.0, 40.0, 19.0, 33.0, 16.0, 26.0, 12.0, 21.0, 17.0, 11.0, 19.0, 10.0, 4.0, 9.0, 8.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6638127565383911, -0.6432740688323975, -0.6227354407310486, -0.6021967530250549, -0.5816580653190613, -0.5611194372177124, -0.5405807495117188, -0.5200420618057251, -0.4995034337043762, -0.47896477580070496, -0.4584260880947113, -0.43788743019104004, -0.4173487722873688, -0.3968101143836975, -0.37627142667770386, -0.3557327687740326, -0.33519408106803894, -0.3146554231643677, -0.294116735458374, -0.27357807755470276, -0.2530394196510315, -0.23250074684619904, -0.21196207404136658, -0.1914234161376953, -0.17088474333286285, -0.1503460705280304, -0.12980741262435913, -0.10926873981952667, -0.08873007446527481, -0.06819140911102295, -0.04765273630619049, -0.027114078402519226, -0.006575405597686768, 0.013963261619210243, 0.034501928836107254, 0.055040597915649414, 0.07557926326990128, 0.09611792862415314, 0.1166566014289856, 0.13719525933265686, 0.15773393213748932, 0.17827260494232178, 0.19881126284599304, 0.2193499356508255, 0.23988860845565796, 0.2604272663593292, 0.2809659242630005, 0.30150461196899414, 0.3220432698726654, 0.34258192777633667, 0.3631206154823303, 0.3836592733860016, 0.40419793128967285, 0.4247366189956665, 0.44527527689933777, 0.46581393480300903, 0.4863526225090027, 0.5068913102149963, 0.5274299383163452, 0.5479686260223389, 0.5685073137283325, 0.5890459418296814, 0.609584629535675, 0.6301232576370239, 0.6506619453430176]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 28.0, 53.0, 132.0, 342.0, 1169.0, 5426.0, 37566.0, 1196452.0, 2884109.0, 59241.0, 6830.0, 1591.0, 626.0, 309.0, 174.0, 89.0, 52.0, 29.0, 19.0, 16.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25732421875, -0.24665069580078125, -0.2359771728515625, -0.22530364990234375, -0.214630126953125, -0.20395660400390625, -0.1932830810546875, -0.18260955810546875, -0.17193603515625, -0.16126251220703125, -0.1505889892578125, -0.13991546630859375, -0.129241943359375, -0.11856842041015625, -0.1078948974609375, -0.09722137451171875, -0.0865478515625, -0.07587432861328125, -0.0652008056640625, -0.05452728271484375, -0.043853759765625, -0.03318023681640625, -0.0225067138671875, -0.01183319091796875, -0.00115966796875, 0.00951385498046875, 0.0201873779296875, 0.03086090087890625, 0.041534423828125, 0.05220794677734375, 0.0628814697265625, 0.07355499267578125, 0.084228515625, 0.09490203857421875, 0.1055755615234375, 0.11624908447265625, 0.126922607421875, 0.13759613037109375, 0.1482696533203125, 0.15894317626953125, 0.16961669921875, 0.18029022216796875, 0.1909637451171875, 0.20163726806640625, 0.212310791015625, 0.22298431396484375, 0.2336578369140625, 0.24433135986328125, 0.2550048828125, 0.26567840576171875, 0.2763519287109375, 0.28702545166015625, 0.297698974609375, 0.30837249755859375, 0.3190460205078125, 0.32971954345703125, 0.34039306640625, 0.35106658935546875, 0.3617401123046875, 0.37241363525390625, 0.383087158203125, 0.39376068115234375, 0.4044342041015625, 0.41510772705078125, 0.42578125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 8.0, 22.0, 32.0, 37.0, 49.0, 75.0, 90.0, 117.0, 101.0, 115.0, 96.0, 71.0, 70.0, 38.0, 24.0, 19.0, 19.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.078125, -0.07344627380371094, -0.06876754760742188, -0.06408882141113281, -0.05941009521484375, -0.05473136901855469, -0.050052642822265625, -0.04537391662597656, -0.0406951904296875, -0.03601646423339844, -0.031337738037109375, -0.026659011840820312, -0.02198028564453125, -0.017301559448242188, -0.012622833251953125, -0.007944107055664062, -0.003265380859375, 0.0014133453369140625, 0.006092071533203125, 0.010770797729492188, 0.01544952392578125, 0.020128250122070312, 0.024806976318359375, 0.029485702514648438, 0.0341644287109375, 0.03884315490722656, 0.043521881103515625, 0.04820060729980469, 0.05287933349609375, 0.05755805969238281, 0.062236785888671875, 0.06691551208496094, 0.07159423828125, 0.07627296447753906, 0.08095169067382812, 0.08563041687011719, 0.09030914306640625, 0.09498786926269531, 0.09966659545898438, 0.10434532165527344, 0.1090240478515625, 0.11370277404785156, 0.11838150024414062, 0.12306022644042969, 0.12773895263671875, 0.1324176788330078, 0.13709640502929688, 0.14177513122558594, 0.146453857421875, 0.15113258361816406, 0.15581130981445312, 0.1604900360107422, 0.16516876220703125, 0.1698474884033203, 0.17452621459960938, 0.17920494079589844, 0.1838836669921875, 0.18856239318847656, 0.19324111938476562, 0.1979198455810547, 0.20259857177734375, 0.2072772979736328, 0.21195602416992188, 0.21663475036621094, 0.2213134765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 15.0, 35.0, 45.0, 64.0, 167.0, 283.0, 560.0, 1231.0, 3868.0, 15229.0, 92389.0, 1102564.0, 2728909.0, 211440.0, 27939.0, 6139.0, 1912.0, 752.0, 324.0, 157.0, 91.0, 63.0, 29.0, 21.0, 16.0, 13.0, 5.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.323974609375, -0.31647300720214844, -0.3089714050292969, -0.3014698028564453, -0.29396820068359375, -0.2864665985107422, -0.2789649963378906, -0.27146339416503906, -0.2639617919921875, -0.25646018981933594, -0.24895858764648438, -0.2414569854736328, -0.23395538330078125, -0.2264537811279297, -0.21895217895507812, -0.21145057678222656, -0.203948974609375, -0.19644737243652344, -0.18894577026367188, -0.1814441680908203, -0.17394256591796875, -0.1664409637451172, -0.15893936157226562, -0.15143775939941406, -0.1439361572265625, -0.13643455505371094, -0.12893295288085938, -0.12143135070800781, -0.11392974853515625, -0.10642814636230469, -0.09892654418945312, -0.09142494201660156, -0.08392333984375, -0.07642173767089844, -0.06892013549804688, -0.06141853332519531, -0.05391693115234375, -0.04641532897949219, -0.038913726806640625, -0.03141212463378906, -0.0239105224609375, -0.016408920288085938, -0.008907318115234375, -0.0014057159423828125, 0.00609588623046875, 0.013597488403320312, 0.021099090576171875, 0.028600692749023438, 0.036102294921875, 0.04360389709472656, 0.051105499267578125, 0.05860710144042969, 0.06610870361328125, 0.07361030578613281, 0.08111190795898438, 0.08861351013183594, 0.0961151123046875, 0.10361671447753906, 0.11111831665039062, 0.11861991882324219, 0.12612152099609375, 0.1336231231689453, 0.14112472534179688, 0.14862632751464844, 0.1561279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 15.0, 29.0, 42.0, 60.0, 110.0, 175.0, 221.0, 356.0, 566.0, 753.0, 623.0, 409.0, 233.0, 194.0, 101.0, 42.0, 45.0, 33.0, 9.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12398910522460938, -0.11894989013671875, -0.11391067504882812, -0.1088714599609375, -0.10383224487304688, -0.09879302978515625, -0.09375381469726562, -0.088714599609375, -0.08367538452148438, -0.07863616943359375, -0.07359695434570312, -0.0685577392578125, -0.06351852416992188, -0.05847930908203125, -0.053440093994140625, -0.04840087890625, -0.043361663818359375, -0.03832244873046875, -0.033283233642578125, -0.0282440185546875, -0.023204803466796875, -0.01816558837890625, -0.013126373291015625, -0.008087158203125, -0.003047943115234375, 0.00199127197265625, 0.007030487060546875, 0.0120697021484375, 0.017108917236328125, 0.02214813232421875, 0.027187347412109375, 0.0322265625, 0.037265777587890625, 0.04230499267578125, 0.047344207763671875, 0.0523834228515625, 0.057422637939453125, 0.06246185302734375, 0.06750106811523438, 0.072540283203125, 0.07757949829101562, 0.08261871337890625, 0.08765792846679688, 0.0926971435546875, 0.09773635864257812, 0.10277557373046875, 0.10781478881835938, 0.11285400390625, 0.11789321899414062, 0.12293243408203125, 0.12797164916992188, 0.1330108642578125, 0.13805007934570312, 0.14308929443359375, 0.14812850952148438, 0.153167724609375, 0.15820693969726562, 0.16324615478515625, 0.16828536987304688, 0.1733245849609375, 0.17836380004882812, 0.18340301513671875, 0.18844223022460938, 0.1934814453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 11.0, 12.0, 36.0, 95.0, 147.0, 159.0, 178.0, 165.0, 92.0, 54.0, 32.0, 14.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3531036376953125, -1.314698338508606, -1.2762930393218994, -1.2378876209259033, -1.1994823217391968, -1.1610770225524902, -1.1226716041564941, -1.0842663049697876, -1.045861005783081, -1.0074557065963745, -0.9690503478050232, -0.9306449890136719, -0.8922396898269653, -0.8538343906402588, -0.8154290318489075, -0.7770236730575562, -0.7386183738708496, -0.7002130746841431, -0.6618077158927917, -0.6234023571014404, -0.5849970579147339, -0.5465917587280273, -0.508186399936676, -0.4697810709476471, -0.43137574195861816, -0.39297041296958923, -0.3545650839805603, -0.31615975499153137, -0.27775442600250244, -0.2393490970134735, -0.20094376802444458, -0.16253843903541565, -0.12413322925567627, -0.08572790026664734, -0.04732257127761841, -0.008917242288589478, 0.029488086700439453, 0.06789341568946838, 0.10629874467849731, 0.14470407366752625, 0.18310940265655518, 0.2215147316455841, 0.25992006063461304, 0.29832538962364197, 0.3367307186126709, 0.37513604760169983, 0.41354137659072876, 0.4519467055797577, 0.4903520345687866, 0.5287573337554932, 0.5671626925468445, 0.6055680513381958, 0.6439733505249023, 0.6823786497116089, 0.7207840085029602, 0.7591893672943115, 0.7975946664810181, 0.8359999656677246, 0.8744053244590759, 0.9128106832504272, 0.9512159824371338, 0.9896212816238403, 1.0280265808105469, 1.066431999206543, 1.1048372983932495]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 4.0, 13.0, 13.0, 22.0, 19.0, 16.0, 26.0, 27.0, 23.0, 34.0, 36.0, 38.0, 41.0, 43.0, 36.0, 43.0, 51.0, 54.0, 36.0, 31.0, 39.0, 38.0, 42.0, 33.0, 37.0, 35.0, 24.0, 36.0, 18.0, 16.0, 7.0, 12.0, 10.0, 7.0, 7.0, 2.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3875146508216858, -0.3749905526638031, -0.362466424703598, -0.34994232654571533, -0.33741819858551025, -0.32489410042762756, -0.3123699724674225, -0.2998458743095398, -0.2873217463493347, -0.274797648191452, -0.26227352023124695, -0.24974940717220306, -0.23722529411315918, -0.2247011959552765, -0.2121770679950714, -0.19965296983718872, -0.18712885677814484, -0.17460474371910095, -0.16208063066005707, -0.14955651760101318, -0.1370324045419693, -0.12450829893350601, -0.11198418587446213, -0.09946007281541824, -0.08693595975637436, -0.07441184669733047, -0.06188773363828659, -0.049363624304533005, -0.03683951124548912, -0.024315401911735535, -0.01179128885269165, 0.0007328242063522339, 0.013256937265396118, 0.025781050324440002, 0.03830516338348389, 0.05082927271723747, 0.06335338950157166, 0.07587749511003494, 0.08840160816907883, 0.10092572122812271, 0.1134498342871666, 0.12597393989562988, 0.13849805295467377, 0.15102216601371765, 0.16354627907276154, 0.17607039213180542, 0.1885945051908493, 0.2011186182498932, 0.21364273130893707, 0.22616684436798096, 0.23869095742702484, 0.2512150704860687, 0.2637391686439514, 0.2762632966041565, 0.2887873947620392, 0.30131152272224426, 0.31383562088012695, 0.32635971903800964, 0.3388838469982147, 0.3514079451560974, 0.3639320731163025, 0.3764561712741852, 0.38898029923439026, 0.40150439739227295, 0.414028525352478]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 18.0, 17.0, 31.0, 47.0, 64.0, 81.0, 121.0, 175.0, 302.0, 532.0, 1100.0, 2935.0, 9496.0, 37285.0, 187766.0, 584412.0, 174376.0, 35357.0, 9104.0, 2810.0, 1088.0, 524.0, 306.0, 193.0, 125.0, 81.0, 65.0, 39.0, 23.0, 16.0, 12.0, 11.0, 9.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.323486328125, -0.310791015625, -0.298095703125, -0.285400390625, -0.272705078125, -0.260009765625, -0.247314453125, -0.234619140625, -0.221923828125, -0.209228515625, -0.196533203125, -0.183837890625, -0.171142578125, -0.158447265625, -0.145751953125, -0.133056640625, -0.120361328125, -0.107666015625, -0.094970703125, -0.082275390625, -0.069580078125, -0.056884765625, -0.044189453125, -0.031494140625, -0.018798828125, -0.006103515625, 0.006591796875, 0.019287109375, 0.031982421875, 0.044677734375, 0.057373046875, 0.070068359375, 0.082763671875, 0.095458984375, 0.108154296875, 0.120849609375, 0.133544921875, 0.146240234375, 0.158935546875, 0.171630859375, 0.184326171875, 0.197021484375, 0.209716796875, 0.222412109375, 0.235107421875, 0.247802734375, 0.260498046875, 0.273193359375, 0.285888671875, 0.298583984375, 0.311279296875, 0.323974609375, 0.336669921875, 0.349365234375, 0.362060546875, 0.374755859375, 0.387451171875, 0.400146484375, 0.412841796875, 0.425537109375, 0.438232421875, 0.450927734375, 0.463623046875, 0.476318359375, 0.489013671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 16.0, 21.0, 26.0, 35.0, 54.0, 92.0, 80.0, 124.0, 109.0, 123.0, 77.0, 78.0, 62.0, 39.0, 23.0, 12.0, 14.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07806396484375, -0.07333660125732422, -0.06860923767089844, -0.06388187408447266, -0.059154510498046875, -0.054427146911621094, -0.04969978332519531, -0.04497241973876953, -0.04024505615234375, -0.03551769256591797, -0.030790328979492188, -0.026062965393066406, -0.021335601806640625, -0.016608238220214844, -0.011880874633789062, -0.007153511047363281, -0.0024261474609375, 0.0023012161254882812, 0.0070285797119140625, 0.011755943298339844, 0.016483306884765625, 0.021210670471191406, 0.025938034057617188, 0.03066539764404297, 0.03539276123046875, 0.04012012481689453, 0.04484748840332031, 0.049574851989746094, 0.054302215576171875, 0.059029579162597656, 0.06375694274902344, 0.06848430633544922, 0.073211669921875, 0.07793903350830078, 0.08266639709472656, 0.08739376068115234, 0.09212112426757812, 0.0968484878540039, 0.10157585144042969, 0.10630321502685547, 0.11103057861328125, 0.11575794219970703, 0.12048530578613281, 0.1252126693725586, 0.12994003295898438, 0.13466739654541016, 0.13939476013183594, 0.14412212371826172, 0.1488494873046875, 0.15357685089111328, 0.15830421447753906, 0.16303157806396484, 0.16775894165039062, 0.1724863052368164, 0.1772136688232422, 0.18194103240966797, 0.18666839599609375, 0.19139575958251953, 0.1961231231689453, 0.2008504867553711, 0.20557785034179688, 0.21030521392822266, 0.21503257751464844, 0.21975994110107422, 0.2244873046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 18.0, 16.0, 19.0, 35.0, 49.0, 80.0, 162.0, 352.0, 1064.0, 3572.0, 14514.0, 67109.0, 354508.0, 479122.0, 99847.0, 20849.0, 5011.0, 1317.0, 412.0, 189.0, 113.0, 66.0, 37.0, 20.0, 13.0, 12.0, 7.0, 8.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353515625, -0.3425102233886719, -0.33150482177734375, -0.3204994201660156, -0.3094940185546875, -0.2984886169433594, -0.28748321533203125, -0.2764778137207031, -0.265472412109375, -0.2544670104980469, -0.24346160888671875, -0.23245620727539062, -0.2214508056640625, -0.21044540405273438, -0.19944000244140625, -0.18843460083007812, -0.17742919921875, -0.16642379760742188, -0.15541839599609375, -0.14441299438476562, -0.1334075927734375, -0.12240219116210938, -0.11139678955078125, -0.10039138793945312, -0.089385986328125, -0.07838058471679688, -0.06737518310546875, -0.056369781494140625, -0.0453643798828125, -0.034358978271484375, -0.02335357666015625, -0.012348175048828125, -0.0013427734375, 0.009662628173828125, 0.02066802978515625, 0.031673431396484375, 0.0426788330078125, 0.053684234619140625, 0.06468963623046875, 0.07569503784179688, 0.086700439453125, 0.09770584106445312, 0.10871124267578125, 0.11971664428710938, 0.1307220458984375, 0.14172744750976562, 0.15273284912109375, 0.16373825073242188, 0.17474365234375, 0.18574905395507812, 0.19675445556640625, 0.20775985717773438, 0.2187652587890625, 0.22977066040039062, 0.24077606201171875, 0.2517814636230469, 0.262786865234375, 0.2737922668457031, 0.28479766845703125, 0.2958030700683594, 0.3068084716796875, 0.3178138732910156, 0.32881927490234375, 0.3398246765136719, 0.350830078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 5.0, 14.0, 10.0, 16.0, 16.0, 21.0, 24.0, 28.0, 33.0, 32.0, 42.0, 66.0, 56.0, 59.0, 57.0, 55.0, 66.0, 46.0, 58.0, 47.0, 40.0, 40.0, 29.0, 32.0, 17.0, 15.0, 12.0, 18.0, 8.0, 9.0, 4.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2120361328125, -0.2046642303466797, -0.19729232788085938, -0.18992042541503906, -0.18254852294921875, -0.17517662048339844, -0.16780471801757812, -0.1604328155517578, -0.1530609130859375, -0.1456890106201172, -0.13831710815429688, -0.13094520568847656, -0.12357330322265625, -0.11620140075683594, -0.10882949829101562, -0.10145759582519531, -0.094085693359375, -0.08671379089355469, -0.07934188842773438, -0.07196998596191406, -0.06459808349609375, -0.05722618103027344, -0.049854278564453125, -0.04248237609863281, -0.0351104736328125, -0.027738571166992188, -0.020366668701171875, -0.012994766235351562, -0.00562286376953125, 0.0017490386962890625, 0.009120941162109375, 0.016492843627929688, 0.02386474609375, 0.031236648559570312, 0.038608551025390625, 0.04598045349121094, 0.05335235595703125, 0.06072425842285156, 0.06809616088867188, 0.07546806335449219, 0.0828399658203125, 0.09021186828613281, 0.09758377075195312, 0.10495567321777344, 0.11232757568359375, 0.11969947814941406, 0.12707138061523438, 0.1344432830810547, 0.141815185546875, 0.1491870880126953, 0.15655899047851562, 0.16393089294433594, 0.17130279541015625, 0.17867469787597656, 0.18604660034179688, 0.1934185028076172, 0.2007904052734375, 0.2081623077392578, 0.21553421020507812, 0.22290611267089844, 0.23027801513671875, 0.23764991760253906, 0.24502182006835938, 0.2523937225341797, 0.259765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 11.0, 16.0, 18.0, 18.0, 30.0, 37.0, 67.0, 96.0, 137.0, 195.0, 373.0, 592.0, 1213.0, 2586.0, 6427.0, 16877.0, 47749.0, 161311.0, 447135.0, 253063.0, 71113.0, 23775.0, 8733.0, 3472.0, 1547.0, 786.0, 423.0, 237.0, 125.0, 111.0, 71.0, 55.0, 43.0, 28.0, 22.0, 9.0, 14.0, 9.0, 4.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.120758056640625, -0.11639404296875, -0.112030029296875, -0.107666015625, -0.103302001953125, -0.09893798828125, -0.094573974609375, -0.0902099609375, -0.085845947265625, -0.08148193359375, -0.077117919921875, -0.07275390625, -0.068389892578125, -0.06402587890625, -0.059661865234375, -0.0552978515625, -0.050933837890625, -0.04656982421875, -0.042205810546875, -0.037841796875, -0.033477783203125, -0.02911376953125, -0.024749755859375, -0.0203857421875, -0.016021728515625, -0.01165771484375, -0.007293701171875, -0.0029296875, 0.001434326171875, 0.00579833984375, 0.010162353515625, 0.0145263671875, 0.018890380859375, 0.02325439453125, 0.027618408203125, 0.031982421875, 0.036346435546875, 0.04071044921875, 0.045074462890625, 0.0494384765625, 0.053802490234375, 0.05816650390625, 0.062530517578125, 0.06689453125, 0.071258544921875, 0.07562255859375, 0.079986572265625, 0.0843505859375, 0.088714599609375, 0.09307861328125, 0.097442626953125, 0.101806640625, 0.106170654296875, 0.11053466796875, 0.114898681640625, 0.1192626953125, 0.123626708984375, 0.12799072265625, 0.132354736328125, 0.13671875, 0.141082763671875, 0.14544677734375, 0.149810791015625, 0.1541748046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 3.0, 5.0, 7.0, 13.0, 9.0, 10.0, 11.0, 12.0, 27.0, 21.0, 42.0, 38.0, 70.0, 89.0, 93.0, 86.0, 72.0, 81.0, 68.0, 34.0, 46.0, 22.0, 21.0, 17.0, 10.0, 15.0, 10.0, 6.0, 11.0, 5.0, 6.0, 5.0, 4.0, 0.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.9729137420654297e-05, -1.9156374037265778e-05, -1.8583610653877258e-05, -1.801084727048874e-05, -1.743808388710022e-05, -1.68653205037117e-05, -1.629255712032318e-05, -1.5719793736934662e-05, -1.5147030353546143e-05, -1.4574266970157623e-05, -1.4001503586769104e-05, -1.3428740203380585e-05, -1.2855976819992065e-05, -1.2283213436603546e-05, -1.1710450053215027e-05, -1.1137686669826508e-05, -1.0564923286437988e-05, -9.992159903049469e-06, -9.41939651966095e-06, -8.84663313627243e-06, -8.273869752883911e-06, -7.701106369495392e-06, -7.1283429861068726e-06, -6.555579602718353e-06, -5.982816219329834e-06, -5.410052835941315e-06, -4.837289452552795e-06, -4.264526069164276e-06, -3.691762685775757e-06, -3.1189993023872375e-06, -2.5462359189987183e-06, -1.973472535610199e-06, -1.4007091522216797e-06, -8.279457688331604e-07, -2.551823854446411e-07, 3.175809979438782e-07, 8.903443813323975e-07, 1.4631077647209167e-06, 2.035871148109436e-06, 2.6086345314979553e-06, 3.1813979148864746e-06, 3.754161298274994e-06, 4.326924681663513e-06, 4.8996880650520325e-06, 5.472451448440552e-06, 6.045214831829071e-06, 6.61797821521759e-06, 7.19074159860611e-06, 7.763504981994629e-06, 8.336268365383148e-06, 8.909031748771667e-06, 9.481795132160187e-06, 1.0054558515548706e-05, 1.0627321898937225e-05, 1.1200085282325745e-05, 1.1772848665714264e-05, 1.2345612049102783e-05, 1.2918375432491302e-05, 1.3491138815879822e-05, 1.4063902199268341e-05, 1.463666558265686e-05, 1.520942896604538e-05, 1.57821923494339e-05, 1.6354955732822418e-05, 1.6927719116210938e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 7.0, 9.0, 20.0, 31.0, 38.0, 61.0, 99.0, 118.0, 187.0, 260.0, 380.0, 624.0, 972.0, 1681.0, 3217.0, 7231.0, 19961.0, 65391.0, 281705.0, 486937.0, 123669.0, 34034.0, 11458.0, 4634.0, 2278.0, 1223.0, 767.0, 522.0, 320.0, 227.0, 131.0, 103.0, 74.0, 54.0, 29.0, 28.0, 22.0, 15.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14013671875, -0.13550186157226562, -0.13086700439453125, -0.12623214721679688, -0.1215972900390625, -0.11696243286132812, -0.11232757568359375, -0.10769271850585938, -0.103057861328125, -0.09842300415039062, -0.09378814697265625, -0.08915328979492188, -0.0845184326171875, -0.07988357543945312, -0.07524871826171875, -0.07061386108398438, -0.06597900390625, -0.061344146728515625, -0.05670928955078125, -0.052074432373046875, -0.0474395751953125, -0.042804718017578125, -0.03816986083984375, -0.033535003662109375, -0.028900146484375, -0.024265289306640625, -0.01963043212890625, -0.014995574951171875, -0.0103607177734375, -0.005725860595703125, -0.00109100341796875, 0.003543853759765625, 0.0081787109375, 0.012813568115234375, 0.01744842529296875, 0.022083282470703125, 0.0267181396484375, 0.031352996826171875, 0.03598785400390625, 0.040622711181640625, 0.045257568359375, 0.049892425537109375, 0.05452728271484375, 0.059162139892578125, 0.0637969970703125, 0.06843185424804688, 0.07306671142578125, 0.07770156860351562, 0.08233642578125, 0.08697128295898438, 0.09160614013671875, 0.09624099731445312, 0.1008758544921875, 0.10551071166992188, 0.11014556884765625, 0.11478042602539062, 0.119415283203125, 0.12405014038085938, 0.12868499755859375, 0.13331985473632812, 0.1379547119140625, 0.14258956909179688, 0.14722442626953125, 0.15185928344726562, 0.156494140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 10.0, 12.0, 18.0, 17.0, 21.0, 36.0, 68.0, 113.0, 137.0, 148.0, 131.0, 83.0, 57.0, 38.0, 27.0, 16.0, 13.0, 6.0, 10.0, 6.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.16699790954589844, -0.16212081909179688, -0.1572437286376953, -0.15236663818359375, -0.1474895477294922, -0.14261245727539062, -0.13773536682128906, -0.1328582763671875, -0.12798118591308594, -0.12310409545898438, -0.11822700500488281, -0.11334991455078125, -0.10847282409667969, -0.10359573364257812, -0.09871864318847656, -0.093841552734375, -0.08896446228027344, -0.08408737182617188, -0.07921028137207031, -0.07433319091796875, -0.06945610046386719, -0.06457901000976562, -0.05970191955566406, -0.0548248291015625, -0.04994773864746094, -0.045070648193359375, -0.04019355773925781, -0.03531646728515625, -0.030439376831054688, -0.025562286376953125, -0.020685195922851562, -0.01580810546875, -0.010931015014648438, -0.006053924560546875, -0.0011768341064453125, 0.00370025634765625, 0.008577346801757812, 0.013454437255859375, 0.018331527709960938, 0.0232086181640625, 0.028085708618164062, 0.032962799072265625, 0.03783988952636719, 0.04271697998046875, 0.04759407043457031, 0.052471160888671875, 0.05734825134277344, 0.062225341796875, 0.06710243225097656, 0.07197952270507812, 0.07685661315917969, 0.08173370361328125, 0.08661079406738281, 0.09148788452148438, 0.09636497497558594, 0.1012420654296875, 0.10611915588378906, 0.11099624633789062, 0.11587333679199219, 0.12075042724609375, 0.1256275177001953, 0.13050460815429688, 0.13538169860839844, 0.1402587890625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 10.0, 16.0, 35.0, 115.0, 228.0, 266.0, 201.0, 91.0, 36.0, 11.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0012428760528564, -0.9278908371925354, -0.8545387983322144, -0.7811867594718933, -0.7078347206115723, -0.6344826817512512, -0.5611306428909302, -0.48777860403060913, -0.4144265651702881, -0.34107452630996704, -0.267722487449646, -0.19437044858932495, -0.1210184097290039, -0.04766637086868286, 0.025685667991638184, 0.09903770685195923, 0.17238974571228027, 0.24574178457260132, 0.31909382343292236, 0.3924458622932434, 0.46579790115356445, 0.5391499400138855, 0.6125019788742065, 0.6858540177345276, 0.7592060565948486, 0.8325580954551697, 0.9059101343154907, 0.9792621731758118, 1.0526142120361328, 1.1259663105010986, 1.199318289756775, 1.2726702690124512, 1.346022367477417, 1.4193744659423828, 1.492726445198059, 1.5660784244537354, 1.6394305229187012, 1.712782621383667, 1.7861346006393433, 1.8594865798950195, 1.9328386783599854, 2.006190776824951, 2.079542636871338, 2.1528947353363037, 2.2262468338012695, 2.2995989322662354, 2.372951030731201, 2.446302890777588, 2.5196549892425537, 2.5930070877075195, 2.6663589477539062, 2.739711046218872, 2.813063144683838, 2.8864152431488037, 2.9597673416137695, 3.0331192016601562, 3.106471300125122, 3.179823398590088, 3.2531752586364746, 3.3265273571014404, 3.3998794555664062, 3.473231554031372, 3.546583652496338, 3.6199355125427246, 3.6932876110076904]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 12.0, 12.0, 11.0, 20.0, 15.0, 24.0, 34.0, 31.0, 30.0, 27.0, 31.0, 45.0, 44.0, 54.0, 55.0, 52.0, 48.0, 60.0, 40.0, 37.0, 43.0, 33.0, 44.0, 31.0, 25.0, 22.0, 17.0, 19.0, 18.0, 15.0, 7.0, 9.0, 6.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.7667695879936218, -0.7454947829246521, -0.7242200374603271, -0.7029452323913574, -0.6816704869270325, -0.6603956818580627, -0.6391209363937378, -0.6178461313247681, -0.5965713262557983, -0.5752965211868286, -0.5540217757225037, -0.5327469706535339, -0.511472225189209, -0.49019742012023926, -0.4689226448535919, -0.4476478695869446, -0.42637309432029724, -0.4050983190536499, -0.38382354378700256, -0.3625487685203552, -0.3412739634513855, -0.31999918818473816, -0.2987244129180908, -0.2774496078491211, -0.25617486238479614, -0.2349000871181488, -0.21362529695034027, -0.19235052168369293, -0.1710757315158844, -0.14980095624923706, -0.12852618098258972, -0.10725139081478119, -0.08597660064697266, -0.06470181792974472, -0.04342703893780708, -0.022152259945869446, -0.00087747722864151, 0.020397305488586426, 0.041672080755233765, 0.0629468709230423, 0.08422164618968964, 0.10549642890691757, 0.1267712116241455, 0.14804598689079285, 0.16932076215744019, 0.19059555232524872, 0.21187032759189606, 0.2331451177597046, 0.25441989302635193, 0.27569466829299927, 0.2969694435596466, 0.31824421882629395, 0.33951902389526367, 0.360793799161911, 0.38206857442855835, 0.4033433794975281, 0.424618124961853, 0.44589290022850037, 0.4671676754951477, 0.48844248056411743, 0.5097172260284424, 0.5309920310974121, 0.5522668361663818, 0.5735415816307068, 0.5948163866996765]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 1.0, 12.0, 24.0, 45.0, 51.0, 127.0, 208.0, 376.0, 729.0, 1641.0, 3868.0, 10735.0, 39055.0, 222414.0, 2646245.0, 1133116.0, 101522.0, 21450.0, 6666.0, 2760.0, 1281.0, 686.0, 427.0, 268.0, 185.0, 97.0, 97.0, 39.0, 40.0, 24.0, 22.0, 20.0, 11.0, 6.0, 7.0, 5.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.14850997924804688, -0.14101409912109375, -0.13351821899414062, -0.1260223388671875, -0.11852645874023438, -0.11103057861328125, -0.10353469848632812, -0.096038818359375, -0.08854293823242188, -0.08104705810546875, -0.07355117797851562, -0.0660552978515625, -0.058559417724609375, -0.05106353759765625, -0.043567657470703125, -0.03607177734375, -0.028575897216796875, -0.02108001708984375, -0.013584136962890625, -0.0060882568359375, 0.001407623291015625, 0.00890350341796875, 0.016399383544921875, 0.023895263671875, 0.031391143798828125, 0.03888702392578125, 0.046382904052734375, 0.0538787841796875, 0.061374664306640625, 0.06887054443359375, 0.07636642456054688, 0.0838623046875, 0.09135818481445312, 0.09885406494140625, 0.10634994506835938, 0.1138458251953125, 0.12134170532226562, 0.12883758544921875, 0.13633346557617188, 0.143829345703125, 0.15132522583007812, 0.15882110595703125, 0.16631698608398438, 0.1738128662109375, 0.18130874633789062, 0.18880462646484375, 0.19630050659179688, 0.20379638671875, 0.21129226684570312, 0.21878814697265625, 0.22628402709960938, 0.2337799072265625, 0.24127578735351562, 0.24877166748046875, 0.2562675476074219, 0.263763427734375, 0.2712593078613281, 0.27875518798828125, 0.2862510681152344, 0.2937469482421875, 0.3012428283691406, 0.30873870849609375, 0.3162345886230469, 0.32373046875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 13.0, 14.0, 21.0, 32.0, 48.0, 67.0, 84.0, 96.0, 117.0, 113.0, 105.0, 83.0, 58.0, 61.0, 36.0, 20.0, 15.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0888671875, -0.0839691162109375, -0.079071044921875, -0.0741729736328125, -0.06927490234375, -0.0643768310546875, -0.059478759765625, -0.0545806884765625, -0.0496826171875, -0.0447845458984375, -0.039886474609375, -0.0349884033203125, -0.03009033203125, -0.0251922607421875, -0.020294189453125, -0.0153961181640625, -0.010498046875, -0.0055999755859375, -0.000701904296875, 0.0041961669921875, 0.00909423828125, 0.0139923095703125, 0.018890380859375, 0.0237884521484375, 0.0286865234375, 0.0335845947265625, 0.038482666015625, 0.0433807373046875, 0.04827880859375, 0.0531768798828125, 0.058074951171875, 0.0629730224609375, 0.06787109375, 0.0727691650390625, 0.077667236328125, 0.0825653076171875, 0.08746337890625, 0.0923614501953125, 0.097259521484375, 0.1021575927734375, 0.1070556640625, 0.1119537353515625, 0.116851806640625, 0.1217498779296875, 0.12664794921875, 0.1315460205078125, 0.136444091796875, 0.1413421630859375, 0.146240234375, 0.1511383056640625, 0.156036376953125, 0.1609344482421875, 0.16583251953125, 0.1707305908203125, 0.175628662109375, 0.1805267333984375, 0.1854248046875, 0.1903228759765625, 0.195220947265625, 0.2001190185546875, 0.20501708984375, 0.2099151611328125, 0.214813232421875, 0.2197113037109375, 0.224609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 1.0, 7.0, 1.0, 3.0, 5.0, 8.0, 6.0, 5.0, 22.0, 15.0, 27.0, 39.0, 63.0, 77.0, 118.0, 158.0, 234.0, 407.0, 645.0, 1318.0, 2704.0, 6310.0, 17226.0, 59667.0, 284307.0, 1894939.0, 1605942.0, 240574.0, 52920.0, 15308.0, 5845.0, 2434.0, 1181.0, 655.0, 349.0, 235.0, 166.0, 95.0, 66.0, 48.0, 47.0, 29.0, 13.0, 17.0, 8.0, 7.0, 13.0, 10.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19504547119140625, -0.1883087158203125, -0.18157196044921875, -0.174835205078125, -0.16809844970703125, -0.1613616943359375, -0.15462493896484375, -0.14788818359375, -0.14115142822265625, -0.1344146728515625, -0.12767791748046875, -0.120941162109375, -0.11420440673828125, -0.1074676513671875, -0.10073089599609375, -0.093994140625, -0.08725738525390625, -0.0805206298828125, -0.07378387451171875, -0.067047119140625, -0.06031036376953125, -0.0535736083984375, -0.04683685302734375, -0.04010009765625, -0.03336334228515625, -0.0266265869140625, -0.01988983154296875, -0.013153076171875, -0.00641632080078125, 0.0003204345703125, 0.00705718994140625, 0.0137939453125, 0.02053070068359375, 0.0272674560546875, 0.03400421142578125, 0.040740966796875, 0.04747772216796875, 0.0542144775390625, 0.06095123291015625, 0.06768798828125, 0.07442474365234375, 0.0811614990234375, 0.08789825439453125, 0.094635009765625, 0.10137176513671875, 0.1081085205078125, 0.11484527587890625, 0.12158203125, 0.12831878662109375, 0.1350555419921875, 0.14179229736328125, 0.148529052734375, 0.15526580810546875, 0.1620025634765625, 0.16873931884765625, 0.17547607421875, 0.18221282958984375, 0.1889495849609375, 0.19568634033203125, 0.202423095703125, 0.20915985107421875, 0.2158966064453125, 0.22263336181640625, 0.2293701171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 5.0, 6.0, 23.0, 11.0, 22.0, 17.0, 42.0, 39.0, 62.0, 84.0, 126.0, 188.0, 277.0, 380.0, 522.0, 622.0, 473.0, 344.0, 253.0, 157.0, 126.0, 84.0, 57.0, 39.0, 24.0, 21.0, 20.0, 19.0, 6.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.170166015625, -0.165069580078125, -0.15997314453125, -0.154876708984375, -0.1497802734375, -0.144683837890625, -0.13958740234375, -0.134490966796875, -0.12939453125, -0.124298095703125, -0.11920166015625, -0.114105224609375, -0.1090087890625, -0.103912353515625, -0.09881591796875, -0.093719482421875, -0.088623046875, -0.083526611328125, -0.07843017578125, -0.073333740234375, -0.0682373046875, -0.063140869140625, -0.05804443359375, -0.052947998046875, -0.0478515625, -0.042755126953125, -0.03765869140625, -0.032562255859375, -0.0274658203125, -0.022369384765625, -0.01727294921875, -0.012176513671875, -0.007080078125, -0.001983642578125, 0.00311279296875, 0.008209228515625, 0.0133056640625, 0.018402099609375, 0.02349853515625, 0.028594970703125, 0.03369140625, 0.038787841796875, 0.04388427734375, 0.048980712890625, 0.0540771484375, 0.059173583984375, 0.06427001953125, 0.069366455078125, 0.074462890625, 0.079559326171875, 0.08465576171875, 0.089752197265625, 0.0948486328125, 0.099945068359375, 0.10504150390625, 0.110137939453125, 0.115234375, 0.120330810546875, 0.12542724609375, 0.130523681640625, 0.1356201171875, 0.140716552734375, 0.14581298828125, 0.150909423828125, 0.156005859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 8.0, 10.0, 12.0, 25.0, 31.0, 59.0, 85.0, 89.0, 92.0, 127.0, 99.0, 95.0, 83.0, 60.0, 38.0, 32.0, 17.0, 12.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.477787733078003, -1.4458448886871338, -1.413901925086975, -1.3819589614868164, -1.3500161170959473, -1.3180732727050781, -1.2861303091049194, -1.2541873455047607, -1.2222445011138916, -1.1903016567230225, -1.1583586931228638, -1.126415729522705, -1.094472885131836, -1.0625300407409668, -1.030587077140808, -0.9986441731452942, -0.9667012691497803, -0.9347583651542664, -0.9028154611587524, -0.8708725571632385, -0.8389296531677246, -0.8069867491722107, -0.7750438451766968, -0.7431009411811829, -0.711158037185669, -0.679215133190155, -0.6472722291946411, -0.6153293251991272, -0.5833864212036133, -0.5514435172080994, -0.5195006132125854, -0.48755770921707153, -0.4556148052215576, -0.4236719012260437, -0.3917289972305298, -0.35978609323501587, -0.32784318923950195, -0.29590028524398804, -0.2639573812484741, -0.2320144772529602, -0.2000715732574463, -0.16812866926193237, -0.13618576526641846, -0.10424286127090454, -0.07229995727539062, -0.04035705327987671, -0.008414149284362793, 0.023528754711151123, 0.05547165870666504, 0.08741456270217896, 0.11935746669769287, 0.1513003706932068, 0.1832432746887207, 0.21518617868423462, 0.24712908267974854, 0.27907198667526245, 0.31101489067077637, 0.3429577946662903, 0.3749006986618042, 0.4068436026573181, 0.43878650665283203, 0.47072941064834595, 0.5026723146438599, 0.5346152186393738, 0.5665581226348877]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 7.0, 13.0, 19.0, 12.0, 18.0, 26.0, 30.0, 22.0, 34.0, 36.0, 33.0, 47.0, 40.0, 40.0, 53.0, 49.0, 63.0, 47.0, 47.0, 39.0, 36.0, 39.0, 35.0, 26.0, 36.0, 23.0, 34.0, 17.0, 8.0, 14.0, 15.0, 5.0, 3.0, 5.0, 5.0, 2.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6266806721687317, -0.6093015074729919, -0.5919223427772522, -0.5745431780815125, -0.5571639537811279, -0.5397847890853882, -0.5224056243896484, -0.5050264596939087, -0.48764729499816895, -0.4702681303024292, -0.45288896560668945, -0.4355097711086273, -0.4181306064128876, -0.4007514417171478, -0.3833722472190857, -0.36599308252334595, -0.3486139178276062, -0.33123475313186646, -0.3138555884361267, -0.2964763939380646, -0.27909722924232483, -0.2617180645465851, -0.24433888494968414, -0.2269597053527832, -0.20958054065704346, -0.1922013759613037, -0.17482219636440277, -0.15744301676750183, -0.14006385207176208, -0.12268467992544174, -0.1053055077791214, -0.08792633563280106, -0.07054710388183594, -0.053167931735515594, -0.03578875958919525, -0.01840958744287491, -0.0010304152965545654, 0.016348756849765778, 0.03372792899608612, 0.051107101142406464, 0.0684862732887268, 0.08586544543504715, 0.10324461758136749, 0.12062378972768784, 0.13800296187400818, 0.15538212656974792, 0.17276130616664886, 0.1901404857635498, 0.20751965045928955, 0.2248988151550293, 0.24227799475193024, 0.2596571743488312, 0.2770363390445709, 0.29441550374031067, 0.3117946982383728, 0.32917386293411255, 0.3465530276298523, 0.36393219232559204, 0.3813113570213318, 0.3986905515193939, 0.41606971621513367, 0.4334488809108734, 0.45082807540893555, 0.4682072401046753, 0.48558640480041504]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 6.0, 15.0, 16.0, 20.0, 36.0, 46.0, 67.0, 93.0, 151.0, 194.0, 317.0, 535.0, 1015.0, 2273.0, 5937.0, 16227.0, 48374.0, 152245.0, 395893.0, 286074.0, 91508.0, 29600.0, 10419.0, 3914.0, 1627.0, 728.0, 420.0, 253.0, 173.0, 95.0, 91.0, 57.0, 37.0, 26.0, 25.0, 13.0, 8.0, 3.0, 4.0, 5.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.39990234375, -0.38840484619140625, -0.3769073486328125, -0.36540985107421875, -0.353912353515625, -0.34241485595703125, -0.3309173583984375, -0.31941986083984375, -0.30792236328125, -0.29642486572265625, -0.2849273681640625, -0.27342987060546875, -0.261932373046875, -0.25043487548828125, -0.2389373779296875, -0.22743988037109375, -0.2159423828125, -0.20444488525390625, -0.1929473876953125, -0.18144989013671875, -0.169952392578125, -0.15845489501953125, -0.1469573974609375, -0.13545989990234375, -0.12396240234375, -0.11246490478515625, -0.1009674072265625, -0.08946990966796875, -0.077972412109375, -0.06647491455078125, -0.0549774169921875, -0.04347991943359375, -0.031982421875, -0.02048492431640625, -0.0089874267578125, 0.00251007080078125, 0.014007568359375, 0.02550506591796875, 0.0370025634765625, 0.04850006103515625, 0.05999755859375, 0.07149505615234375, 0.0829925537109375, 0.09449005126953125, 0.105987548828125, 0.11748504638671875, 0.1289825439453125, 0.14048004150390625, 0.1519775390625, 0.16347503662109375, 0.1749725341796875, 0.18647003173828125, 0.197967529296875, 0.20946502685546875, 0.2209625244140625, 0.23246002197265625, 0.24395751953125, 0.25545501708984375, 0.2669525146484375, 0.27845001220703125, 0.289947509765625, 0.30144500732421875, 0.3129425048828125, 0.32444000244140625, 0.3359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 17.0, 10.0, 20.0, 26.0, 39.0, 62.0, 77.0, 99.0, 98.0, 116.0, 93.0, 97.0, 68.0, 59.0, 47.0, 23.0, 25.0, 12.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07525634765625, -0.07040882110595703, -0.06556129455566406, -0.060713768005371094, -0.055866241455078125, -0.051018714904785156, -0.04617118835449219, -0.04132366180419922, -0.03647613525390625, -0.03162860870361328, -0.026781082153320312, -0.021933555603027344, -0.017086029052734375, -0.012238502502441406, -0.0073909759521484375, -0.0025434494018554688, 0.0023040771484375, 0.007151603698730469, 0.011999130249023438, 0.016846656799316406, 0.021694183349609375, 0.026541709899902344, 0.03138923645019531, 0.03623676300048828, 0.04108428955078125, 0.04593181610107422, 0.05077934265136719, 0.055626869201660156, 0.060474395751953125, 0.0653219223022461, 0.07016944885253906, 0.07501697540283203, 0.079864501953125, 0.08471202850341797, 0.08955955505371094, 0.0944070816040039, 0.09925460815429688, 0.10410213470458984, 0.10894966125488281, 0.11379718780517578, 0.11864471435546875, 0.12349224090576172, 0.1283397674560547, 0.13318729400634766, 0.13803482055664062, 0.1428823471069336, 0.14772987365722656, 0.15257740020751953, 0.1574249267578125, 0.16227245330810547, 0.16711997985839844, 0.1719675064086914, 0.17681503295898438, 0.18166255950927734, 0.1865100860595703, 0.19135761260986328, 0.19620513916015625, 0.20105266571044922, 0.2059001922607422, 0.21074771881103516, 0.21559524536132812, 0.2204427719116211, 0.22529029846191406, 0.23013782501220703, 0.2349853515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 8.0, 12.0, 32.0, 24.0, 64.0, 90.0, 144.0, 248.0, 417.0, 717.0, 1389.0, 2618.0, 4926.0, 10170.0, 20516.0, 44229.0, 102651.0, 230448.0, 306853.0, 179604.0, 76974.0, 33758.0, 15916.0, 7995.0, 4059.0, 2088.0, 1101.0, 611.0, 350.0, 200.0, 112.0, 75.0, 53.0, 43.0, 29.0, 6.0, 7.0, 9.0, 1.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1766357421875, -0.16872596740722656, -0.16081619262695312, -0.1529064178466797, -0.14499664306640625, -0.1370868682861328, -0.12917709350585938, -0.12126731872558594, -0.1133575439453125, -0.10544776916503906, -0.09753799438476562, -0.08962821960449219, -0.08171844482421875, -0.07380867004394531, -0.06589889526367188, -0.05798912048339844, -0.050079345703125, -0.04216957092285156, -0.034259796142578125, -0.026350021362304688, -0.01844024658203125, -0.010530471801757812, -0.002620697021484375, 0.0052890777587890625, 0.0131988525390625, 0.021108627319335938, 0.029018402099609375, 0.03692817687988281, 0.04483795166015625, 0.05274772644042969, 0.060657501220703125, 0.06856727600097656, 0.07647705078125, 0.08438682556152344, 0.09229660034179688, 0.10020637512207031, 0.10811614990234375, 0.11602592468261719, 0.12393569946289062, 0.13184547424316406, 0.1397552490234375, 0.14766502380371094, 0.15557479858398438, 0.1634845733642578, 0.17139434814453125, 0.1793041229248047, 0.18721389770507812, 0.19512367248535156, 0.203033447265625, 0.21094322204589844, 0.21885299682617188, 0.2267627716064453, 0.23467254638671875, 0.2425823211669922, 0.2504920959472656, 0.25840187072753906, 0.2663116455078125, 0.27422142028808594, 0.2821311950683594, 0.2900409698486328, 0.29795074462890625, 0.3058605194091797, 0.3137702941894531, 0.32168006896972656, 0.32958984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 7.0, 6.0, 5.0, 11.0, 16.0, 14.0, 14.0, 21.0, 18.0, 22.0, 21.0, 31.0, 39.0, 33.0, 45.0, 58.0, 52.0, 34.0, 44.0, 36.0, 56.0, 49.0, 47.0, 44.0, 37.0, 31.0, 34.0, 30.0, 19.0, 27.0, 25.0, 19.0, 13.0, 5.0, 7.0, 5.0, 3.0, 10.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.272705078125, -0.2643585205078125, -0.256011962890625, -0.2476654052734375, -0.23931884765625, -0.2309722900390625, -0.222625732421875, -0.2142791748046875, -0.2059326171875, -0.1975860595703125, -0.189239501953125, -0.1808929443359375, -0.17254638671875, -0.1641998291015625, -0.155853271484375, -0.1475067138671875, -0.13916015625, -0.1308135986328125, -0.122467041015625, -0.1141204833984375, -0.10577392578125, -0.0974273681640625, -0.089080810546875, -0.0807342529296875, -0.0723876953125, -0.0640411376953125, -0.055694580078125, -0.0473480224609375, -0.03900146484375, -0.0306549072265625, -0.022308349609375, -0.0139617919921875, -0.005615234375, 0.0027313232421875, 0.011077880859375, 0.0194244384765625, 0.02777099609375, 0.0361175537109375, 0.044464111328125, 0.0528106689453125, 0.0611572265625, 0.0695037841796875, 0.077850341796875, 0.0861968994140625, 0.09454345703125, 0.1028900146484375, 0.111236572265625, 0.1195831298828125, 0.1279296875, 0.1362762451171875, 0.144622802734375, 0.1529693603515625, 0.16131591796875, 0.1696624755859375, 0.178009033203125, 0.1863555908203125, 0.1947021484375, 0.2030487060546875, 0.211395263671875, 0.2197418212890625, 0.22808837890625, 0.2364349365234375, 0.244781494140625, 0.2531280517578125, 0.261474609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 18.0, 27.0, 33.0, 52.0, 76.0, 125.0, 186.0, 281.0, 427.0, 714.0, 1205.0, 2161.0, 3797.0, 7985.0, 16835.0, 37662.0, 92408.0, 235600.0, 346722.0, 176920.0, 69284.0, 28971.0, 12998.0, 6289.0, 3279.0, 1731.0, 1065.0, 594.0, 390.0, 249.0, 165.0, 96.0, 65.0, 40.0, 25.0, 28.0, 9.0, 5.0, 12.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.1491374969482422, -0.14422225952148438, -0.13930702209472656, -0.13439178466796875, -0.12947654724121094, -0.12456130981445312, -0.11964607238769531, -0.1147308349609375, -0.10981559753417969, -0.10490036010742188, -0.09998512268066406, -0.09506988525390625, -0.09015464782714844, -0.08523941040039062, -0.08032417297363281, -0.075408935546875, -0.07049369812011719, -0.06557846069335938, -0.06066322326660156, -0.05574798583984375, -0.05083274841308594, -0.045917510986328125, -0.04100227355957031, -0.0360870361328125, -0.031171798706054688, -0.026256561279296875, -0.021341323852539062, -0.01642608642578125, -0.011510848999023438, -0.006595611572265625, -0.0016803741455078125, 0.00323486328125, 0.008150100708007812, 0.013065338134765625, 0.017980575561523438, 0.02289581298828125, 0.027811050415039062, 0.032726287841796875, 0.03764152526855469, 0.0425567626953125, 0.04747200012207031, 0.052387237548828125, 0.05730247497558594, 0.06221771240234375, 0.06713294982910156, 0.07204818725585938, 0.07696342468261719, 0.081878662109375, 0.08679389953613281, 0.09170913696289062, 0.09662437438964844, 0.10153961181640625, 0.10645484924316406, 0.11137008666992188, 0.11628532409667969, 0.1212005615234375, 0.1261157989501953, 0.13103103637695312, 0.13594627380371094, 0.14086151123046875, 0.14577674865722656, 0.15069198608398438, 0.1556072235107422, 0.1605224609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 5.0, 8.0, 6.0, 16.0, 16.0, 28.0, 33.0, 33.0, 51.0, 66.0, 121.0, 120.0, 113.0, 84.0, 80.0, 48.0, 39.0, 26.0, 25.0, 17.0, 15.0, 12.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1113624572753906e-05, -2.995505928993225e-05, -2.8796494007110596e-05, -2.763792872428894e-05, -2.6479363441467285e-05, -2.532079815864563e-05, -2.4162232875823975e-05, -2.300366759300232e-05, -2.1845102310180664e-05, -2.068653702735901e-05, -1.9527971744537354e-05, -1.8369406461715698e-05, -1.7210841178894043e-05, -1.6052275896072388e-05, -1.4893710613250732e-05, -1.3735145330429077e-05, -1.2576580047607422e-05, -1.1418014764785767e-05, -1.0259449481964111e-05, -9.100884199142456e-06, -7.9423189163208e-06, -6.7837536334991455e-06, -5.62518835067749e-06, -4.466623067855835e-06, -3.3080577850341797e-06, -2.1494925022125244e-06, -9.909272193908691e-07, 1.6763806343078613e-07, 1.3262033462524414e-06, 2.4847686290740967e-06, 3.643333911895752e-06, 4.801899194717407e-06, 5.9604644775390625e-06, 7.119029760360718e-06, 8.277595043182373e-06, 9.436160326004028e-06, 1.0594725608825684e-05, 1.1753290891647339e-05, 1.2911856174468994e-05, 1.407042145729065e-05, 1.5228986740112305e-05, 1.638755202293396e-05, 1.7546117305755615e-05, 1.870468258857727e-05, 1.9863247871398926e-05, 2.102181315422058e-05, 2.2180378437042236e-05, 2.333894371986389e-05, 2.4497509002685547e-05, 2.5656074285507202e-05, 2.6814639568328857e-05, 2.7973204851150513e-05, 2.9131770133972168e-05, 3.0290335416793823e-05, 3.144890069961548e-05, 3.2607465982437134e-05, 3.376603126525879e-05, 3.4924596548080444e-05, 3.60831618309021e-05, 3.7241727113723755e-05, 3.840029239654541e-05, 3.9558857679367065e-05, 4.071742296218872e-05, 4.1875988245010376e-05, 4.303455352783203e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 20.0, 18.0, 33.0, 36.0, 31.0, 89.0, 132.0, 207.0, 326.0, 552.0, 858.0, 1526.0, 2687.0, 4900.0, 9296.0, 18876.0, 41554.0, 99459.0, 246506.0, 335824.0, 162573.0, 65379.0, 28522.0, 13536.0, 6911.0, 3579.0, 2033.0, 1116.0, 775.0, 412.0, 272.0, 167.0, 113.0, 85.0, 45.0, 25.0, 20.0, 18.0, 13.0, 4.0, 5.0, 6.0, 1.0, 4.0], "bins": [-0.1884765625, -0.18367671966552734, -0.1788768768310547, -0.17407703399658203, -0.16927719116210938, -0.16447734832763672, -0.15967750549316406, -0.1548776626586914, -0.15007781982421875, -0.1452779769897461, -0.14047813415527344, -0.13567829132080078, -0.13087844848632812, -0.12607860565185547, -0.12127876281738281, -0.11647891998291016, -0.1116790771484375, -0.10687923431396484, -0.10207939147949219, -0.09727954864501953, -0.09247970581054688, -0.08767986297607422, -0.08288002014160156, -0.0780801773071289, -0.07328033447265625, -0.0684804916381836, -0.06368064880371094, -0.05888080596923828, -0.054080963134765625, -0.04928112030029297, -0.04448127746582031, -0.039681434631347656, -0.034881591796875, -0.030081748962402344, -0.025281906127929688, -0.02048206329345703, -0.015682220458984375, -0.010882377624511719, -0.0060825347900390625, -0.0012826919555664062, 0.00351715087890625, 0.008316993713378906, 0.013116836547851562, 0.01791667938232422, 0.022716522216796875, 0.02751636505126953, 0.03231620788574219, 0.037116050720214844, 0.0419158935546875, 0.046715736389160156, 0.05151557922363281, 0.05631542205810547, 0.061115264892578125, 0.06591510772705078, 0.07071495056152344, 0.0755147933959961, 0.08031463623046875, 0.0851144790649414, 0.08991432189941406, 0.09471416473388672, 0.09951400756835938, 0.10431385040283203, 0.10911369323730469, 0.11391353607177734, 0.11871337890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 3.0, 3.0, 5.0, 7.0, 14.0, 15.0, 18.0, 22.0, 23.0, 32.0, 29.0, 32.0, 61.0, 55.0, 60.0, 59.0, 81.0, 79.0, 60.0, 63.0, 43.0, 44.0, 35.0, 38.0, 17.0, 14.0, 21.0, 17.0, 8.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.1434326171875, -0.13944625854492188, -0.13545989990234375, -0.13147354125976562, -0.1274871826171875, -0.12350082397460938, -0.11951446533203125, -0.11552810668945312, -0.111541748046875, -0.10755538940429688, -0.10356903076171875, -0.09958267211914062, -0.0955963134765625, -0.09160995483398438, -0.08762359619140625, -0.08363723754882812, -0.07965087890625, -0.07566452026367188, -0.07167816162109375, -0.06769180297851562, -0.0637054443359375, -0.059719085693359375, -0.05573272705078125, -0.051746368408203125, -0.047760009765625, -0.043773651123046875, -0.03978729248046875, -0.035800933837890625, -0.0318145751953125, -0.027828216552734375, -0.02384185791015625, -0.019855499267578125, -0.015869140625, -0.011882781982421875, -0.00789642333984375, -0.003910064697265625, 7.62939453125e-05, 0.004062652587890625, 0.00804901123046875, 0.012035369873046875, 0.016021728515625, 0.020008087158203125, 0.02399444580078125, 0.027980804443359375, 0.0319671630859375, 0.035953521728515625, 0.03993988037109375, 0.043926239013671875, 0.04791259765625, 0.051898956298828125, 0.05588531494140625, 0.059871673583984375, 0.0638580322265625, 0.06784439086914062, 0.07183074951171875, 0.07581710815429688, 0.079803466796875, 0.08378982543945312, 0.08777618408203125, 0.09176254272460938, 0.0957489013671875, 0.09973526000976562, 0.10372161865234375, 0.10770797729492188, 0.1116943359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 13.0, 23.0, 40.0, 61.0, 95.0, 109.0, 140.0, 127.0, 114.0, 95.0, 76.0, 57.0, 21.0, 18.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.9995193481445312, -2.9411139488220215, -2.8827085494995117, -2.824303150177002, -2.765897750854492, -2.7074923515319824, -2.6490869522094727, -2.590681552886963, -2.532276153564453, -2.4738707542419434, -2.4154653549194336, -2.357059955596924, -2.298654556274414, -2.2402491569519043, -2.1818437576293945, -2.1234383583068848, -2.065032958984375, -2.0066275596618652, -1.9482221603393555, -1.8898167610168457, -1.831411361694336, -1.7730059623718262, -1.7146005630493164, -1.6561951637268066, -1.597790002822876, -1.5393846035003662, -1.4809792041778564, -1.4225738048553467, -1.364168405532837, -1.3057630062103271, -1.2473576068878174, -1.1889522075653076, -1.1305468082427979, -1.072141408920288, -1.0137360095977783, -0.9553306102752686, -0.8969252109527588, -0.838519811630249, -0.780114471912384, -0.7217090725898743, -0.6633037328720093, -0.6048983335494995, -0.5464929342269897, -0.48808756470680237, -0.4296821653842926, -0.37127676606178284, -0.31287139654159546, -0.2544659972190857, -0.19606059789657593, -0.13765519857406616, -0.07924981415271759, -0.02084442973136902, 0.03756096959114075, 0.09596636891365051, 0.1543717384338379, 0.21277713775634766, 0.2711825370788574, 0.3295879364013672, 0.38799333572387695, 0.44639870524406433, 0.5048041343688965, 0.5632095336914062, 0.6216148734092712, 0.680020272731781, 0.7384256720542908]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 11.0, 7.0, 10.0, 19.0, 11.0, 15.0, 30.0, 24.0, 34.0, 36.0, 34.0, 36.0, 34.0, 37.0, 37.0, 41.0, 41.0, 49.0, 46.0, 50.0, 44.0, 27.0, 36.0, 31.0, 31.0, 26.0, 25.0, 24.0, 19.0, 25.0, 13.0, 9.0, 12.0, 14.0, 9.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.6818969249725342, -0.6597164869308472, -0.6375360488891602, -0.6153556108474731, -0.5931751728057861, -0.5709947943687439, -0.5488143563270569, -0.5266339182853699, -0.5044534802436829, -0.48227304220199585, -0.46009260416030884, -0.4379121959209442, -0.4157317578792572, -0.3935513198375702, -0.37137091159820557, -0.34919047355651855, -0.32701003551483154, -0.30482959747314453, -0.2826491594314575, -0.2604687511920929, -0.23828831315040588, -0.21610787510871887, -0.19392745196819305, -0.17174702882766724, -0.14956659078598022, -0.1273861527442932, -0.1052057296037674, -0.08302529901266098, -0.060844868421554565, -0.03866443783044815, -0.016484007239341736, 0.005696415901184082, 0.02787691354751587, 0.050057344138622284, 0.0722377747297287, 0.09441820532083511, 0.11659863591194153, 0.13877907395362854, 0.16095949709415436, 0.18313992023468018, 0.2053203582763672, 0.2275007963180542, 0.24968121945858002, 0.27186164259910583, 0.29404208064079285, 0.31622251868247986, 0.3384029269218445, 0.3605833649635315, 0.3827638030052185, 0.4049442410469055, 0.42712467908859253, 0.44930508732795715, 0.47148552536964417, 0.4936659634113312, 0.5158463716506958, 0.5380268096923828, 0.5602072477340698, 0.5823876857757568, 0.6045681238174438, 0.6267485618591309, 0.6489289999008179, 0.6711093783378601, 0.6932898163795471, 0.7154702544212341, 0.7376506924629211]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 12.0, 16.0, 26.0, 40.0, 60.0, 87.0, 194.0, 350.0, 719.0, 1594.0, 4627.0, 16409.0, 78429.0, 670018.0, 3036253.0, 322869.0, 45578.0, 10587.0, 3465.0, 1366.0, 627.0, 367.0, 217.0, 132.0, 94.0, 44.0, 30.0, 31.0, 14.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.257568359375, -0.24779510498046875, -0.2380218505859375, -0.22824859619140625, -0.218475341796875, -0.20870208740234375, -0.1989288330078125, -0.18915557861328125, -0.17938232421875, -0.16960906982421875, -0.1598358154296875, -0.15006256103515625, -0.140289306640625, -0.13051605224609375, -0.1207427978515625, -0.11096954345703125, -0.1011962890625, -0.09142303466796875, -0.0816497802734375, -0.07187652587890625, -0.062103271484375, -0.05233001708984375, -0.0425567626953125, -0.03278350830078125, -0.02301025390625, -0.01323699951171875, -0.0034637451171875, 0.00630950927734375, 0.016082763671875, 0.02585601806640625, 0.0356292724609375, 0.04540252685546875, 0.05517578125, 0.06494903564453125, 0.0747222900390625, 0.08449554443359375, 0.094268798828125, 0.10404205322265625, 0.1138153076171875, 0.12358856201171875, 0.13336181640625, 0.14313507080078125, 0.1529083251953125, 0.16268157958984375, 0.172454833984375, 0.18222808837890625, 0.1920013427734375, 0.20177459716796875, 0.2115478515625, 0.22132110595703125, 0.2310943603515625, 0.24086761474609375, 0.250640869140625, 0.26041412353515625, 0.2701873779296875, 0.27996063232421875, 0.28973388671875, 0.29950714111328125, 0.3092803955078125, 0.31905364990234375, 0.328826904296875, 0.33860015869140625, 0.3483734130859375, 0.35814666748046875, 0.367919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 18.0, 15.0, 22.0, 35.0, 43.0, 47.0, 70.0, 65.0, 84.0, 98.0, 95.0, 84.0, 78.0, 57.0, 50.0, 48.0, 34.0, 20.0, 17.0, 12.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08575439453125, -0.08075237274169922, -0.07575035095214844, -0.07074832916259766, -0.06574630737304688, -0.060744285583496094, -0.05574226379394531, -0.05074024200439453, -0.04573822021484375, -0.04073619842529297, -0.03573417663574219, -0.030732154846191406, -0.025730133056640625, -0.020728111267089844, -0.015726089477539062, -0.010724067687988281, -0.0057220458984375, -0.0007200241088867188, 0.0042819976806640625, 0.009284019470214844, 0.014286041259765625, 0.019288063049316406, 0.024290084838867188, 0.02929210662841797, 0.03429412841796875, 0.03929615020751953, 0.04429817199707031, 0.049300193786621094, 0.054302215576171875, 0.059304237365722656, 0.06430625915527344, 0.06930828094482422, 0.074310302734375, 0.07931232452392578, 0.08431434631347656, 0.08931636810302734, 0.09431838989257812, 0.0993204116821289, 0.10432243347167969, 0.10932445526123047, 0.11432647705078125, 0.11932849884033203, 0.12433052062988281, 0.1293325424194336, 0.13433456420898438, 0.13933658599853516, 0.14433860778808594, 0.14934062957763672, 0.1543426513671875, 0.15934467315673828, 0.16434669494628906, 0.16934871673583984, 0.17435073852539062, 0.1793527603149414, 0.1843547821044922, 0.18935680389404297, 0.19435882568359375, 0.19936084747314453, 0.2043628692626953, 0.2093648910522461, 0.21436691284179688, 0.21936893463134766, 0.22437095642089844, 0.22937297821044922, 0.234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 3.0, 9.0, 7.0, 19.0, 17.0, 23.0, 37.0, 48.0, 60.0, 110.0, 174.0, 336.0, 630.0, 1177.0, 2613.0, 6325.0, 18032.0, 63710.0, 323711.0, 2196821.0, 1320594.0, 194261.0, 43315.0, 13095.0, 4892.0, 2039.0, 994.0, 484.0, 279.0, 143.0, 111.0, 68.0, 39.0, 27.0, 26.0, 9.0, 6.0, 13.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33740234375, -0.3271331787109375, -0.316864013671875, -0.3065948486328125, -0.29632568359375, -0.2860565185546875, -0.275787353515625, -0.2655181884765625, -0.2552490234375, -0.2449798583984375, -0.234710693359375, -0.2244415283203125, -0.21417236328125, -0.2039031982421875, -0.193634033203125, -0.1833648681640625, -0.173095703125, -0.1628265380859375, -0.152557373046875, -0.1422882080078125, -0.13201904296875, -0.1217498779296875, -0.111480712890625, -0.1012115478515625, -0.0909423828125, -0.0806732177734375, -0.070404052734375, -0.0601348876953125, -0.04986572265625, -0.0395965576171875, -0.029327392578125, -0.0190582275390625, -0.0087890625, 0.0014801025390625, 0.011749267578125, 0.0220184326171875, 0.03228759765625, 0.0425567626953125, 0.052825927734375, 0.0630950927734375, 0.0733642578125, 0.0836334228515625, 0.093902587890625, 0.1041717529296875, 0.11444091796875, 0.1247100830078125, 0.134979248046875, 0.1452484130859375, 0.155517578125, 0.1657867431640625, 0.176055908203125, 0.1863250732421875, 0.19659423828125, 0.2068634033203125, 0.217132568359375, 0.2274017333984375, 0.2376708984375, 0.2479400634765625, 0.258209228515625, 0.2684783935546875, 0.27874755859375, 0.2890167236328125, 0.299285888671875, 0.3095550537109375, 0.31982421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 13.0, 17.0, 18.0, 30.0, 50.0, 83.0, 109.0, 178.0, 276.0, 484.0, 682.0, 745.0, 482.0, 341.0, 186.0, 120.0, 83.0, 49.0, 30.0, 27.0, 20.0, 9.0, 9.0, 10.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.2869911193847656, -0.27857208251953125, -0.2701530456542969, -0.2617340087890625, -0.2533149719238281, -0.24489593505859375, -0.23647689819335938, -0.228057861328125, -0.21963882446289062, -0.21121978759765625, -0.20280075073242188, -0.1943817138671875, -0.18596267700195312, -0.17754364013671875, -0.16912460327148438, -0.16070556640625, -0.15228652954101562, -0.14386749267578125, -0.13544845581054688, -0.1270294189453125, -0.11861038208007812, -0.11019134521484375, -0.10177230834960938, -0.093353271484375, -0.08493423461914062, -0.07651519775390625, -0.06809616088867188, -0.0596771240234375, -0.051258087158203125, -0.04283905029296875, -0.034420013427734375, -0.0260009765625, -0.017581939697265625, -0.00916290283203125, -0.000743865966796875, 0.0076751708984375, 0.016094207763671875, 0.02451324462890625, 0.032932281494140625, 0.041351318359375, 0.049770355224609375, 0.05818939208984375, 0.06660842895507812, 0.0750274658203125, 0.08344650268554688, 0.09186553955078125, 0.10028457641601562, 0.10870361328125, 0.11712265014648438, 0.12554168701171875, 0.13396072387695312, 0.1423797607421875, 0.15079879760742188, 0.15921783447265625, 0.16763687133789062, 0.176055908203125, 0.18447494506835938, 0.19289398193359375, 0.20131301879882812, 0.2097320556640625, 0.21815109252929688, 0.22657012939453125, 0.23498916625976562, 0.243408203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 11.0, 3.0, 6.0, 6.0, 12.0, 25.0, 31.0, 30.0, 58.0, 57.0, 76.0, 77.0, 81.0, 73.0, 84.0, 85.0, 73.0, 51.0, 35.0, 41.0, 23.0, 17.0, 12.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0217467546463013, -0.9913377165794373, -0.9609286785125732, -0.9305196404457092, -0.9001106023788452, -0.8697015643119812, -0.8392925262451172, -0.808883547782898, -0.7784744501113892, -0.7480654120445251, -0.7176563739776611, -0.6872473359107971, -0.6568382978439331, -0.6264292597770691, -0.5960202217102051, -0.5656112432479858, -0.5352022051811218, -0.5047931671142578, -0.4743841290473938, -0.4439750909805298, -0.41356605291366577, -0.38315701484680176, -0.35274800658226013, -0.3223389685153961, -0.2919299304485321, -0.2615208923816681, -0.23111185431480408, -0.20070283114910126, -0.17029379308223724, -0.13988475501537323, -0.10947573184967041, -0.0790666937828064, -0.04865765571594238, -0.018248621374368668, 0.012160412967205048, 0.042569443583488464, 0.07297848165035248, 0.10338751971721649, 0.1337965428829193, 0.16420558094978333, 0.19461461901664734, 0.22502365708351135, 0.25543269515037537, 0.285841703414917, 0.316250741481781, 0.346659779548645, 0.37706881761550903, 0.40747785568237305, 0.43788689374923706, 0.4682959318161011, 0.4987049698829651, 0.5291140079498291, 0.5595230460166931, 0.5899320840835571, 0.6203410625457764, 0.6507501602172852, 0.6811591386795044, 0.7115681767463684, 0.7419772148132324, 0.7723862528800964, 0.8027952909469604, 0.8332043290138245, 0.8636133670806885, 0.8940223455429077, 0.9244314432144165]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 6.0, 5.0, 11.0, 15.0, 14.0, 10.0, 15.0, 20.0, 19.0, 25.0, 26.0, 41.0, 40.0, 33.0, 32.0, 50.0, 53.0, 45.0, 42.0, 37.0, 58.0, 46.0, 46.0, 27.0, 30.0, 38.0, 35.0, 32.0, 27.0, 19.0, 19.0, 11.0, 14.0, 18.0, 9.0, 5.0, 8.0, 2.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7819831371307373, -0.7594842314720154, -0.7369852662086487, -0.7144863605499268, -0.6919873952865601, -0.6694884896278381, -0.6469895839691162, -0.6244906187057495, -0.6019916534423828, -0.5794927477836609, -0.5569937825202942, -0.5344948768615723, -0.5119959115982056, -0.48949700593948364, -0.46699807047843933, -0.444499135017395, -0.4220002293586731, -0.3995012938976288, -0.3770023584365845, -0.35450345277786255, -0.33200448751449585, -0.3095055818557739, -0.2870066463947296, -0.2645077109336853, -0.242008775472641, -0.21950984001159668, -0.19701090455055237, -0.17451198399066925, -0.15201304852962494, -0.12951411306858063, -0.10701519250869751, -0.0845162570476532, -0.06201726198196411, -0.0395183302462101, -0.017019398510456085, 0.005479529500007629, 0.02797846496105194, 0.05047740042209625, 0.07297632098197937, 0.09547525644302368, 0.117974191904068, 0.1404731273651123, 0.16297206282615662, 0.18547098338603973, 0.20796991884708405, 0.23046885430812836, 0.2529677748680115, 0.2754667103290558, 0.2979656457901001, 0.3204645812511444, 0.3429635167121887, 0.36546242237091064, 0.38796138763427734, 0.41046029329299927, 0.4329592287540436, 0.4554581642150879, 0.4779570996761322, 0.5004560351371765, 0.5229549407958984, 0.5454539060592651, 0.5679528117179871, 0.5904517769813538, 0.6129506826400757, 0.6354496479034424, 0.6579485535621643]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 12.0, 5.0, 7.0, 12.0, 27.0, 37.0, 36.0, 69.0, 97.0, 184.0, 294.0, 501.0, 966.0, 2063.0, 4029.0, 8473.0, 18203.0, 43395.0, 119322.0, 313414.0, 326314.0, 127936.0, 46155.0, 19345.0, 8971.0, 4201.0, 2090.0, 1050.0, 533.0, 316.0, 189.0, 91.0, 74.0, 49.0, 23.0, 20.0, 19.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.28045654296875, -0.2711181640625, -0.26177978515625, -0.25244140625, -0.24310302734375, -0.2337646484375, -0.22442626953125, -0.215087890625, -0.20574951171875, -0.1964111328125, -0.18707275390625, -0.177734375, -0.16839599609375, -0.1590576171875, -0.14971923828125, -0.140380859375, -0.13104248046875, -0.1217041015625, -0.11236572265625, -0.10302734375, -0.09368896484375, -0.0843505859375, -0.07501220703125, -0.065673828125, -0.05633544921875, -0.0469970703125, -0.03765869140625, -0.0283203125, -0.01898193359375, -0.0096435546875, -0.00030517578125, 0.009033203125, 0.01837158203125, 0.0277099609375, 0.03704833984375, 0.04638671875, 0.05572509765625, 0.0650634765625, 0.07440185546875, 0.083740234375, 0.09307861328125, 0.1024169921875, 0.11175537109375, 0.12109375, 0.13043212890625, 0.1397705078125, 0.14910888671875, 0.158447265625, 0.16778564453125, 0.1771240234375, 0.18646240234375, 0.19580078125, 0.20513916015625, 0.2144775390625, 0.22381591796875, 0.233154296875, 0.24249267578125, 0.2518310546875, 0.26116943359375, 0.2705078125, 0.27984619140625, 0.2891845703125, 0.29852294921875, 0.307861328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 11.0, 8.0, 11.0, 27.0, 24.0, 34.0, 46.0, 47.0, 68.0, 56.0, 72.0, 94.0, 88.0, 62.0, 78.0, 80.0, 37.0, 54.0, 30.0, 32.0, 10.0, 11.0, 14.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0836181640625, -0.07875633239746094, -0.07389450073242188, -0.06903266906738281, -0.06417083740234375, -0.05930900573730469, -0.054447174072265625, -0.04958534240722656, -0.0447235107421875, -0.03986167907714844, -0.034999847412109375, -0.030138015747070312, -0.02527618408203125, -0.020414352416992188, -0.015552520751953125, -0.010690689086914062, -0.005828857421875, -0.0009670257568359375, 0.003894805908203125, 0.008756637573242188, 0.01361846923828125, 0.018480300903320312, 0.023342132568359375, 0.028203964233398438, 0.0330657958984375, 0.03792762756347656, 0.042789459228515625, 0.04765129089355469, 0.05251312255859375, 0.05737495422363281, 0.062236785888671875, 0.06709861755371094, 0.07196044921875, 0.07682228088378906, 0.08168411254882812, 0.08654594421386719, 0.09140777587890625, 0.09626960754394531, 0.10113143920898438, 0.10599327087402344, 0.1108551025390625, 0.11571693420410156, 0.12057876586914062, 0.1254405975341797, 0.13030242919921875, 0.1351642608642578, 0.14002609252929688, 0.14488792419433594, 0.149749755859375, 0.15461158752441406, 0.15947341918945312, 0.1643352508544922, 0.16919708251953125, 0.1740589141845703, 0.17892074584960938, 0.18378257751464844, 0.1886444091796875, 0.19350624084472656, 0.19836807250976562, 0.2032299041748047, 0.20809173583984375, 0.2129535675048828, 0.21781539916992188, 0.22267723083496094, 0.2275390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 10.0, 18.0, 31.0, 58.0, 147.0, 267.0, 569.0, 1209.0, 2588.0, 5894.0, 13536.0, 37689.0, 154211.0, 516203.0, 232454.0, 52556.0, 17745.0, 7321.0, 3226.0, 1444.0, 658.0, 343.0, 150.0, 84.0, 49.0, 34.0, 12.0, 8.0, 12.0, 2.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3935546875, -0.38027191162109375, -0.3669891357421875, -0.35370635986328125, -0.340423583984375, -0.32714080810546875, -0.3138580322265625, -0.30057525634765625, -0.28729248046875, -0.27400970458984375, -0.2607269287109375, -0.24744415283203125, -0.234161376953125, -0.22087860107421875, -0.2075958251953125, -0.19431304931640625, -0.1810302734375, -0.16774749755859375, -0.1544647216796875, -0.14118194580078125, -0.127899169921875, -0.11461639404296875, -0.1013336181640625, -0.08805084228515625, -0.07476806640625, -0.06148529052734375, -0.0482025146484375, -0.03491973876953125, -0.021636962890625, -0.00835418701171875, 0.0049285888671875, 0.01821136474609375, 0.031494140625, 0.04477691650390625, 0.0580596923828125, 0.07134246826171875, 0.084625244140625, 0.09790802001953125, 0.1111907958984375, 0.12447357177734375, 0.13775634765625, 0.15103912353515625, 0.1643218994140625, 0.17760467529296875, 0.190887451171875, 0.20417022705078125, 0.2174530029296875, 0.23073577880859375, 0.2440185546875, 0.25730133056640625, 0.2705841064453125, 0.28386688232421875, 0.297149658203125, 0.31043243408203125, 0.3237152099609375, 0.33699798583984375, 0.35028076171875, 0.36356353759765625, 0.3768463134765625, 0.39012908935546875, 0.403411865234375, 0.41669464111328125, 0.4299774169921875, 0.44326019287109375, 0.45654296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 4.0, 2.0, 8.0, 4.0, 4.0, 8.0, 16.0, 14.0, 18.0, 28.0, 29.0, 30.0, 30.0, 43.0, 49.0, 61.0, 60.0, 62.0, 67.0, 53.0, 70.0, 56.0, 39.0, 48.0, 44.0, 26.0, 31.0, 24.0, 21.0, 18.0, 11.0, 8.0, 5.0, 5.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40625, -0.39488983154296875, -0.3835296630859375, -0.37216949462890625, -0.360809326171875, -0.34944915771484375, -0.3380889892578125, -0.32672882080078125, -0.31536865234375, -0.30400848388671875, -0.2926483154296875, -0.28128814697265625, -0.269927978515625, -0.25856781005859375, -0.2472076416015625, -0.23584747314453125, -0.2244873046875, -0.21312713623046875, -0.2017669677734375, -0.19040679931640625, -0.179046630859375, -0.16768646240234375, -0.1563262939453125, -0.14496612548828125, -0.13360595703125, -0.12224578857421875, -0.1108856201171875, -0.09952545166015625, -0.088165283203125, -0.07680511474609375, -0.0654449462890625, -0.05408477783203125, -0.042724609375, -0.03136444091796875, -0.0200042724609375, -0.00864410400390625, 0.002716064453125, 0.01407623291015625, 0.0254364013671875, 0.03679656982421875, 0.04815673828125, 0.05951690673828125, 0.0708770751953125, 0.08223724365234375, 0.093597412109375, 0.10495758056640625, 0.1163177490234375, 0.12767791748046875, 0.1390380859375, 0.15039825439453125, 0.1617584228515625, 0.17311859130859375, 0.184478759765625, 0.19583892822265625, 0.2071990966796875, 0.21855926513671875, 0.22991943359375, 0.24127960205078125, 0.2526397705078125, 0.26399993896484375, 0.275360107421875, 0.28672027587890625, 0.2980804443359375, 0.30944061279296875, 0.32080078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 1.0, 7.0, 8.0, 17.0, 29.0, 35.0, 65.0, 95.0, 200.0, 366.0, 559.0, 1087.0, 2155.0, 4454.0, 9976.0, 23890.0, 62425.0, 230100.0, 483577.0, 150036.0, 46034.0, 18185.0, 7875.0, 3568.0, 1729.0, 911.0, 503.0, 291.0, 143.0, 94.0, 56.0, 31.0, 18.0, 8.0, 13.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2037353515625, -0.1967945098876953, -0.18985366821289062, -0.18291282653808594, -0.17597198486328125, -0.16903114318847656, -0.16209030151367188, -0.1551494598388672, -0.1482086181640625, -0.1412677764892578, -0.13432693481445312, -0.12738609313964844, -0.12044525146484375, -0.11350440979003906, -0.10656356811523438, -0.09962272644042969, -0.092681884765625, -0.08574104309082031, -0.07880020141601562, -0.07185935974121094, -0.06491851806640625, -0.05797767639160156, -0.051036834716796875, -0.04409599304199219, -0.0371551513671875, -0.030214309692382812, -0.023273468017578125, -0.016332626342773438, -0.00939178466796875, -0.0024509429931640625, 0.004489898681640625, 0.011430740356445312, 0.01837158203125, 0.025312423706054688, 0.032253265380859375, 0.03919410705566406, 0.04613494873046875, 0.05307579040527344, 0.060016632080078125, 0.06695747375488281, 0.0738983154296875, 0.08083915710449219, 0.08777999877929688, 0.09472084045410156, 0.10166168212890625, 0.10860252380371094, 0.11554336547851562, 0.12248420715332031, 0.129425048828125, 0.1363658905029297, 0.14330673217773438, 0.15024757385253906, 0.15718841552734375, 0.16412925720214844, 0.17107009887695312, 0.1780109405517578, 0.1849517822265625, 0.1918926239013672, 0.19883346557617188, 0.20577430725097656, 0.21271514892578125, 0.21965599060058594, 0.22659683227539062, 0.2335376739501953, 0.240478515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 14.0, 14.0, 13.0, 40.0, 41.0, 81.0, 150.0, 195.0, 152.0, 88.0, 54.0, 28.0, 30.0, 19.0, 12.0, 7.0, 8.0, 7.0, 4.0, 6.0, 2.0, 1.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.115436553955078e-05, -5.9567391872406006e-05, -5.798041820526123e-05, -5.6393444538116455e-05, -5.480647087097168e-05, -5.3219497203826904e-05, -5.163252353668213e-05, -5.0045549869537354e-05, -4.845857620239258e-05, -4.68716025352478e-05, -4.528462886810303e-05, -4.369765520095825e-05, -4.2110681533813477e-05, -4.05237078666687e-05, -3.8936734199523926e-05, -3.734976053237915e-05, -3.5762786865234375e-05, -3.41758131980896e-05, -3.2588839530944824e-05, -3.100186586380005e-05, -2.9414892196655273e-05, -2.7827918529510498e-05, -2.6240944862365723e-05, -2.4653971195220947e-05, -2.3066997528076172e-05, -2.1480023860931396e-05, -1.989305019378662e-05, -1.8306076526641846e-05, -1.671910285949707e-05, -1.5132129192352295e-05, -1.354515552520752e-05, -1.1958181858062744e-05, -1.0371208190917969e-05, -8.784234523773193e-06, -7.197260856628418e-06, -5.610287189483643e-06, -4.023313522338867e-06, -2.436339855194092e-06, -8.493661880493164e-07, 7.37607479095459e-07, 2.3245811462402344e-06, 3.91155481338501e-06, 5.498528480529785e-06, 7.0855021476745605e-06, 8.672475814819336e-06, 1.0259449481964111e-05, 1.1846423149108887e-05, 1.3433396816253662e-05, 1.5020370483398438e-05, 1.6607344150543213e-05, 1.8194317817687988e-05, 1.9781291484832764e-05, 2.136826515197754e-05, 2.2955238819122314e-05, 2.454221248626709e-05, 2.6129186153411865e-05, 2.771615982055664e-05, 2.9303133487701416e-05, 3.089010715484619e-05, 3.247708082199097e-05, 3.406405448913574e-05, 3.565102815628052e-05, 3.723800182342529e-05, 3.882497549057007e-05, 4.0411949157714844e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 12.0, 29.0, 27.0, 32.0, 60.0, 83.0, 118.0, 198.0, 283.0, 467.0, 810.0, 1356.0, 2462.0, 4757.0, 9826.0, 21418.0, 50857.0, 152410.0, 438092.0, 238782.0, 72236.0, 28272.0, 12579.0, 6119.0, 3086.0, 1638.0, 936.0, 575.0, 318.0, 209.0, 145.0, 104.0, 77.0, 44.0, 29.0, 28.0, 20.0, 13.0, 12.0, 4.0, 4.0, 2.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.17630958557128906, -0.17036819458007812, -0.1644268035888672, -0.15848541259765625, -0.1525440216064453, -0.14660263061523438, -0.14066123962402344, -0.1347198486328125, -0.12877845764160156, -0.12283706665039062, -0.11689567565917969, -0.11095428466796875, -0.10501289367675781, -0.09907150268554688, -0.09313011169433594, -0.087188720703125, -0.08124732971191406, -0.07530593872070312, -0.06936454772949219, -0.06342315673828125, -0.05748176574707031, -0.051540374755859375, -0.04559898376464844, -0.0396575927734375, -0.03371620178222656, -0.027774810791015625, -0.021833419799804688, -0.01589202880859375, -0.009950637817382812, -0.004009246826171875, 0.0019321441650390625, 0.00787353515625, 0.013814926147460938, 0.019756317138671875, 0.025697708129882812, 0.03163909912109375, 0.03758049011230469, 0.043521881103515625, 0.04946327209472656, 0.0554046630859375, 0.06134605407714844, 0.06728744506835938, 0.07322883605957031, 0.07917022705078125, 0.08511161804199219, 0.09105300903320312, 0.09699440002441406, 0.102935791015625, 0.10887718200683594, 0.11481857299804688, 0.12075996398925781, 0.12670135498046875, 0.1326427459716797, 0.13858413696289062, 0.14452552795410156, 0.1504669189453125, 0.15640830993652344, 0.16234970092773438, 0.1682910919189453, 0.17423248291015625, 0.1801738739013672, 0.18611526489257812, 0.19205665588378906, 0.197998046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 2.0, 5.0, 3.0, 11.0, 13.0, 22.0, 34.0, 57.0, 90.0, 121.0, 136.0, 142.0, 114.0, 70.0, 56.0, 37.0, 17.0, 10.0, 8.0, 10.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.288330078125, -0.28067588806152344, -0.2730216979980469, -0.2653675079345703, -0.25771331787109375, -0.2500591278076172, -0.24240493774414062, -0.23475074768066406, -0.2270965576171875, -0.21944236755371094, -0.21178817749023438, -0.2041339874267578, -0.19647979736328125, -0.1888256072998047, -0.18117141723632812, -0.17351722717285156, -0.165863037109375, -0.15820884704589844, -0.15055465698242188, -0.1429004669189453, -0.13524627685546875, -0.1275920867919922, -0.11993789672851562, -0.11228370666503906, -0.1046295166015625, -0.09697532653808594, -0.08932113647460938, -0.08166694641113281, -0.07401275634765625, -0.06635856628417969, -0.058704376220703125, -0.05105018615722656, -0.04339599609375, -0.03574180603027344, -0.028087615966796875, -0.020433425903320312, -0.01277923583984375, -0.0051250457763671875, 0.002529144287109375, 0.010183334350585938, 0.0178375244140625, 0.025491714477539062, 0.033145904541015625, 0.04080009460449219, 0.04845428466796875, 0.05610847473144531, 0.06376266479492188, 0.07141685485839844, 0.079071044921875, 0.08672523498535156, 0.09437942504882812, 0.10203361511230469, 0.10968780517578125, 0.11734199523925781, 0.12499618530273438, 0.13265037536621094, 0.1403045654296875, 0.14795875549316406, 0.15561294555664062, 0.1632671356201172, 0.17092132568359375, 0.1785755157470703, 0.18622970581054688, 0.19388389587402344, 0.2015380859375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 8.0, 9.0, 22.0, 36.0, 47.0, 75.0, 99.0, 104.0, 101.0, 115.0, 95.0, 93.0, 52.0, 50.0, 30.0, 19.0, 9.0, 14.0, 6.0, 2.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6127504110336304, -1.5591074228286743, -1.5054645538330078, -1.4518215656280518, -1.3981785774230957, -1.3445355892181396, -1.2908927202224731, -1.237249732017517, -1.1836068630218506, -1.1299638748168945, -1.076321005821228, -1.022678017616272, -0.9690350294113159, -0.9153921008110046, -0.8617491722106934, -0.8081061840057373, -0.7544631958007812, -0.70082026720047, -0.6471772789955139, -0.5935343503952026, -0.5398913621902466, -0.4862484335899353, -0.432605504989624, -0.37896254658699036, -0.3253195881843567, -0.271676629781723, -0.21803368628025055, -0.16439074277877808, -0.11074778437614441, -0.05710482597351074, -0.003461897373199463, 0.050181061029434204, 0.10382401943206787, 0.15746697783470154, 0.211109921336174, 0.2647528648376465, 0.31839582324028015, 0.3720387816429138, 0.4256817102432251, 0.47932466864585876, 0.5329676270484924, 0.5866105556488037, 0.6402535438537598, 0.693896472454071, 0.7475394010543823, 0.8011823892593384, 0.8548253178596497, 0.9084682464599609, 0.962111234664917, 1.015754222869873, 1.0693970918655396, 1.1230400800704956, 1.1766830682754517, 1.2303259372711182, 1.2839689254760742, 1.3376119136810303, 1.3912549018859863, 1.4448978900909424, 1.4985407590866089, 1.552183747291565, 1.605826735496521, 1.6594696044921875, 1.7131125926971436, 1.7667555809020996, 1.8203984498977661]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 8.0, 13.0, 6.0, 9.0, 10.0, 16.0, 20.0, 24.0, 18.0, 27.0, 40.0, 38.0, 30.0, 45.0, 33.0, 44.0, 34.0, 39.0, 51.0, 45.0, 47.0, 25.0, 35.0, 39.0, 31.0, 33.0, 31.0, 21.0, 27.0, 32.0, 23.0, 16.0, 21.0, 7.0, 14.0, 8.0, 9.0, 5.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8816020488739014, -0.853523313999176, -0.8254446387290955, -0.7973659038543701, -0.7692871689796448, -0.7412084341049194, -0.7131297588348389, -0.6850510239601135, -0.6569722890853882, -0.6288935542106628, -0.6008148789405823, -0.5727361440658569, -0.5446574091911316, -0.5165786743164062, -0.4884999990463257, -0.46042126417160034, -0.4323425590991974, -0.40426385402679443, -0.3761851191520691, -0.34810641407966614, -0.3200276792049408, -0.29194897413253784, -0.2638702392578125, -0.23579153418540955, -0.2077128142118454, -0.17963409423828125, -0.1515553742647171, -0.12347666174173355, -0.0953979417681694, -0.06731922924518585, -0.039240509271621704, -0.011161789298057556, 0.016916930675506592, 0.04499565064907074, 0.07307437062263489, 0.10115308314561844, 0.12923181056976318, 0.15731051564216614, 0.18538923561573029, 0.21346795558929443, 0.24154667556285858, 0.26962539553642273, 0.2977041006088257, 0.325782835483551, 0.353861540555954, 0.38194024562835693, 0.4100189805030823, 0.4380977153778076, 0.46617642045021057, 0.4942551255226135, 0.5223338603973389, 0.5504125952720642, 0.5784912705421448, 0.6065700054168701, 0.6346487402915955, 0.6627274751663208, 0.6908061504364014, 0.7188848853111267, 0.7469635605812073, 0.7750422954559326, 0.803121030330658, 0.8311997652053833, 0.8592784404754639, 0.8873571753501892, 0.9154359102249146]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 3.0, 15.0, 11.0, 27.0, 37.0, 45.0, 62.0, 124.0, 179.0, 348.0, 668.0, 1340.0, 3046.0, 8021.0, 24825.0, 102023.0, 726140.0, 2915070.0, 327792.0, 58374.0, 15902.0, 5471.0, 2260.0, 1076.0, 594.0, 292.0, 187.0, 107.0, 77.0, 45.0, 34.0, 20.0, 18.0, 14.0, 5.0, 8.0, 6.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.31640625, -0.306304931640625, -0.29620361328125, -0.286102294921875, -0.2760009765625, -0.265899658203125, -0.25579833984375, -0.245697021484375, -0.235595703125, -0.225494384765625, -0.21539306640625, -0.205291748046875, -0.1951904296875, -0.185089111328125, -0.17498779296875, -0.164886474609375, -0.15478515625, -0.144683837890625, -0.13458251953125, -0.124481201171875, -0.1143798828125, -0.104278564453125, -0.09417724609375, -0.084075927734375, -0.073974609375, -0.063873291015625, -0.05377197265625, -0.043670654296875, -0.0335693359375, -0.023468017578125, -0.01336669921875, -0.003265380859375, 0.0068359375, 0.016937255859375, 0.02703857421875, 0.037139892578125, 0.0472412109375, 0.057342529296875, 0.06744384765625, 0.077545166015625, 0.087646484375, 0.097747802734375, 0.10784912109375, 0.117950439453125, 0.1280517578125, 0.138153076171875, 0.14825439453125, 0.158355712890625, 0.16845703125, 0.178558349609375, 0.18865966796875, 0.198760986328125, 0.2088623046875, 0.218963623046875, 0.22906494140625, 0.239166259765625, 0.249267578125, 0.259368896484375, 0.26947021484375, 0.279571533203125, 0.2896728515625, 0.299774169921875, 0.30987548828125, 0.319976806640625, 0.330078125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 12.0, 21.0, 21.0, 32.0, 36.0, 38.0, 57.0, 63.0, 60.0, 65.0, 80.0, 67.0, 73.0, 67.0, 59.0, 59.0, 46.0, 50.0, 20.0, 21.0, 18.0, 14.0, 3.0, 9.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09344482421875, -0.08835506439208984, -0.08326530456542969, -0.07817554473876953, -0.07308578491210938, -0.06799602508544922, -0.06290626525878906, -0.057816505432128906, -0.05272674560546875, -0.047636985778808594, -0.04254722595214844, -0.03745746612548828, -0.032367706298828125, -0.02727794647216797, -0.022188186645507812, -0.017098426818847656, -0.0120086669921875, -0.006918907165527344, -0.0018291473388671875, 0.0032606124877929688, 0.008350372314453125, 0.013440132141113281, 0.018529891967773438, 0.023619651794433594, 0.02870941162109375, 0.033799171447753906, 0.03888893127441406, 0.04397869110107422, 0.049068450927734375, 0.05415821075439453, 0.05924797058105469, 0.06433773040771484, 0.069427490234375, 0.07451725006103516, 0.07960700988769531, 0.08469676971435547, 0.08978652954101562, 0.09487628936767578, 0.09996604919433594, 0.1050558090209961, 0.11014556884765625, 0.1152353286743164, 0.12032508850097656, 0.12541484832763672, 0.13050460815429688, 0.13559436798095703, 0.1406841278076172, 0.14577388763427734, 0.1508636474609375, 0.15595340728759766, 0.1610431671142578, 0.16613292694091797, 0.17122268676757812, 0.17631244659423828, 0.18140220642089844, 0.1864919662475586, 0.19158172607421875, 0.1966714859008789, 0.20176124572753906, 0.20685100555419922, 0.21194076538085938, 0.21703052520751953, 0.2221202850341797, 0.22721004486083984, 0.2322998046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 8.0, 8.0, 13.0, 12.0, 13.0, 34.0, 52.0, 93.0, 122.0, 199.0, 249.0, 451.0, 783.0, 1253.0, 2249.0, 4653.0, 10091.0, 24575.0, 71031.0, 249227.0, 1167616.0, 2062995.0, 424768.0, 111099.0, 36053.0, 13826.0, 5949.0, 2878.0, 1582.0, 900.0, 524.0, 332.0, 214.0, 146.0, 94.0, 54.0, 46.0, 28.0, 24.0, 6.0, 12.0, 10.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3359375, -0.32550048828125, -0.3150634765625, -0.30462646484375, -0.294189453125, -0.28375244140625, -0.2733154296875, -0.26287841796875, -0.25244140625, -0.24200439453125, -0.2315673828125, -0.22113037109375, -0.210693359375, -0.20025634765625, -0.1898193359375, -0.17938232421875, -0.1689453125, -0.15850830078125, -0.1480712890625, -0.13763427734375, -0.127197265625, -0.11676025390625, -0.1063232421875, -0.09588623046875, -0.08544921875, -0.07501220703125, -0.0645751953125, -0.05413818359375, -0.043701171875, -0.03326416015625, -0.0228271484375, -0.01239013671875, -0.001953125, 0.00848388671875, 0.0189208984375, 0.02935791015625, 0.039794921875, 0.05023193359375, 0.0606689453125, 0.07110595703125, 0.08154296875, 0.09197998046875, 0.1024169921875, 0.11285400390625, 0.123291015625, 0.13372802734375, 0.1441650390625, 0.15460205078125, 0.1650390625, 0.17547607421875, 0.1859130859375, 0.19635009765625, 0.206787109375, 0.21722412109375, 0.2276611328125, 0.23809814453125, 0.24853515625, 0.25897216796875, 0.2694091796875, 0.27984619140625, 0.290283203125, 0.30072021484375, 0.3111572265625, 0.32159423828125, 0.33203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 8.0, 10.0, 12.0, 22.0, 29.0, 45.0, 56.0, 95.0, 148.0, 219.0, 369.0, 587.0, 811.0, 612.0, 369.0, 224.0, 148.0, 103.0, 63.0, 35.0, 34.0, 19.0, 19.0, 12.0, 12.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24821853637695312, -0.23886871337890625, -0.22951889038085938, -0.2201690673828125, -0.21081924438476562, -0.20146942138671875, -0.19211959838867188, -0.182769775390625, -0.17341995239257812, -0.16407012939453125, -0.15472030639648438, -0.1453704833984375, -0.13602066040039062, -0.12667083740234375, -0.11732101440429688, -0.10797119140625, -0.09862136840820312, -0.08927154541015625, -0.07992172241210938, -0.0705718994140625, -0.061222076416015625, -0.05187225341796875, -0.042522430419921875, -0.033172607421875, -0.023822784423828125, -0.01447296142578125, -0.005123138427734375, 0.0042266845703125, 0.013576507568359375, 0.02292633056640625, 0.032276153564453125, 0.0416259765625, 0.050975799560546875, 0.06032562255859375, 0.06967544555664062, 0.0790252685546875, 0.08837509155273438, 0.09772491455078125, 0.10707473754882812, 0.116424560546875, 0.12577438354492188, 0.13512420654296875, 0.14447402954101562, 0.1538238525390625, 0.16317367553710938, 0.17252349853515625, 0.18187332153320312, 0.19122314453125, 0.20057296752929688, 0.20992279052734375, 0.21927261352539062, 0.2286224365234375, 0.23797225952148438, 0.24732208251953125, 0.2566719055175781, 0.266021728515625, 0.2753715515136719, 0.28472137451171875, 0.2940711975097656, 0.3034210205078125, 0.3127708435058594, 0.32212066650390625, 0.3314704895019531, 0.3408203125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 14.0, 15.0, 15.0, 28.0, 31.0, 42.0, 60.0, 63.0, 68.0, 81.0, 93.0, 79.0, 87.0, 74.0, 57.0, 41.0, 40.0, 27.0, 13.0, 14.0, 14.0, 12.0, 11.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2687612771987915, -1.2335816621780396, -1.198401927947998, -1.163222312927246, -1.1280426979064941, -1.0928629636764526, -1.0576833486557007, -1.0225036144256592, -0.9873239994049072, -0.9521443247795105, -0.9169646501541138, -0.8817850351333618, -0.8466053605079651, -0.8114256858825684, -0.7762460708618164, -0.7410663962364197, -0.705886721611023, -0.6707070469856262, -0.6355273723602295, -0.6003477573394775, -0.5651680827140808, -0.5299884080886841, -0.49480876326560974, -0.4596291184425354, -0.42444944381713867, -0.38926976919174194, -0.3540901243686676, -0.31891047954559326, -0.28373080492019653, -0.248551145195961, -0.21337148547172546, -0.17819182574748993, -0.1430121660232544, -0.10783250629901886, -0.07265284657478333, -0.03747318685054779, -0.002293527126312256, 0.03288613259792328, 0.06806579232215881, 0.10324545204639435, 0.13842511177062988, 0.17360477149486542, 0.20878443121910095, 0.2439640909433365, 0.279143750667572, 0.31432342529296875, 0.3495030701160431, 0.38468271493911743, 0.41986238956451416, 0.4550420641899109, 0.49022170901298523, 0.5254013538360596, 0.5605810284614563, 0.595760703086853, 0.630940318107605, 0.6661199927330017, 0.7012996673583984, 0.7364793419837952, 0.7716590166091919, 0.8068386316299438, 0.8420183062553406, 0.8771979808807373, 0.9123775959014893, 0.947557270526886, 0.9827369451522827]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 8.0, 12.0, 9.0, 16.0, 13.0, 12.0, 21.0, 18.0, 30.0, 21.0, 33.0, 26.0, 35.0, 48.0, 33.0, 37.0, 30.0, 45.0, 29.0, 38.0, 51.0, 35.0, 39.0, 31.0, 34.0, 31.0, 33.0, 27.0, 15.0, 22.0, 18.0, 19.0, 19.0, 13.0, 13.0, 17.0, 13.0, 4.0, 7.0, 9.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.669475793838501, -0.6492985486984253, -0.6291213631629944, -0.6089441180229187, -0.588766872882843, -0.5685896873474121, -0.5484124422073364, -0.5282351970672607, -0.5080579519271851, -0.48788073658943176, -0.4677034914493561, -0.4475262761116028, -0.4273490309715271, -0.4071718156337738, -0.3869946002960205, -0.3668173551559448, -0.3466401696205139, -0.3264629542827606, -0.30628570914268494, -0.28610849380493164, -0.26593124866485596, -0.24575403332710266, -0.22557681798934937, -0.20539958775043488, -0.18522235751152039, -0.1650451272726059, -0.1448678970336914, -0.12469068169593811, -0.10451345145702362, -0.08433622121810913, -0.06415899842977524, -0.043981775641441345, -0.023804545402526855, -0.003627318888902664, 0.016549907624721527, 0.03672713413834572, 0.05690436065196991, 0.0770815908908844, 0.09725881367921829, 0.11743603646755219, 0.13761326670646667, 0.15779049694538116, 0.17796772718429565, 0.19814494252204895, 0.21832217276096344, 0.23849940299987793, 0.2586766183376312, 0.2788538336753845, 0.2990310788154602, 0.3192082941532135, 0.3393855392932892, 0.3595627546310425, 0.37973999977111816, 0.39991721510887146, 0.42009443044662476, 0.44027167558670044, 0.46044889092445374, 0.48062610626220703, 0.5008033514022827, 0.5209805965423584, 0.5411577820777893, 0.561335027217865, 0.5815122723579407, 0.6016894578933716, 0.6218667030334473]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 9.0, 12.0, 15.0, 19.0, 39.0, 54.0, 68.0, 96.0, 184.0, 255.0, 431.0, 699.0, 1222.0, 2014.0, 3447.0, 6186.0, 10591.0, 19058.0, 35368.0, 72722.0, 171784.0, 336910.0, 210151.0, 85837.0, 41233.0, 21480.0, 12053.0, 6846.0, 3990.0, 2298.0, 1330.0, 793.0, 458.0, 287.0, 200.0, 125.0, 95.0, 60.0, 44.0, 29.0, 20.0, 14.0, 6.0, 5.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25830078125, -0.2503795623779297, -0.24245834350585938, -0.23453712463378906, -0.22661590576171875, -0.21869468688964844, -0.21077346801757812, -0.2028522491455078, -0.1949310302734375, -0.1870098114013672, -0.17908859252929688, -0.17116737365722656, -0.16324615478515625, -0.15532493591308594, -0.14740371704101562, -0.1394824981689453, -0.131561279296875, -0.12364006042480469, -0.11571884155273438, -0.10779762268066406, -0.09987640380859375, -0.09195518493652344, -0.08403396606445312, -0.07611274719238281, -0.0681915283203125, -0.06027030944824219, -0.052349090576171875, -0.04442787170410156, -0.03650665283203125, -0.028585433959960938, -0.020664215087890625, -0.012742996215820312, -0.00482177734375, 0.0030994415283203125, 0.011020660400390625, 0.018941879272460938, 0.02686309814453125, 0.03478431701660156, 0.042705535888671875, 0.05062675476074219, 0.0585479736328125, 0.06646919250488281, 0.07439041137695312, 0.08231163024902344, 0.09023284912109375, 0.09815406799316406, 0.10607528686523438, 0.11399650573730469, 0.121917724609375, 0.1298389434814453, 0.13776016235351562, 0.14568138122558594, 0.15360260009765625, 0.16152381896972656, 0.16944503784179688, 0.1773662567138672, 0.1852874755859375, 0.1932086944580078, 0.20112991333007812, 0.20905113220214844, 0.21697235107421875, 0.22489356994628906, 0.23281478881835938, 0.2407360076904297, 0.2486572265625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 14.0, 22.0, 19.0, 28.0, 27.0, 56.0, 44.0, 40.0, 53.0, 66.0, 80.0, 57.0, 68.0, 55.0, 50.0, 43.0, 62.0, 50.0, 38.0, 40.0, 16.0, 16.0, 12.0, 11.0, 10.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09765625, -0.09277534484863281, -0.08789443969726562, -0.08301353454589844, -0.07813262939453125, -0.07325172424316406, -0.06837081909179688, -0.06348991394042969, -0.0586090087890625, -0.05372810363769531, -0.048847198486328125, -0.04396629333496094, -0.03908538818359375, -0.03420448303222656, -0.029323577880859375, -0.024442672729492188, -0.019561767578125, -0.014680862426757812, -0.009799957275390625, -0.0049190521240234375, -3.814697265625e-05, 0.0048427581787109375, 0.009723663330078125, 0.014604568481445312, 0.0194854736328125, 0.024366378784179688, 0.029247283935546875, 0.03412818908691406, 0.03900909423828125, 0.04388999938964844, 0.048770904541015625, 0.05365180969238281, 0.05853271484375, 0.06341361999511719, 0.06829452514648438, 0.07317543029785156, 0.07805633544921875, 0.08293724060058594, 0.08781814575195312, 0.09269905090332031, 0.0975799560546875, 0.10246086120605469, 0.10734176635742188, 0.11222267150878906, 0.11710357666015625, 0.12198448181152344, 0.12686538696289062, 0.1317462921142578, 0.136627197265625, 0.1415081024169922, 0.14638900756835938, 0.15126991271972656, 0.15615081787109375, 0.16103172302246094, 0.16591262817382812, 0.1707935333251953, 0.1756744384765625, 0.1805553436279297, 0.18543624877929688, 0.19031715393066406, 0.19519805908203125, 0.20007896423339844, 0.20495986938476562, 0.2098407745361328, 0.2147216796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 17.0, 12.0, 24.0, 25.0, 34.0, 48.0, 53.0, 105.0, 156.0, 275.0, 465.0, 963.0, 1882.0, 3600.0, 7079.0, 14442.0, 30233.0, 69648.0, 202500.0, 422429.0, 177020.0, 63079.0, 27648.0, 13194.0, 6625.0, 3257.0, 1689.0, 901.0, 452.0, 250.0, 140.0, 89.0, 56.0, 33.0, 24.0, 26.0, 14.0, 8.0, 10.0, 9.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.310302734375, -0.3004341125488281, -0.29056549072265625, -0.2806968688964844, -0.2708282470703125, -0.2609596252441406, -0.25109100341796875, -0.24122238159179688, -0.231353759765625, -0.22148513793945312, -0.21161651611328125, -0.20174789428710938, -0.1918792724609375, -0.18201065063476562, -0.17214202880859375, -0.16227340698242188, -0.15240478515625, -0.14253616333007812, -0.13266754150390625, -0.12279891967773438, -0.1129302978515625, -0.10306167602539062, -0.09319305419921875, -0.08332443237304688, -0.073455810546875, -0.06358718872070312, -0.05371856689453125, -0.043849945068359375, -0.0339813232421875, -0.024112701416015625, -0.01424407958984375, -0.004375457763671875, 0.0054931640625, 0.015361785888671875, 0.02523040771484375, 0.035099029541015625, 0.0449676513671875, 0.054836273193359375, 0.06470489501953125, 0.07457351684570312, 0.084442138671875, 0.09431076049804688, 0.10417938232421875, 0.11404800415039062, 0.1239166259765625, 0.13378524780273438, 0.14365386962890625, 0.15352249145507812, 0.16339111328125, 0.17325973510742188, 0.18312835693359375, 0.19299697875976562, 0.2028656005859375, 0.21273422241210938, 0.22260284423828125, 0.23247146606445312, 0.242340087890625, 0.2522087097167969, 0.26207733154296875, 0.2719459533691406, 0.2818145751953125, 0.2916831970214844, 0.30155181884765625, 0.3114204406738281, 0.3212890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 10.0, 10.0, 18.0, 17.0, 11.0, 21.0, 29.0, 32.0, 38.0, 36.0, 48.0, 43.0, 49.0, 65.0, 48.0, 46.0, 46.0, 43.0, 45.0, 52.0, 40.0, 27.0, 20.0, 35.0, 21.0, 25.0, 12.0, 22.0, 12.0, 13.0, 12.0, 5.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.34228515625, -0.33154296875, -0.32080078125, -0.31005859375, -0.29931640625, -0.28857421875, -0.27783203125, -0.26708984375, -0.25634765625, -0.24560546875, -0.23486328125, -0.22412109375, -0.21337890625, -0.20263671875, -0.19189453125, -0.18115234375, -0.17041015625, -0.15966796875, -0.14892578125, -0.13818359375, -0.12744140625, -0.11669921875, -0.10595703125, -0.09521484375, -0.08447265625, -0.07373046875, -0.06298828125, -0.05224609375, -0.04150390625, -0.03076171875, -0.02001953125, -0.00927734375, 0.00146484375, 0.01220703125, 0.02294921875, 0.03369140625, 0.04443359375, 0.05517578125, 0.06591796875, 0.07666015625, 0.08740234375, 0.09814453125, 0.10888671875, 0.11962890625, 0.13037109375, 0.14111328125, 0.15185546875, 0.16259765625, 0.17333984375, 0.18408203125, 0.19482421875, 0.20556640625, 0.21630859375, 0.22705078125, 0.23779296875, 0.24853515625, 0.25927734375, 0.27001953125, 0.28076171875, 0.29150390625, 0.30224609375, 0.31298828125, 0.32373046875, 0.33447265625, 0.34521484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 17.0, 21.0, 65.0, 89.0, 150.0, 291.0, 447.0, 843.0, 1526.0, 2642.0, 4890.0, 8557.0, 15554.0, 27801.0, 53806.0, 134353.0, 373212.0, 251194.0, 85800.0, 39418.0, 21034.0, 11755.0, 6640.0, 3705.0, 2068.0, 1122.0, 652.0, 347.0, 222.0, 118.0, 77.0, 39.0, 34.0, 18.0, 9.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129150390625, -0.12450027465820312, -0.11985015869140625, -0.11520004272460938, -0.1105499267578125, -0.10589981079101562, -0.10124969482421875, -0.09659957885742188, -0.091949462890625, -0.08729934692382812, -0.08264923095703125, -0.07799911499023438, -0.0733489990234375, -0.06869888305664062, -0.06404876708984375, -0.059398651123046875, -0.05474853515625, -0.050098419189453125, -0.04544830322265625, -0.040798187255859375, -0.0361480712890625, -0.031497955322265625, -0.02684783935546875, -0.022197723388671875, -0.017547607421875, -0.012897491455078125, -0.00824737548828125, -0.003597259521484375, 0.0010528564453125, 0.005702972412109375, 0.01035308837890625, 0.015003204345703125, 0.0196533203125, 0.024303436279296875, 0.02895355224609375, 0.033603668212890625, 0.0382537841796875, 0.042903900146484375, 0.04755401611328125, 0.052204132080078125, 0.056854248046875, 0.061504364013671875, 0.06615447998046875, 0.07080459594726562, 0.0754547119140625, 0.08010482788085938, 0.08475494384765625, 0.08940505981445312, 0.09405517578125, 0.09870529174804688, 0.10335540771484375, 0.10800552368164062, 0.1126556396484375, 0.11730575561523438, 0.12195587158203125, 0.12660598754882812, 0.131256103515625, 0.13590621948242188, 0.14055633544921875, 0.14520645141601562, 0.1498565673828125, 0.15450668334960938, 0.15915679931640625, 0.16380691528320312, 0.16845703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 3.0, 8.0, 14.0, 10.0, 28.0, 26.0, 48.0, 51.0, 106.0, 174.0, 170.0, 117.0, 60.0, 54.0, 27.0, 26.0, 12.0, 10.0, 7.0, 11.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.601478576660156e-05, -4.463084042072296e-05, -4.324689507484436e-05, -4.186294972896576e-05, -4.047900438308716e-05, -3.909505903720856e-05, -3.7711113691329956e-05, -3.6327168345451355e-05, -3.4943222999572754e-05, -3.355927765369415e-05, -3.217533230781555e-05, -3.079138696193695e-05, -2.940744161605835e-05, -2.802349627017975e-05, -2.6639550924301147e-05, -2.5255605578422546e-05, -2.3871660232543945e-05, -2.2487714886665344e-05, -2.1103769540786743e-05, -1.9719824194908142e-05, -1.833587884902954e-05, -1.695193350315094e-05, -1.556798815727234e-05, -1.4184042811393738e-05, -1.2800097465515137e-05, -1.1416152119636536e-05, -1.0032206773757935e-05, -8.648261427879333e-06, -7.264316082000732e-06, -5.880370736122131e-06, -4.49642539024353e-06, -3.112480044364929e-06, -1.7285346984863281e-06, -3.4458935260772705e-07, 1.039355993270874e-06, 2.423301339149475e-06, 3.807246685028076e-06, 5.191192030906677e-06, 6.575137376785278e-06, 7.95908272266388e-06, 9.34302806854248e-06, 1.0726973414421082e-05, 1.2110918760299683e-05, 1.3494864106178284e-05, 1.4878809452056885e-05, 1.6262754797935486e-05, 1.7646700143814087e-05, 1.9030645489692688e-05, 2.041459083557129e-05, 2.179853618144989e-05, 2.318248152732849e-05, 2.4566426873207092e-05, 2.5950372219085693e-05, 2.7334317564964294e-05, 2.8718262910842896e-05, 3.0102208256721497e-05, 3.14861536026001e-05, 3.28700989484787e-05, 3.42540442943573e-05, 3.56379896402359e-05, 3.70219349861145e-05, 3.84058803319931e-05, 3.9789825677871704e-05, 4.1173771023750305e-05, 4.2557716369628906e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 16.0, 20.0, 35.0, 56.0, 121.0, 168.0, 449.0, 1126.0, 2721.0, 7231.0, 18793.0, 48660.0, 159540.0, 558463.0, 168911.0, 50108.0, 19670.0, 7491.0, 2900.0, 1125.0, 471.0, 205.0, 106.0, 62.0, 33.0, 36.0, 13.0, 7.0, 8.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2333984375, -0.22622108459472656, -0.21904373168945312, -0.2118663787841797, -0.20468902587890625, -0.1975116729736328, -0.19033432006835938, -0.18315696716308594, -0.1759796142578125, -0.16880226135253906, -0.16162490844726562, -0.1544475555419922, -0.14727020263671875, -0.1400928497314453, -0.13291549682617188, -0.12573814392089844, -0.118560791015625, -0.11138343811035156, -0.10420608520507812, -0.09702873229980469, -0.08985137939453125, -0.08267402648925781, -0.07549667358398438, -0.06831932067871094, -0.0611419677734375, -0.05396461486816406, -0.046787261962890625, -0.03960990905761719, -0.03243255615234375, -0.025255203247070312, -0.018077850341796875, -0.010900497436523438, -0.00372314453125, 0.0034542083740234375, 0.010631561279296875, 0.017808914184570312, 0.02498626708984375, 0.03216361999511719, 0.039340972900390625, 0.04651832580566406, 0.0536956787109375, 0.06087303161621094, 0.06805038452148438, 0.07522773742675781, 0.08240509033203125, 0.08958244323730469, 0.09675979614257812, 0.10393714904785156, 0.111114501953125, 0.11829185485839844, 0.12546920776367188, 0.1326465606689453, 0.13982391357421875, 0.1470012664794922, 0.15417861938476562, 0.16135597229003906, 0.1685333251953125, 0.17571067810058594, 0.18288803100585938, 0.1900653839111328, 0.19724273681640625, 0.2044200897216797, 0.21159744262695312, 0.21877479553222656, 0.2259521484375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 10.0, 9.0, 7.0, 7.0, 9.0, 13.0, 17.0, 15.0, 30.0, 35.0, 43.0, 62.0, 94.0, 107.0, 121.0, 94.0, 92.0, 44.0, 34.0, 26.0, 18.0, 15.0, 16.0, 17.0, 11.0, 9.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.162109375, -0.15708160400390625, -0.1520538330078125, -0.14702606201171875, -0.141998291015625, -0.13697052001953125, -0.1319427490234375, -0.12691497802734375, -0.12188720703125, -0.11685943603515625, -0.1118316650390625, -0.10680389404296875, -0.101776123046875, -0.09674835205078125, -0.0917205810546875, -0.08669281005859375, -0.0816650390625, -0.07663726806640625, -0.0716094970703125, -0.06658172607421875, -0.061553955078125, -0.05652618408203125, -0.0514984130859375, -0.04647064208984375, -0.04144287109375, -0.03641510009765625, -0.0313873291015625, -0.02635955810546875, -0.021331787109375, -0.01630401611328125, -0.0112762451171875, -0.00624847412109375, -0.001220703125, 0.00380706787109375, 0.0088348388671875, 0.01386260986328125, 0.018890380859375, 0.02391815185546875, 0.0289459228515625, 0.03397369384765625, 0.03900146484375, 0.04402923583984375, 0.0490570068359375, 0.05408477783203125, 0.059112548828125, 0.06414031982421875, 0.0691680908203125, 0.07419586181640625, 0.0792236328125, 0.08425140380859375, 0.0892791748046875, 0.09430694580078125, 0.099334716796875, 0.10436248779296875, 0.1093902587890625, 0.11441802978515625, 0.11944580078125, 0.12447357177734375, 0.1295013427734375, 0.13452911376953125, 0.139556884765625, 0.14458465576171875, 0.1496124267578125, 0.15464019775390625, 0.15966796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 27.0, 84.0, 163.0, 282.0, 257.0, 129.0, 49.0, 13.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1073641777038574, -0.9641190767288208, -0.8208739757537842, -0.6776288747787476, -0.5343837738037109, -0.3911386728286743, -0.2478935718536377, -0.10464847087860107, 0.03859663009643555, 0.18184173107147217, 0.3250868320465088, 0.4683319330215454, 0.611577033996582, 0.7548221349716187, 0.8980672359466553, 1.041312336921692, 1.1845574378967285, 1.3278025388717651, 1.4710476398468018, 1.6142927408218384, 1.757537841796875, 1.9007829427719116, 2.0440280437469482, 2.1872730255126953, 2.3305182456970215, 2.4737634658813477, 2.6170084476470947, 2.760253429412842, 2.903498649597168, 3.046743869781494, 3.189988851547241, 3.3332338333129883, 3.4764795303344727, 3.619724750518799, 3.762969732284546, 3.906214714050293, 4.049459934234619, 4.192705154418945, 4.335949897766113, 4.4791951179504395, 4.622440338134766, 4.765685558319092, 4.908930778503418, 5.052175521850586, 5.195420742034912, 5.338665962219238, 5.481910705566406, 5.625155925750732, 5.768401145935059, 5.911646366119385, 6.054891586303711, 6.198136329650879, 6.341381549835205, 6.484626770019531, 6.627871513366699, 6.771116733551025, 6.914361953735352, 7.057607173919678, 7.200852394104004, 7.344097137451172, 7.487342357635498, 7.630587577819824, 7.773832321166992, 7.917077541351318, 8.060322761535645]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 7.0, 6.0, 11.0, 13.0, 17.0, 21.0, 15.0, 9.0, 24.0, 27.0, 23.0, 21.0, 24.0, 43.0, 46.0, 36.0, 43.0, 28.0, 33.0, 38.0, 28.0, 44.0, 46.0, 40.0, 25.0, 38.0, 26.0, 40.0, 26.0, 20.0, 21.0, 23.0, 22.0, 24.0, 20.0, 6.0, 8.0, 10.0, 6.0, 8.0, 4.0, 7.0, 8.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8121540546417236, -0.783103883266449, -0.7540537118911743, -0.7250035405158997, -0.695953369140625, -0.6669031977653503, -0.6378530263900757, -0.6088029146194458, -0.5797526836395264, -0.5507025122642517, -0.521652340888977, -0.4926021695137024, -0.46355199813842773, -0.4345018267631531, -0.4054516851902008, -0.37640151381492615, -0.3473513722419739, -0.3183012008666992, -0.28925102949142456, -0.2602008581161499, -0.23115070164203644, -0.20210053026676178, -0.17305037379264832, -0.14400020241737366, -0.114950031042099, -0.08589985966682434, -0.05684969574213028, -0.027799531817436218, 0.00125063955783844, 0.030300810933113098, 0.05935096740722656, 0.08840113878250122, 0.11745131015777588, 0.14650148153305054, 0.1755516529083252, 0.20460180938243866, 0.23365198075771332, 0.26270216703414917, 0.29175230860710144, 0.3208024799823761, 0.34985265135765076, 0.3789028227329254, 0.4079529941082001, 0.43700313568115234, 0.466053307056427, 0.49510347843170166, 0.5241536498069763, 0.553203821182251, 0.5822539925575256, 0.6113041639328003, 0.640354335308075, 0.6694045066833496, 0.6984546780586243, 0.7275048494338989, 0.7565549612045288, 0.7856051921844482, 0.8146553039550781, 0.8437054753303528, 0.8727556467056274, 0.9018058180809021, 0.9308559894561768, 0.9599061608314514, 0.9889563322067261, 1.018006443977356, 1.0470566749572754]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 11.0, 14.0, 11.0, 20.0, 38.0, 52.0, 72.0, 84.0, 142.0, 222.0, 319.0, 497.0, 798.0, 1315.0, 2260.0, 4081.0, 8115.0, 16443.0, 35752.0, 85098.0, 228738.0, 840760.0, 2206996.0, 491301.0, 156436.0, 60987.0, 26436.0, 12615.0, 6436.0, 3248.0, 1828.0, 1144.0, 669.0, 434.0, 277.0, 195.0, 119.0, 110.0, 52.0, 37.0, 34.0, 24.0, 15.0, 14.0, 13.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.192626953125, -0.18627357482910156, -0.17992019653320312, -0.1735668182373047, -0.16721343994140625, -0.1608600616455078, -0.15450668334960938, -0.14815330505371094, -0.1417999267578125, -0.13544654846191406, -0.12909317016601562, -0.12273979187011719, -0.11638641357421875, -0.11003303527832031, -0.10367965698242188, -0.09732627868652344, -0.090972900390625, -0.08461952209472656, -0.07826614379882812, -0.07191276550292969, -0.06555938720703125, -0.05920600891113281, -0.052852630615234375, -0.04649925231933594, -0.0401458740234375, -0.03379249572753906, -0.027439117431640625, -0.021085739135742188, -0.01473236083984375, -0.008378982543945312, -0.002025604248046875, 0.0043277740478515625, 0.01068115234375, 0.017034530639648438, 0.023387908935546875, 0.029741287231445312, 0.03609466552734375, 0.04244804382324219, 0.048801422119140625, 0.05515480041503906, 0.0615081787109375, 0.06786155700683594, 0.07421493530273438, 0.08056831359863281, 0.08692169189453125, 0.09327507019042969, 0.09962844848632812, 0.10598182678222656, 0.112335205078125, 0.11868858337402344, 0.12504196166992188, 0.1313953399658203, 0.13774871826171875, 0.1441020965576172, 0.15045547485351562, 0.15680885314941406, 0.1631622314453125, 0.16951560974121094, 0.17586898803710938, 0.1822223663330078, 0.18857574462890625, 0.1949291229248047, 0.20128250122070312, 0.20763587951660156, 0.2139892578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 8.0, 11.0, 11.0, 22.0, 26.0, 29.0, 34.0, 37.0, 48.0, 61.0, 61.0, 62.0, 66.0, 53.0, 64.0, 57.0, 59.0, 38.0, 60.0, 37.0, 37.0, 27.0, 23.0, 15.0, 9.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.101318359375, -0.09636116027832031, -0.09140396118164062, -0.08644676208496094, -0.08148956298828125, -0.07653236389160156, -0.07157516479492188, -0.06661796569824219, -0.0616607666015625, -0.05670356750488281, -0.051746368408203125, -0.04678916931152344, -0.04183197021484375, -0.03687477111816406, -0.031917572021484375, -0.026960372924804688, -0.022003173828125, -0.017045974731445312, -0.012088775634765625, -0.0071315765380859375, -0.00217437744140625, 0.0027828216552734375, 0.007740020751953125, 0.012697219848632812, 0.0176544189453125, 0.022611618041992188, 0.027568817138671875, 0.03252601623535156, 0.03748321533203125, 0.04244041442871094, 0.047397613525390625, 0.05235481262207031, 0.05731201171875, 0.06226921081542969, 0.06722640991210938, 0.07218360900878906, 0.07714080810546875, 0.08209800720214844, 0.08705520629882812, 0.09201240539550781, 0.0969696044921875, 0.10192680358886719, 0.10688400268554688, 0.11184120178222656, 0.11679840087890625, 0.12175559997558594, 0.12671279907226562, 0.1316699981689453, 0.136627197265625, 0.1415843963623047, 0.14654159545898438, 0.15149879455566406, 0.15645599365234375, 0.16141319274902344, 0.16637039184570312, 0.1713275909423828, 0.1762847900390625, 0.1812419891357422, 0.18619918823242188, 0.19115638732910156, 0.19611358642578125, 0.20107078552246094, 0.20602798461914062, 0.2109851837158203, 0.2159423828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 14.0, 16.0, 24.0, 32.0, 44.0, 58.0, 81.0, 119.0, 151.0, 254.0, 397.0, 519.0, 816.0, 1334.0, 1961.0, 3466.0, 5898.0, 10932.0, 21002.0, 43153.0, 97026.0, 238522.0, 672722.0, 1842119.0, 779127.0, 267941.0, 107604.0, 48014.0, 22737.0, 11992.0, 6446.0, 3637.0, 2181.0, 1384.0, 849.0, 537.0, 354.0, 259.0, 162.0, 123.0, 74.0, 50.0, 44.0, 34.0, 17.0, 20.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2490234375, -0.240875244140625, -0.23272705078125, -0.224578857421875, -0.2164306640625, -0.208282470703125, -0.20013427734375, -0.191986083984375, -0.183837890625, -0.175689697265625, -0.16754150390625, -0.159393310546875, -0.1512451171875, -0.143096923828125, -0.13494873046875, -0.126800537109375, -0.11865234375, -0.110504150390625, -0.10235595703125, -0.094207763671875, -0.0860595703125, -0.077911376953125, -0.06976318359375, -0.061614990234375, -0.053466796875, -0.045318603515625, -0.03717041015625, -0.029022216796875, -0.0208740234375, -0.012725830078125, -0.00457763671875, 0.003570556640625, 0.01171875, 0.019866943359375, 0.02801513671875, 0.036163330078125, 0.0443115234375, 0.052459716796875, 0.06060791015625, 0.068756103515625, 0.076904296875, 0.085052490234375, 0.09320068359375, 0.101348876953125, 0.1094970703125, 0.117645263671875, 0.12579345703125, 0.133941650390625, 0.14208984375, 0.150238037109375, 0.15838623046875, 0.166534423828125, 0.1746826171875, 0.182830810546875, 0.19097900390625, 0.199127197265625, 0.207275390625, 0.215423583984375, 0.22357177734375, 0.231719970703125, 0.2398681640625, 0.248016357421875, 0.25616455078125, 0.264312744140625, 0.2724609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 1.0, 5.0, 12.0, 16.0, 10.0, 15.0, 21.0, 31.0, 35.0, 41.0, 70.0, 91.0, 146.0, 177.0, 253.0, 369.0, 527.0, 655.0, 464.0, 317.0, 232.0, 173.0, 104.0, 75.0, 56.0, 48.0, 26.0, 28.0, 15.0, 12.0, 6.0, 12.0, 7.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.281005859375, -0.2732830047607422, -0.2655601501464844, -0.25783729553222656, -0.25011444091796875, -0.24239158630371094, -0.23466873168945312, -0.2269458770751953, -0.2192230224609375, -0.2115001678466797, -0.20377731323242188, -0.19605445861816406, -0.18833160400390625, -0.18060874938964844, -0.17288589477539062, -0.1651630401611328, -0.157440185546875, -0.1497173309326172, -0.14199447631835938, -0.13427162170410156, -0.12654876708984375, -0.11882591247558594, -0.11110305786132812, -0.10338020324707031, -0.0956573486328125, -0.08793449401855469, -0.08021163940429688, -0.07248878479003906, -0.06476593017578125, -0.05704307556152344, -0.049320220947265625, -0.04159736633300781, -0.03387451171875, -0.026151657104492188, -0.018428802490234375, -0.010705947875976562, -0.00298309326171875, 0.0047397613525390625, 0.012462615966796875, 0.020185470581054688, 0.0279083251953125, 0.03563117980957031, 0.043354034423828125, 0.05107688903808594, 0.05879974365234375, 0.06652259826660156, 0.07424545288085938, 0.08196830749511719, 0.089691162109375, 0.09741401672363281, 0.10513687133789062, 0.11285972595214844, 0.12058258056640625, 0.12830543518066406, 0.13602828979492188, 0.1437511444091797, 0.1514739990234375, 0.1591968536376953, 0.16691970825195312, 0.17464256286621094, 0.18236541748046875, 0.19008827209472656, 0.19781112670898438, 0.2055339813232422, 0.2132568359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 6.0, 12.0, 29.0, 34.0, 53.0, 66.0, 79.0, 84.0, 75.0, 92.0, 99.0, 78.0, 70.0, 61.0, 42.0, 31.0, 28.0, 15.0, 11.0, 11.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6479687690734863, -1.604292392730713, -1.5606160163879395, -1.5169397592544556, -1.4732633829116821, -1.4295870065689087, -1.3859106302261353, -1.3422343730926514, -1.298557996749878, -1.2548816204071045, -1.211205244064331, -1.1675289869308472, -1.1238526105880737, -1.0801762342453003, -1.0364998579025269, -0.9928235411643982, -0.9491471648216248, -0.9054707884788513, -0.8617944717407227, -0.8181180953979492, -0.7744417786598206, -0.7307654023170471, -0.6870890855789185, -0.643412709236145, -0.5997363328933716, -0.5560599565505981, -0.5123836398124695, -0.46870726346969604, -0.4250309467315674, -0.38135457038879395, -0.3376782238483429, -0.29400187730789185, -0.2503255605697632, -0.20664921402931213, -0.16297286748886108, -0.11929650604724884, -0.07562015950679779, -0.03194381296634674, 0.011732548475265503, 0.05540889501571655, 0.0990852415561676, 0.14276158809661865, 0.1864379346370697, 0.23011429607868195, 0.2737906575202942, 0.31746697425842285, 0.3611433506011963, 0.40481969714164734, 0.4484960436820984, 0.49217239022254944, 0.5358487367630005, 0.5795251131057739, 0.6232014298439026, 0.666877806186676, 0.7105541229248047, 0.7542304992675781, 0.7979068756103516, 0.841583251953125, 0.8852595686912537, 0.9289359450340271, 0.9726122617721558, 1.0162886381149292, 1.0599650144577026, 1.1036412715911865, 1.14731764793396]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 5.0, 6.0, 4.0, 9.0, 12.0, 10.0, 20.0, 13.0, 24.0, 18.0, 19.0, 18.0, 31.0, 30.0, 23.0, 31.0, 45.0, 40.0, 30.0, 39.0, 36.0, 44.0, 33.0, 43.0, 47.0, 39.0, 27.0, 40.0, 30.0, 38.0, 34.0, 25.0, 14.0, 21.0, 15.0, 21.0, 22.0, 8.0, 8.0, 10.0, 5.0, 7.0, 3.0, 0.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7765210270881653, -0.7536066174507141, -0.7306922674179077, -0.7077778577804565, -0.6848634481430054, -0.661949098110199, -0.6390346884727478, -0.6161203384399414, -0.5932059288024902, -0.5702915191650391, -0.5473771691322327, -0.5244627594947815, -0.5015484094619751, -0.4786339998245239, -0.45571959018707275, -0.43280521035194397, -0.4098908305168152, -0.3869764506816864, -0.3640620708465576, -0.34114766120910645, -0.31823328137397766, -0.2953189015388489, -0.2724044919013977, -0.24949011206626892, -0.22657573223114014, -0.20366135239601135, -0.18074695765972137, -0.1578325629234314, -0.1349181830883026, -0.11200379580259323, -0.08908940851688385, -0.06617501378059387, -0.04326069355010986, -0.020346306264400482, 0.002568081021308899, 0.02548246830701828, 0.04839685559272766, 0.07131124287843704, 0.09422563016414642, 0.1171400249004364, 0.14005440473556519, 0.16296878457069397, 0.18588317930698395, 0.20879757404327393, 0.2317119538784027, 0.2546263337135315, 0.27754074335098267, 0.30045512318611145, 0.32336950302124023, 0.346283882856369, 0.3691982626914978, 0.392112672328949, 0.41502705216407776, 0.43794143199920654, 0.4608558416366577, 0.4837702214717865, 0.5066846013069153, 0.5295990109443665, 0.5525133609771729, 0.575427770614624, 0.5983421802520752, 0.6212565302848816, 0.6441709399223328, 0.6670852899551392, 0.6899996995925903]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 8.0, 12.0, 8.0, 21.0, 25.0, 31.0, 77.0, 84.0, 127.0, 199.0, 293.0, 489.0, 720.0, 1196.0, 1932.0, 2936.0, 4544.0, 7317.0, 11663.0, 18671.0, 29895.0, 49802.0, 83304.0, 136979.0, 192500.0, 185137.0, 126209.0, 75451.0, 45138.0, 27466.0, 17256.0, 10505.0, 6872.0, 4277.0, 2734.0, 1666.0, 984.0, 735.0, 435.0, 293.0, 163.0, 142.0, 86.0, 58.0, 45.0, 18.0, 14.0, 15.0, 7.0, 7.0, 1.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.16943359375, -0.16395187377929688, -0.15847015380859375, -0.15298843383789062, -0.1475067138671875, -0.14202499389648438, -0.13654327392578125, -0.13106155395507812, -0.125579833984375, -0.12009811401367188, -0.11461639404296875, -0.10913467407226562, -0.1036529541015625, -0.09817123413085938, -0.09268951416015625, -0.08720779418945312, -0.08172607421875, -0.07624435424804688, -0.07076263427734375, -0.06528091430664062, -0.0597991943359375, -0.054317474365234375, -0.04883575439453125, -0.043354034423828125, -0.037872314453125, -0.032390594482421875, -0.02690887451171875, -0.021427154541015625, -0.0159454345703125, -0.010463714599609375, -0.00498199462890625, 0.000499725341796875, 0.0059814453125, 0.011463165283203125, 0.01694488525390625, 0.022426605224609375, 0.0279083251953125, 0.033390045166015625, 0.03887176513671875, 0.044353485107421875, 0.049835205078125, 0.055316925048828125, 0.06079864501953125, 0.06628036499023438, 0.0717620849609375, 0.07724380493164062, 0.08272552490234375, 0.08820724487304688, 0.09368896484375, 0.09917068481445312, 0.10465240478515625, 0.11013412475585938, 0.1156158447265625, 0.12109756469726562, 0.12657928466796875, 0.13206100463867188, 0.137542724609375, 0.14302444458007812, 0.14850616455078125, 0.15398788452148438, 0.1594696044921875, 0.16495132446289062, 0.17043304443359375, 0.17591476440429688, 0.181396484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 11.0, 10.0, 11.0, 12.0, 26.0, 24.0, 33.0, 30.0, 45.0, 37.0, 47.0, 56.0, 64.0, 55.0, 67.0, 70.0, 62.0, 44.0, 44.0, 43.0, 37.0, 45.0, 26.0, 20.0, 21.0, 19.0, 17.0, 6.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.1123952865600586, -0.10693168640136719, -0.10146808624267578, -0.09600448608398438, -0.09054088592529297, -0.08507728576660156, -0.07961368560791016, -0.07415008544921875, -0.06868648529052734, -0.06322288513183594, -0.05775928497314453, -0.052295684814453125, -0.04683208465576172, -0.04136848449707031, -0.035904884338378906, -0.0304412841796875, -0.024977684020996094, -0.019514083862304688, -0.014050483703613281, -0.008586883544921875, -0.0031232833862304688, 0.0023403167724609375, 0.007803916931152344, 0.01326751708984375, 0.018731117248535156, 0.024194717407226562, 0.02965831756591797, 0.035121917724609375, 0.04058551788330078, 0.04604911804199219, 0.051512718200683594, 0.056976318359375, 0.062439918518066406, 0.06790351867675781, 0.07336711883544922, 0.07883071899414062, 0.08429431915283203, 0.08975791931152344, 0.09522151947021484, 0.10068511962890625, 0.10614871978759766, 0.11161231994628906, 0.11707592010498047, 0.12253952026367188, 0.12800312042236328, 0.1334667205810547, 0.1389303207397461, 0.1443939208984375, 0.1498575210571289, 0.1553211212158203, 0.16078472137451172, 0.16624832153320312, 0.17171192169189453, 0.17717552185058594, 0.18263912200927734, 0.18810272216796875, 0.19356632232666016, 0.19902992248535156, 0.20449352264404297, 0.20995712280273438, 0.21542072296142578, 0.2208843231201172, 0.2263479232788086, 0.2318115234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 12.0, 12.0, 24.0, 28.0, 47.0, 70.0, 122.0, 230.0, 561.0, 1263.0, 3647.0, 10277.0, 30220.0, 99236.0, 350242.0, 386133.0, 114194.0, 34157.0, 11436.0, 3983.0, 1493.0, 565.0, 248.0, 122.0, 58.0, 45.0, 29.0, 11.0, 21.0, 13.0, 9.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.425048828125, -0.4113616943359375, -0.397674560546875, -0.3839874267578125, -0.37030029296875, -0.3566131591796875, -0.342926025390625, -0.3292388916015625, -0.3155517578125, -0.3018646240234375, -0.288177490234375, -0.2744903564453125, -0.26080322265625, -0.2471160888671875, -0.233428955078125, -0.2197418212890625, -0.2060546875, -0.1923675537109375, -0.178680419921875, -0.1649932861328125, -0.15130615234375, -0.1376190185546875, -0.123931884765625, -0.1102447509765625, -0.0965576171875, -0.0828704833984375, -0.069183349609375, -0.0554962158203125, -0.04180908203125, -0.0281219482421875, -0.014434814453125, -0.0007476806640625, 0.012939453125, 0.0266265869140625, 0.040313720703125, 0.0540008544921875, 0.06768798828125, 0.0813751220703125, 0.095062255859375, 0.1087493896484375, 0.1224365234375, 0.1361236572265625, 0.149810791015625, 0.1634979248046875, 0.17718505859375, 0.1908721923828125, 0.204559326171875, 0.2182464599609375, 0.23193359375, 0.2456207275390625, 0.259307861328125, 0.2729949951171875, 0.28668212890625, 0.3003692626953125, 0.314056396484375, 0.3277435302734375, 0.3414306640625, 0.3551177978515625, 0.368804931640625, 0.3824920654296875, 0.39617919921875, 0.4098663330078125, 0.423553466796875, 0.4372406005859375, 0.450927734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 7.0, 8.0, 9.0, 20.0, 19.0, 18.0, 17.0, 27.0, 27.0, 28.0, 41.0, 59.0, 49.0, 36.0, 47.0, 58.0, 39.0, 43.0, 38.0, 48.0, 47.0, 45.0, 37.0, 37.0, 33.0, 36.0, 24.0, 17.0, 13.0, 12.0, 4.0, 6.0, 2.0, 7.0, 8.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.431396484375, -0.4179801940917969, -0.40456390380859375, -0.3911476135253906, -0.3777313232421875, -0.3643150329589844, -0.35089874267578125, -0.3374824523925781, -0.324066162109375, -0.3106498718261719, -0.29723358154296875, -0.2838172912597656, -0.2704010009765625, -0.2569847106933594, -0.24356842041015625, -0.23015213012695312, -0.21673583984375, -0.20331954956054688, -0.18990325927734375, -0.17648696899414062, -0.1630706787109375, -0.14965438842773438, -0.13623809814453125, -0.12282180786132812, -0.109405517578125, -0.09598922729492188, -0.08257293701171875, -0.06915664672851562, -0.0557403564453125, -0.042324066162109375, -0.02890777587890625, -0.015491485595703125, -0.0020751953125, 0.011341094970703125, 0.02475738525390625, 0.038173675537109375, 0.0515899658203125, 0.06500625610351562, 0.07842254638671875, 0.09183883666992188, 0.105255126953125, 0.11867141723632812, 0.13208770751953125, 0.14550399780273438, 0.1589202880859375, 0.17233657836914062, 0.18575286865234375, 0.19916915893554688, 0.21258544921875, 0.22600173950195312, 0.23941802978515625, 0.2528343200683594, 0.2662506103515625, 0.2796669006347656, 0.29308319091796875, 0.3064994812011719, 0.319915771484375, 0.3333320617675781, 0.34674835205078125, 0.3601646423339844, 0.3735809326171875, 0.3869972229003906, 0.40041351318359375, 0.4138298034667969, 0.42724609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 11.0, 12.0, 19.0, 21.0, 39.0, 44.0, 69.0, 105.0, 146.0, 288.0, 416.0, 788.0, 1425.0, 2600.0, 5169.0, 10262.0, 21629.0, 47171.0, 110137.0, 312352.0, 325625.0, 116226.0, 49385.0, 22500.0, 10638.0, 5262.0, 2646.0, 1529.0, 792.0, 451.0, 279.0, 171.0, 119.0, 65.0, 47.0, 32.0, 27.0, 20.0, 13.0, 4.0, 1.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.164306640625, -0.15883445739746094, -0.15336227416992188, -0.1478900909423828, -0.14241790771484375, -0.1369457244873047, -0.13147354125976562, -0.12600135803222656, -0.1205291748046875, -0.11505699157714844, -0.10958480834960938, -0.10411262512207031, -0.09864044189453125, -0.09316825866699219, -0.08769607543945312, -0.08222389221191406, -0.076751708984375, -0.07127952575683594, -0.06580734252929688, -0.06033515930175781, -0.05486297607421875, -0.04939079284667969, -0.043918609619140625, -0.03844642639160156, -0.0329742431640625, -0.027502059936523438, -0.022029876708984375, -0.016557693481445312, -0.01108551025390625, -0.0056133270263671875, -0.000141143798828125, 0.0053310394287109375, 0.01080322265625, 0.016275405883789062, 0.021747589111328125, 0.027219772338867188, 0.03269195556640625, 0.03816413879394531, 0.043636322021484375, 0.04910850524902344, 0.0545806884765625, 0.06005287170410156, 0.06552505493164062, 0.07099723815917969, 0.07646942138671875, 0.08194160461425781, 0.08741378784179688, 0.09288597106933594, 0.098358154296875, 0.10383033752441406, 0.10930252075195312, 0.11477470397949219, 0.12024688720703125, 0.1257190704345703, 0.13119125366210938, 0.13666343688964844, 0.1421356201171875, 0.14760780334472656, 0.15307998657226562, 0.1585521697998047, 0.16402435302734375, 0.1694965362548828, 0.17496871948242188, 0.18044090270996094, 0.1859130859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 16.0, 15.0, 15.0, 25.0, 38.0, 54.0, 99.0, 145.0, 203.0, 153.0, 64.0, 49.0, 35.0, 33.0, 16.0, 8.0, 9.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0187110900878906e-05, -4.820898175239563e-05, -4.6230852603912354e-05, -4.425272345542908e-05, -4.22745943069458e-05, -4.0296465158462524e-05, -3.831833600997925e-05, -3.634020686149597e-05, -3.4362077713012695e-05, -3.238394856452942e-05, -3.0405819416046143e-05, -2.8427690267562866e-05, -2.644956111907959e-05, -2.4471431970596313e-05, -2.2493302822113037e-05, -2.051517367362976e-05, -1.8537044525146484e-05, -1.6558915376663208e-05, -1.4580786228179932e-05, -1.2602657079696655e-05, -1.0624527931213379e-05, -8.646398782730103e-06, -6.668269634246826e-06, -4.69014048576355e-06, -2.7120113372802734e-06, -7.338821887969971e-07, 1.2442469596862793e-06, 3.2223761081695557e-06, 5.200505256652832e-06, 7.178634405136108e-06, 9.156763553619385e-06, 1.1134892702102661e-05, 1.3113021850585938e-05, 1.5091150999069214e-05, 1.706928014755249e-05, 1.9047409296035767e-05, 2.1025538444519043e-05, 2.300366759300232e-05, 2.4981796741485596e-05, 2.6959925889968872e-05, 2.893805503845215e-05, 3.0916184186935425e-05, 3.28943133354187e-05, 3.487244248390198e-05, 3.6850571632385254e-05, 3.882870078086853e-05, 4.080682992935181e-05, 4.278495907783508e-05, 4.476308822631836e-05, 4.6741217374801636e-05, 4.871934652328491e-05, 5.069747567176819e-05, 5.2675604820251465e-05, 5.465373396873474e-05, 5.663186311721802e-05, 5.8609992265701294e-05, 6.058812141418457e-05, 6.256625056266785e-05, 6.454437971115112e-05, 6.65225088596344e-05, 6.850063800811768e-05, 7.047876715660095e-05, 7.245689630508423e-05, 7.44350254535675e-05, 7.641315460205078e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 15.0, 9.0, 28.0, 40.0, 37.0, 73.0, 127.0, 185.0, 310.0, 508.0, 983.0, 1972.0, 4536.0, 11369.0, 31597.0, 93028.0, 375199.0, 380796.0, 95111.0, 32235.0, 11679.0, 4653.0, 1916.0, 920.0, 466.0, 245.0, 166.0, 122.0, 76.0, 39.0, 40.0, 24.0, 13.0, 7.0, 6.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.287353515625, -0.2795886993408203, -0.2718238830566406, -0.26405906677246094, -0.25629425048828125, -0.24852943420410156, -0.24076461791992188, -0.2329998016357422, -0.2252349853515625, -0.2174701690673828, -0.20970535278320312, -0.20194053649902344, -0.19417572021484375, -0.18641090393066406, -0.17864608764648438, -0.1708812713623047, -0.163116455078125, -0.1553516387939453, -0.14758682250976562, -0.13982200622558594, -0.13205718994140625, -0.12429237365722656, -0.11652755737304688, -0.10876274108886719, -0.1009979248046875, -0.09323310852050781, -0.08546829223632812, -0.07770347595214844, -0.06993865966796875, -0.06217384338378906, -0.054409027099609375, -0.04664421081542969, -0.03887939453125, -0.031114578247070312, -0.023349761962890625, -0.015584945678710938, -0.00782012939453125, -5.53131103515625e-05, 0.007709503173828125, 0.015474319458007812, 0.0232391357421875, 0.031003952026367188, 0.038768768310546875, 0.04653358459472656, 0.05429840087890625, 0.06206321716308594, 0.06982803344726562, 0.07759284973144531, 0.085357666015625, 0.09312248229980469, 0.10088729858398438, 0.10865211486816406, 0.11641693115234375, 0.12418174743652344, 0.13194656372070312, 0.1397113800048828, 0.1474761962890625, 0.1552410125732422, 0.16300582885742188, 0.17077064514160156, 0.17853546142578125, 0.18630027770996094, 0.19406509399414062, 0.2018299102783203, 0.2095947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 10.0, 17.0, 18.0, 25.0, 37.0, 64.0, 126.0, 162.0, 190.0, 109.0, 71.0, 41.0, 28.0, 22.0, 18.0, 19.0, 5.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.246337890625, -0.23785781860351562, -0.22937774658203125, -0.22089767456054688, -0.2124176025390625, -0.20393753051757812, -0.19545745849609375, -0.18697738647460938, -0.178497314453125, -0.17001724243164062, -0.16153717041015625, -0.15305709838867188, -0.1445770263671875, -0.13609695434570312, -0.12761688232421875, -0.11913681030273438, -0.11065673828125, -0.10217666625976562, -0.09369659423828125, -0.08521652221679688, -0.0767364501953125, -0.06825637817382812, -0.05977630615234375, -0.051296234130859375, -0.042816162109375, -0.034336090087890625, -0.02585601806640625, -0.017375946044921875, -0.0088958740234375, -0.000415802001953125, 0.00806427001953125, 0.016544342041015625, 0.0250244140625, 0.033504486083984375, 0.04198455810546875, 0.050464630126953125, 0.0589447021484375, 0.06742477416992188, 0.07590484619140625, 0.08438491821289062, 0.092864990234375, 0.10134506225585938, 0.10982513427734375, 0.11830520629882812, 0.1267852783203125, 0.13526535034179688, 0.14374542236328125, 0.15222549438476562, 0.16070556640625, 0.16918563842773438, 0.17766571044921875, 0.18614578247070312, 0.1946258544921875, 0.20310592651367188, 0.21158599853515625, 0.22006607055664062, 0.228546142578125, 0.23702621459960938, 0.24550628662109375, 0.2539863586425781, 0.2624664306640625, 0.2709465026855469, 0.27942657470703125, 0.2879066467285156, 0.29638671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 45.0, 266.0, 482.0, 193.0, 24.0, 2.0, 1.0], "bins": [-16.446990966796875, -16.1691837310791, -15.891377449035645, -15.613570213317871, -15.335763931274414, -15.05795669555664, -14.780150413513184, -14.50234317779541, -14.224536895751953, -13.94672966003418, -13.668923377990723, -13.39111614227295, -13.113309860229492, -12.835502624511719, -12.557696342468262, -12.279889106750488, -12.002082824707031, -11.724275588989258, -11.4464693069458, -11.168662071228027, -10.89085578918457, -10.613048553466797, -10.33524227142334, -10.057435035705566, -9.779627799987793, -9.50182056427002, -9.224014282226562, -8.946207046508789, -8.668400764465332, -8.390593528747559, -8.112787246704102, -7.834980010986328, -7.557173728942871, -7.279366970062256, -7.001560211181641, -6.723753452301025, -6.44594669342041, -6.168139934539795, -5.89033317565918, -5.612525939941406, -5.334719181060791, -5.056912422180176, -4.7791056632995605, -4.501298904418945, -4.22349214553833, -3.945685386657715, -3.6678783893585205, -3.3900716304779053, -3.112265110015869, -2.834458351135254, -2.5566515922546387, -2.2788448333740234, -2.001038074493408, -1.7232311964035034, -1.4454243183135986, -1.1676175594329834, -0.8898106813430786, -0.6120039224624634, -0.33419710397720337, -0.05639028549194336, 0.22141647338867188, 0.4992232322692871, 0.7770301103591919, 1.0548368692398071, 1.3326436281204224]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 14.0, 6.0, 5.0, 9.0, 24.0, 15.0, 28.0, 32.0, 28.0, 34.0, 33.0, 37.0, 38.0, 42.0, 53.0, 63.0, 67.0, 51.0, 44.0, 63.0, 54.0, 43.0, 31.0, 37.0, 29.0, 31.0, 23.0, 17.0, 11.0, 11.0, 10.0, 8.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.956747829914093, -0.9150879979133606, -0.873428225517273, -0.8317683935165405, -0.7901085615158081, -0.7484487295150757, -0.706788957118988, -0.6651291251182556, -0.623469352722168, -0.5818095207214355, -0.5401497483253479, -0.4984899163246155, -0.45683008432388306, -0.415170282125473, -0.373510479927063, -0.33185064792633057, -0.29019081592559814, -0.24853099882602692, -0.2068711817264557, -0.16521137952804565, -0.12355156242847443, -0.0818917453289032, -0.040231943130493164, 0.0014278888702392578, 0.04308769106864929, 0.08474750816822052, 0.12640732526779175, 0.16806712746620178, 0.209726944565773, 0.25138676166534424, 0.2930465638637543, 0.3347063958644867, 0.3763662576675415, 0.41802605986595154, 0.45968589186668396, 0.501345694065094, 0.5430055260658264, 0.5846652984619141, 0.6263251304626465, 0.6679849624633789, 0.7096447944641113, 0.7513046264648438, 0.7929643988609314, 0.8346242308616638, 0.8762840628623962, 0.9179438352584839, 0.9596036672592163, 1.0012634992599487, 1.0429232120513916, 1.084583044052124, 1.1262428760528564, 1.1679027080535889, 1.2095624208450317, 1.2512222528457642, 1.2928820848464966, 1.334541916847229, 1.3762017488479614, 1.4178615808486938, 1.4595214128494263, 1.5011811256408691, 1.5428409576416016, 1.584500789642334, 1.6261606216430664, 1.6678204536437988, 1.7094802856445312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 3.0, 9.0, 15.0, 14.0, 17.0, 19.0, 40.0, 58.0, 67.0, 113.0, 158.0, 214.0, 345.0, 580.0, 843.0, 1438.0, 2437.0, 4595.0, 9366.0, 19759.0, 46586.0, 122861.0, 399964.0, 1914837.0, 1238912.0, 273725.0, 90886.0, 35022.0, 15005.0, 7262.0, 3700.0, 2082.0, 1229.0, 697.0, 462.0, 294.0, 217.0, 136.0, 109.0, 63.0, 39.0, 26.0, 26.0, 9.0, 12.0, 12.0, 4.0, 4.0, 4.0, 1.0, 2.0, 6.0], "bins": [-0.290283203125, -0.28218650817871094, -0.2740898132324219, -0.2659931182861328, -0.25789642333984375, -0.2497997283935547, -0.24170303344726562, -0.23360633850097656, -0.2255096435546875, -0.21741294860839844, -0.20931625366210938, -0.2012195587158203, -0.19312286376953125, -0.1850261688232422, -0.17692947387695312, -0.16883277893066406, -0.160736083984375, -0.15263938903808594, -0.14454269409179688, -0.1364459991455078, -0.12834930419921875, -0.12025260925292969, -0.11215591430664062, -0.10405921936035156, -0.0959625244140625, -0.08786582946777344, -0.07976913452148438, -0.07167243957519531, -0.06357574462890625, -0.05547904968261719, -0.047382354736328125, -0.03928565979003906, -0.03118896484375, -0.023092269897460938, -0.014995574951171875, -0.0068988800048828125, 0.00119781494140625, 0.009294509887695312, 0.017391204833984375, 0.025487899780273438, 0.0335845947265625, 0.04168128967285156, 0.049777984619140625, 0.05787467956542969, 0.06597137451171875, 0.07406806945800781, 0.08216476440429688, 0.09026145935058594, 0.098358154296875, 0.10645484924316406, 0.11455154418945312, 0.12264823913574219, 0.13074493408203125, 0.1388416290283203, 0.14693832397460938, 0.15503501892089844, 0.1631317138671875, 0.17122840881347656, 0.17932510375976562, 0.1874217987060547, 0.19551849365234375, 0.2036151885986328, 0.21171188354492188, 0.21980857849121094, 0.2279052734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 13.0, 13.0, 14.0, 11.0, 24.0, 29.0, 27.0, 22.0, 44.0, 28.0, 49.0, 38.0, 47.0, 39.0, 38.0, 63.0, 62.0, 57.0, 43.0, 36.0, 44.0, 39.0, 49.0, 28.0, 25.0, 24.0, 17.0, 15.0, 16.0, 9.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10968017578125, -0.10486888885498047, -0.10005760192871094, -0.0952463150024414, -0.09043502807617188, -0.08562374114990234, -0.08081245422363281, -0.07600116729736328, -0.07118988037109375, -0.06637859344482422, -0.06156730651855469, -0.056756019592285156, -0.051944732666015625, -0.047133445739746094, -0.04232215881347656, -0.03751087188720703, -0.0326995849609375, -0.02788829803466797, -0.023077011108398438, -0.018265724182128906, -0.013454437255859375, -0.008643150329589844, -0.0038318634033203125, 0.0009794235229492188, 0.00579071044921875, 0.010601997375488281, 0.015413284301757812, 0.020224571228027344, 0.025035858154296875, 0.029847145080566406, 0.03465843200683594, 0.03946971893310547, 0.044281005859375, 0.04909229278564453, 0.05390357971191406, 0.058714866638183594, 0.06352615356445312, 0.06833744049072266, 0.07314872741699219, 0.07796001434326172, 0.08277130126953125, 0.08758258819580078, 0.09239387512207031, 0.09720516204833984, 0.10201644897460938, 0.1068277359008789, 0.11163902282714844, 0.11645030975341797, 0.1212615966796875, 0.12607288360595703, 0.13088417053222656, 0.1356954574584961, 0.14050674438476562, 0.14531803131103516, 0.1501293182373047, 0.15494060516357422, 0.15975189208984375, 0.16456317901611328, 0.1693744659423828, 0.17418575286865234, 0.17899703979492188, 0.1838083267211914, 0.18861961364746094, 0.19343090057373047, 0.1982421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 13.0, 21.0, 18.0, 34.0, 57.0, 73.0, 103.0, 172.0, 243.0, 379.0, 605.0, 940.0, 1576.0, 2720.0, 4943.0, 8935.0, 18084.0, 39448.0, 95700.0, 261971.0, 904187.0, 1954870.0, 579441.0, 186499.0, 70912.0, 30744.0, 14455.0, 7356.0, 3948.0, 2218.0, 1324.0, 829.0, 522.0, 325.0, 225.0, 150.0, 86.0, 58.0, 35.0, 24.0, 13.0, 9.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3173828125, -0.3072547912597656, -0.29712677001953125, -0.2869987487792969, -0.2768707275390625, -0.2667427062988281, -0.25661468505859375, -0.24648666381835938, -0.236358642578125, -0.22623062133789062, -0.21610260009765625, -0.20597457885742188, -0.1958465576171875, -0.18571853637695312, -0.17559051513671875, -0.16546249389648438, -0.15533447265625, -0.14520645141601562, -0.13507843017578125, -0.12495040893554688, -0.1148223876953125, -0.10469436645507812, -0.09456634521484375, -0.08443832397460938, -0.074310302734375, -0.06418228149414062, -0.05405426025390625, -0.043926239013671875, -0.0337982177734375, -0.023670196533203125, -0.01354217529296875, -0.003414154052734375, 0.0067138671875, 0.016841888427734375, 0.02696990966796875, 0.037097930908203125, 0.0472259521484375, 0.057353973388671875, 0.06748199462890625, 0.07761001586914062, 0.087738037109375, 0.09786605834960938, 0.10799407958984375, 0.11812210083007812, 0.1282501220703125, 0.13837814331054688, 0.14850616455078125, 0.15863418579101562, 0.16876220703125, 0.17889022827148438, 0.18901824951171875, 0.19914627075195312, 0.2092742919921875, 0.21940231323242188, 0.22953033447265625, 0.23965835571289062, 0.249786376953125, 0.2599143981933594, 0.27004241943359375, 0.2801704406738281, 0.2902984619140625, 0.3004264831542969, 0.31055450439453125, 0.3206825256347656, 0.330810546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 13.0, 10.0, 8.0, 15.0, 11.0, 22.0, 29.0, 39.0, 60.0, 85.0, 110.0, 166.0, 237.0, 360.0, 563.0, 745.0, 543.0, 330.0, 221.0, 158.0, 99.0, 73.0, 58.0, 35.0, 20.0, 13.0, 10.0, 8.0, 6.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34033203125, -0.3283576965332031, -0.31638336181640625, -0.3044090270996094, -0.2924346923828125, -0.2804603576660156, -0.26848602294921875, -0.2565116882324219, -0.244537353515625, -0.23256301879882812, -0.22058868408203125, -0.20861434936523438, -0.1966400146484375, -0.18466567993164062, -0.17269134521484375, -0.16071701049804688, -0.14874267578125, -0.13676834106445312, -0.12479400634765625, -0.11281967163085938, -0.1008453369140625, -0.08887100219726562, -0.07689666748046875, -0.06492233276367188, -0.052947998046875, -0.040973663330078125, -0.02899932861328125, -0.017024993896484375, -0.0050506591796875, 0.006923675537109375, 0.01889801025390625, 0.030872344970703125, 0.0428466796875, 0.054821014404296875, 0.06679534912109375, 0.07876968383789062, 0.0907440185546875, 0.10271835327148438, 0.11469268798828125, 0.12666702270507812, 0.138641357421875, 0.15061569213867188, 0.16259002685546875, 0.17456436157226562, 0.1865386962890625, 0.19851303100585938, 0.21048736572265625, 0.22246170043945312, 0.23443603515625, 0.24641036987304688, 0.25838470458984375, 0.2703590393066406, 0.2823333740234375, 0.2943077087402344, 0.30628204345703125, 0.3182563781738281, 0.330230712890625, 0.3422050476074219, 0.35417938232421875, 0.3661537170410156, 0.3781280517578125, 0.3901023864746094, 0.40207672119140625, 0.4140510559082031, 0.426025390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 6.0, 7.0, 10.0, 16.0, 20.0, 38.0, 38.0, 54.0, 62.0, 74.0, 99.0, 99.0, 80.0, 87.0, 71.0, 61.0, 48.0, 29.0, 28.0, 19.0, 18.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4691505432128906, -1.4128050804138184, -1.3564597368240356, -1.3001142740249634, -1.2437689304351807, -1.1874234676361084, -1.1310780048370361, -1.0747326612472534, -1.0183873176574707, -0.9620419144630432, -0.9056965112686157, -0.8493510484695435, -0.7930057048797607, -0.7366602420806885, -0.680314838886261, -0.6239694356918335, -0.5676239728927612, -0.5112785696983337, -0.45493316650390625, -0.39858773350715637, -0.3422423303127289, -0.2858969271183014, -0.2295514941215515, -0.17320609092712402, -0.11686068773269653, -0.060515277087688446, -0.004169866442680359, 0.052175551652908325, 0.10852095484733582, 0.1648663580417633, 0.22121179103851318, 0.2775571942329407, 0.33390259742736816, 0.39024800062179565, 0.44659340381622314, 0.5029388666152954, 0.5592842102050781, 0.6156296730041504, 0.6719750761985779, 0.7283204793930054, 0.7846658825874329, 0.8410112857818604, 0.8973566889762878, 0.9537020921707153, 1.0100475549697876, 1.0663928985595703, 1.1227383613586426, 1.1790838241577148, 1.2354291677474976, 1.2917746305465698, 1.3481199741363525, 1.4044654369354248, 1.4608107805252075, 1.5171562433242798, 1.5735015869140625, 1.6298470497131348, 1.686192512512207, 1.7425379753112793, 1.798883318901062, 1.8552287817001343, 1.911574125289917, 1.9679195880889893, 2.0242650508880615, 2.0806102752685547, 2.136955738067627]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 8.0, 10.0, 15.0, 9.0, 8.0, 13.0, 16.0, 18.0, 13.0, 28.0, 25.0, 23.0, 30.0, 40.0, 46.0, 41.0, 42.0, 41.0, 38.0, 48.0, 29.0, 40.0, 32.0, 39.0, 40.0, 31.0, 30.0, 25.0, 23.0, 37.0, 26.0, 17.0, 14.0, 13.0, 17.0, 12.0, 13.0, 10.0, 9.0, 5.0, 9.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0113821029663086, -0.9774859547615051, -0.9435898661613464, -0.909693717956543, -0.8757976293563843, -0.8419014811515808, -0.8080053329467773, -0.7741092443466187, -0.7402130961418152, -0.7063169479370117, -0.672420859336853, -0.6385247111320496, -0.6046285629272461, -0.5707324743270874, -0.5368363261222839, -0.5029401779174805, -0.4690440893173218, -0.4351479709148407, -0.4012518525123596, -0.36735570430755615, -0.3334595859050751, -0.299563467502594, -0.2656673192977905, -0.23177120089530945, -0.19787508249282837, -0.1639789640903473, -0.13008283078670502, -0.09618670493364334, -0.062290579080581665, -0.028394460678100586, 0.005501672625541687, 0.03939780592918396, 0.07329380512237549, 0.10718993097543716, 0.14108605682849884, 0.1749821901321411, 0.2088783085346222, 0.24277442693710327, 0.27667057514190674, 0.3105666935443878, 0.3444628119468689, 0.37835893034935, 0.41225504875183105, 0.4461511969566345, 0.4800473153591156, 0.5139434337615967, 0.5478395819664001, 0.5817357301712036, 0.6156318187713623, 0.6495279669761658, 0.6834240555763245, 0.7173202037811279, 0.7512162923812866, 0.7851124405860901, 0.8190085887908936, 0.8529046773910522, 0.8868008255958557, 0.9206969738006592, 0.9545930624008179, 0.9884892106056213, 1.0223853588104248, 1.0562814474105835, 1.0901775360107422, 1.1240737438201904, 1.1579698324203491]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 12.0, 17.0, 33.0, 48.0, 74.0, 123.0, 195.0, 342.0, 514.0, 768.0, 1303.0, 2020.0, 3343.0, 5304.0, 8951.0, 14898.0, 24758.0, 42582.0, 74987.0, 134257.0, 224607.0, 216027.0, 124478.0, 69838.0, 39841.0, 23395.0, 13794.0, 8434.0, 5176.0, 3241.0, 2025.0, 1179.0, 725.0, 472.0, 290.0, 178.0, 116.0, 70.0, 43.0, 36.0, 24.0, 11.0, 9.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.2555732727050781, -0.24674224853515625, -0.23791122436523438, -0.2290802001953125, -0.22024917602539062, -0.21141815185546875, -0.20258712768554688, -0.193756103515625, -0.18492507934570312, -0.17609405517578125, -0.16726303100585938, -0.1584320068359375, -0.14960098266601562, -0.14076995849609375, -0.13193893432617188, -0.12310791015625, -0.11427688598632812, -0.10544586181640625, -0.09661483764648438, -0.0877838134765625, -0.07895278930664062, -0.07012176513671875, -0.061290740966796875, -0.052459716796875, -0.043628692626953125, -0.03479766845703125, -0.025966644287109375, -0.0171356201171875, -0.008304595947265625, 0.00052642822265625, 0.009357452392578125, 0.0181884765625, 0.027019500732421875, 0.03585052490234375, 0.044681549072265625, 0.0535125732421875, 0.062343597412109375, 0.07117462158203125, 0.08000564575195312, 0.088836669921875, 0.09766769409179688, 0.10649871826171875, 0.11532974243164062, 0.1241607666015625, 0.13299179077148438, 0.14182281494140625, 0.15065383911132812, 0.15948486328125, 0.16831588745117188, 0.17714691162109375, 0.18597793579101562, 0.1948089599609375, 0.20363998413085938, 0.21247100830078125, 0.22130203247070312, 0.230133056640625, 0.23896408081054688, 0.24779510498046875, 0.2566261291503906, 0.2654571533203125, 0.2742881774902344, 0.28311920166015625, 0.2919502258300781, 0.30078125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 2.0, 10.0, 12.0, 9.0, 20.0, 21.0, 22.0, 30.0, 34.0, 33.0, 30.0, 35.0, 38.0, 36.0, 43.0, 65.0, 58.0, 47.0, 55.0, 55.0, 47.0, 43.0, 35.0, 34.0, 29.0, 45.0, 26.0, 12.0, 19.0, 12.0, 15.0, 10.0, 3.0, 2.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.13978004455566406, -0.13417434692382812, -0.1285686492919922, -0.12296295166015625, -0.11735725402832031, -0.11175155639648438, -0.10614585876464844, -0.1005401611328125, -0.09493446350097656, -0.08932876586914062, -0.08372306823730469, -0.07811737060546875, -0.07251167297363281, -0.06690597534179688, -0.06130027770996094, -0.055694580078125, -0.05008888244628906, -0.044483184814453125, -0.03887748718261719, -0.03327178955078125, -0.027666091918945312, -0.022060394287109375, -0.016454696655273438, -0.0108489990234375, -0.0052433013916015625, 0.000362396240234375, 0.0059680938720703125, 0.01157379150390625, 0.017179489135742188, 0.022785186767578125, 0.028390884399414062, 0.03399658203125, 0.03960227966308594, 0.045207977294921875, 0.05081367492675781, 0.05641937255859375, 0.06202507019042969, 0.06763076782226562, 0.07323646545410156, 0.0788421630859375, 0.08444786071777344, 0.09005355834960938, 0.09565925598144531, 0.10126495361328125, 0.10687065124511719, 0.11247634887695312, 0.11808204650878906, 0.123687744140625, 0.12929344177246094, 0.13489913940429688, 0.1405048370361328, 0.14611053466796875, 0.1517162322998047, 0.15732192993164062, 0.16292762756347656, 0.1685333251953125, 0.17413902282714844, 0.17974472045898438, 0.1853504180908203, 0.19095611572265625, 0.1965618133544922, 0.20216751098632812, 0.20777320861816406, 0.21337890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 1.0, 2.0, 10.0, 5.0, 9.0, 15.0, 9.0, 26.0, 34.0, 47.0, 61.0, 99.0, 164.0, 291.0, 534.0, 1105.0, 2192.0, 4787.0, 10175.0, 22268.0, 50259.0, 117993.0, 283950.0, 314697.0, 136008.0, 56607.0, 25328.0, 11459.0, 5237.0, 2495.0, 1176.0, 604.0, 336.0, 194.0, 112.0, 81.0, 49.0, 29.0, 20.0, 14.0, 15.0, 13.0, 8.0, 8.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.415771484375, -0.401947021484375, -0.38812255859375, -0.374298095703125, -0.3604736328125, -0.346649169921875, -0.33282470703125, -0.319000244140625, -0.30517578125, -0.291351318359375, -0.27752685546875, -0.263702392578125, -0.2498779296875, -0.236053466796875, -0.22222900390625, -0.208404541015625, -0.194580078125, -0.180755615234375, -0.16693115234375, -0.153106689453125, -0.1392822265625, -0.125457763671875, -0.11163330078125, -0.097808837890625, -0.083984375, -0.070159912109375, -0.05633544921875, -0.042510986328125, -0.0286865234375, -0.014862060546875, -0.00103759765625, 0.012786865234375, 0.026611328125, 0.040435791015625, 0.05426025390625, 0.068084716796875, 0.0819091796875, 0.095733642578125, 0.10955810546875, 0.123382568359375, 0.13720703125, 0.151031494140625, 0.16485595703125, 0.178680419921875, 0.1925048828125, 0.206329345703125, 0.22015380859375, 0.233978271484375, 0.247802734375, 0.261627197265625, 0.27545166015625, 0.289276123046875, 0.3031005859375, 0.316925048828125, 0.33074951171875, 0.344573974609375, 0.3583984375, 0.372222900390625, 0.38604736328125, 0.399871826171875, 0.4136962890625, 0.427520751953125, 0.44134521484375, 0.455169677734375, 0.468994140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 7.0, 9.0, 15.0, 17.0, 21.0, 14.0, 27.0, 26.0, 32.0, 40.0, 32.0, 33.0, 40.0, 39.0, 50.0, 60.0, 55.0, 44.0, 44.0, 38.0, 45.0, 32.0, 29.0, 29.0, 35.0, 29.0, 22.0, 15.0, 23.0, 19.0, 13.0, 12.0, 12.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5439453125, -0.5272445678710938, -0.5105438232421875, -0.49384307861328125, -0.477142333984375, -0.46044158935546875, -0.4437408447265625, -0.42704010009765625, -0.41033935546875, -0.39363861083984375, -0.3769378662109375, -0.36023712158203125, -0.343536376953125, -0.32683563232421875, -0.3101348876953125, -0.29343414306640625, -0.2767333984375, -0.26003265380859375, -0.2433319091796875, -0.22663116455078125, -0.209930419921875, -0.19322967529296875, -0.1765289306640625, -0.15982818603515625, -0.14312744140625, -0.12642669677734375, -0.1097259521484375, -0.09302520751953125, -0.076324462890625, -0.05962371826171875, -0.0429229736328125, -0.02622222900390625, -0.009521484375, 0.00717926025390625, 0.0238800048828125, 0.04058074951171875, 0.057281494140625, 0.07398223876953125, 0.0906829833984375, 0.10738372802734375, 0.12408447265625, 0.14078521728515625, 0.1574859619140625, 0.17418670654296875, 0.190887451171875, 0.20758819580078125, 0.2242889404296875, 0.24098968505859375, 0.2576904296875, 0.27439117431640625, 0.2910919189453125, 0.30779266357421875, 0.324493408203125, 0.34119415283203125, 0.3578948974609375, 0.37459564208984375, 0.39129638671875, 0.40799713134765625, 0.4246978759765625, 0.44139862060546875, 0.458099365234375, 0.47480010986328125, 0.4915008544921875, 0.5082015991210938, 0.52490234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 6.0, 9.0, 10.0, 31.0, 38.0, 66.0, 111.0, 162.0, 229.0, 386.0, 563.0, 1023.0, 1911.0, 3710.0, 7888.0, 17758.0, 41561.0, 107422.0, 307035.0, 349077.0, 123939.0, 47634.0, 19858.0, 8990.0, 4180.0, 2057.0, 1141.0, 659.0, 415.0, 249.0, 147.0, 104.0, 68.0, 41.0, 27.0, 17.0, 7.0, 2.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2432861328125, -0.2357006072998047, -0.22811508178710938, -0.22052955627441406, -0.21294403076171875, -0.20535850524902344, -0.19777297973632812, -0.1901874542236328, -0.1826019287109375, -0.1750164031982422, -0.16743087768554688, -0.15984535217285156, -0.15225982666015625, -0.14467430114746094, -0.13708877563476562, -0.1295032501220703, -0.121917724609375, -0.11433219909667969, -0.10674667358398438, -0.09916114807128906, -0.09157562255859375, -0.08399009704589844, -0.07640457153320312, -0.06881904602050781, -0.0612335205078125, -0.05364799499511719, -0.046062469482421875, -0.03847694396972656, -0.03089141845703125, -0.023305892944335938, -0.015720367431640625, -0.008134841918945312, -0.00054931640625, 0.0070362091064453125, 0.014621734619140625, 0.022207260131835938, 0.02979278564453125, 0.03737831115722656, 0.044963836669921875, 0.05254936218261719, 0.0601348876953125, 0.06772041320800781, 0.07530593872070312, 0.08289146423339844, 0.09047698974609375, 0.09806251525878906, 0.10564804077148438, 0.11323356628417969, 0.120819091796875, 0.1284046173095703, 0.13599014282226562, 0.14357566833496094, 0.15116119384765625, 0.15874671936035156, 0.16633224487304688, 0.1739177703857422, 0.1815032958984375, 0.1890888214111328, 0.19667434692382812, 0.20425987243652344, 0.21184539794921875, 0.21943092346191406, 0.22701644897460938, 0.2346019744873047, 0.2421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 13.0, 8.0, 16.0, 13.0, 17.0, 14.0, 27.0, 20.0, 32.0, 46.0, 57.0, 93.0, 106.0, 97.0, 84.0, 56.0, 47.0, 38.0, 32.0, 21.0, 25.0, 21.0, 13.0, 15.0, 13.0, 7.0, 5.0, 7.0, 7.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.684925079345703e-05, -4.543270915746689e-05, -4.4016167521476746e-05, -4.25996258854866e-05, -4.118308424949646e-05, -3.976654261350632e-05, -3.8350000977516174e-05, -3.693345934152603e-05, -3.551691770553589e-05, -3.4100376069545746e-05, -3.26838344335556e-05, -3.126729279756546e-05, -2.9850751161575317e-05, -2.8434209525585175e-05, -2.7017667889595032e-05, -2.560112625360489e-05, -2.4184584617614746e-05, -2.2768042981624603e-05, -2.135150134563446e-05, -1.9934959709644318e-05, -1.8518418073654175e-05, -1.7101876437664032e-05, -1.568533480167389e-05, -1.4268793165683746e-05, -1.2852251529693604e-05, -1.143570989370346e-05, -1.0019168257713318e-05, -8.602626621723175e-06, -7.186084985733032e-06, -5.769543349742889e-06, -4.353001713752747e-06, -2.9364600777626038e-06, -1.519918441772461e-06, -1.0337680578231812e-07, 1.3131648302078247e-06, 2.7297064661979675e-06, 4.14624810218811e-06, 5.562789738178253e-06, 6.979331374168396e-06, 8.395873010158539e-06, 9.812414646148682e-06, 1.1228956282138824e-05, 1.2645497918128967e-05, 1.406203955411911e-05, 1.5478581190109253e-05, 1.6895122826099396e-05, 1.831166446208954e-05, 1.972820609807968e-05, 2.1144747734069824e-05, 2.2561289370059967e-05, 2.397783100605011e-05, 2.5394372642040253e-05, 2.6810914278030396e-05, 2.822745591402054e-05, 2.964399755001068e-05, 3.1060539186000824e-05, 3.247708082199097e-05, 3.389362245798111e-05, 3.531016409397125e-05, 3.6726705729961395e-05, 3.814324736595154e-05, 3.955978900194168e-05, 4.0976330637931824e-05, 4.2392872273921967e-05, 4.380941390991211e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 5.0, 5.0, 11.0, 12.0, 30.0, 28.0, 57.0, 89.0, 141.0, 251.0, 495.0, 956.0, 2063.0, 4972.0, 13062.0, 35979.0, 106313.0, 329608.0, 366883.0, 121571.0, 41053.0, 14858.0, 5608.0, 2296.0, 1038.0, 475.0, 271.0, 151.0, 103.0, 49.0, 39.0, 35.0, 10.0, 12.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.206298828125, -0.19806671142578125, -0.1898345947265625, -0.18160247802734375, -0.173370361328125, -0.16513824462890625, -0.1569061279296875, -0.14867401123046875, -0.14044189453125, -0.13220977783203125, -0.1239776611328125, -0.11574554443359375, -0.107513427734375, -0.09928131103515625, -0.0910491943359375, -0.08281707763671875, -0.0745849609375, -0.06635284423828125, -0.0581207275390625, -0.04988861083984375, -0.041656494140625, -0.03342437744140625, -0.0251922607421875, -0.01696014404296875, -0.00872802734375, -0.00049591064453125, 0.0077362060546875, 0.01596832275390625, 0.024200439453125, 0.03243255615234375, 0.0406646728515625, 0.04889678955078125, 0.05712890625, 0.06536102294921875, 0.0735931396484375, 0.08182525634765625, 0.090057373046875, 0.09828948974609375, 0.1065216064453125, 0.11475372314453125, 0.12298583984375, 0.13121795654296875, 0.1394500732421875, 0.14768218994140625, 0.155914306640625, 0.16414642333984375, 0.1723785400390625, 0.18061065673828125, 0.1888427734375, 0.19707489013671875, 0.2053070068359375, 0.21353912353515625, 0.221771240234375, 0.23000335693359375, 0.2382354736328125, 0.24646759033203125, 0.25469970703125, 0.26293182373046875, 0.2711639404296875, 0.27939605712890625, 0.287628173828125, 0.29586029052734375, 0.3040924072265625, 0.31232452392578125, 0.320556640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 5.0, 7.0, 10.0, 22.0, 13.0, 22.0, 26.0, 50.0, 36.0, 55.0, 59.0, 77.0, 86.0, 85.0, 81.0, 57.0, 58.0, 49.0, 23.0, 34.0, 26.0, 27.0, 14.0, 8.0, 10.0, 12.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.1644916534423828, -0.15820693969726562, -0.15192222595214844, -0.14563751220703125, -0.13935279846191406, -0.13306808471679688, -0.1267833709716797, -0.1204986572265625, -0.11421394348144531, -0.10792922973632812, -0.10164451599121094, -0.09535980224609375, -0.08907508850097656, -0.08279037475585938, -0.07650566101074219, -0.070220947265625, -0.06393623352050781, -0.057651519775390625, -0.05136680603027344, -0.04508209228515625, -0.03879737854003906, -0.032512664794921875, -0.026227951049804688, -0.0199432373046875, -0.013658523559570312, -0.007373809814453125, -0.0010890960693359375, 0.00519561767578125, 0.011480331420898438, 0.017765045166015625, 0.024049758911132812, 0.03033447265625, 0.03661918640136719, 0.042903900146484375, 0.04918861389160156, 0.05547332763671875, 0.06175804138183594, 0.06804275512695312, 0.07432746887207031, 0.0806121826171875, 0.08689689636230469, 0.09318161010742188, 0.09946632385253906, 0.10575103759765625, 0.11203575134277344, 0.11832046508789062, 0.12460517883300781, 0.130889892578125, 0.1371746063232422, 0.14345932006835938, 0.14974403381347656, 0.15602874755859375, 0.16231346130371094, 0.16859817504882812, 0.1748828887939453, 0.1811676025390625, 0.1874523162841797, 0.19373703002929688, 0.20002174377441406, 0.20630645751953125, 0.21259117126464844, 0.21887588500976562, 0.2251605987548828, 0.2314453125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 28.0, 87.0, 186.0, 320.0, 233.0, 110.0, 39.0, 8.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1280171871185303, -1.8813002109527588, -1.6345831155776978, -1.3878660202026367, -1.1411490440368652, -0.8944320678710938, -0.6477149724960327, -0.4009978771209717, -0.1542809009552002, 0.09243613481521606, 0.3391531705856323, 0.5858702063560486, 0.8325872421264648, 1.0793042182922363, 1.3260213136672974, 1.5727384090423584, 1.8194553852081299, 2.0661723613739014, 2.312889575958252, 2.5596065521240234, 2.806323528289795, 3.0530405044555664, 3.299757480621338, 3.5464746952056885, 3.79319167137146, 4.0399088859558105, 4.286625862121582, 4.5333428382873535, 4.780059814453125, 5.0267767906188965, 5.273493766784668, 5.520211219787598, 5.766927719116211, 6.013644695281982, 6.260361671447754, 6.507078647613525, 6.753795623779297, 7.000513076782227, 7.247230052947998, 7.4939470291137695, 7.740664005279541, 7.9873809814453125, 8.234098434448242, 8.480814933776855, 8.727532386779785, 8.974248886108398, 9.220966339111328, 9.467683792114258, 9.714400291442871, 9.9611177444458, 10.207834243774414, 10.454551696777344, 10.701268196105957, 10.947985649108887, 11.1947021484375, 11.44141960144043, 11.68813705444336, 11.934854507446289, 12.181571006774902, 12.428288459777832, 12.675004959106445, 12.921722412109375, 13.168438911437988, 13.415156364440918, 13.661872863769531]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 11.0, 9.0, 18.0, 10.0, 16.0, 15.0, 24.0, 30.0, 22.0, 34.0, 37.0, 34.0, 48.0, 51.0, 36.0, 64.0, 50.0, 49.0, 54.0, 32.0, 37.0, 50.0, 47.0, 44.0, 19.0, 34.0, 16.0, 21.0, 17.0, 17.0, 10.0, 7.0, 8.0, 10.0, 7.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7428758144378662, -1.6881561279296875, -1.6334364414215088, -1.57871675491333, -1.5239969491958618, -1.469277262687683, -1.4145575761795044, -1.3598378896713257, -1.3051180839538574, -1.2503983974456787, -1.1956787109375, -1.1409590244293213, -1.086239218711853, -1.0315195322036743, -0.9767998456954956, -0.9220801591873169, -0.8673604726791382, -0.8126407861709595, -0.757921040058136, -0.7032013535499573, -0.6484816074371338, -0.5937619209289551, -0.5390422344207764, -0.48432251811027527, -0.42960280179977417, -0.37488308548927307, -0.320163369178772, -0.26544368267059326, -0.21072396636009216, -0.15600425004959106, -0.10128456354141235, -0.046564847230911255, 0.008154749870300293, 0.0628744587302208, 0.1175941675901413, 0.1723138689994812, 0.2270335853099823, 0.2817533016204834, 0.3364729881286621, 0.3911927044391632, 0.4459124207496643, 0.500632107257843, 0.5553518533706665, 0.6100715398788452, 0.6647912263870239, 0.7195109724998474, 0.7742306590080261, 0.8289504051208496, 0.8836700916290283, 0.938389778137207, 0.9931095242500305, 1.0478291511535645, 1.1025489568710327, 1.1572686433792114, 1.2119883298873901, 1.2667080163955688, 1.321427822113037, 1.3761475086212158, 1.4308671951293945, 1.4855868816375732, 1.5403066873550415, 1.5950263738632202, 1.649746060371399, 1.7044657468795776, 1.7591854333877563]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 11.0, 12.0, 15.0, 21.0, 24.0, 42.0, 54.0, 74.0, 107.0, 114.0, 194.0, 285.0, 453.0, 659.0, 1009.0, 1703.0, 2784.0, 4527.0, 7761.0, 13947.0, 24695.0, 47372.0, 95897.0, 212798.0, 588133.0, 1774509.0, 883003.0, 284104.0, 120847.0, 58708.0, 30572.0, 16627.0, 9272.0, 5508.0, 3078.0, 1906.0, 1100.0, 758.0, 519.0, 335.0, 210.0, 168.0, 92.0, 81.0, 61.0, 42.0, 36.0, 15.0, 16.0, 6.0, 12.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.2200927734375, -0.21314048767089844, -0.20618820190429688, -0.1992359161376953, -0.19228363037109375, -0.1853313446044922, -0.17837905883789062, -0.17142677307128906, -0.1644744873046875, -0.15752220153808594, -0.15056991577148438, -0.1436176300048828, -0.13666534423828125, -0.1297130584716797, -0.12276077270507812, -0.11580848693847656, -0.108856201171875, -0.10190391540527344, -0.09495162963867188, -0.08799934387207031, -0.08104705810546875, -0.07409477233886719, -0.06714248657226562, -0.06019020080566406, -0.0532379150390625, -0.04628562927246094, -0.039333343505859375, -0.03238105773925781, -0.02542877197265625, -0.018476486206054688, -0.011524200439453125, -0.0045719146728515625, 0.00238037109375, 0.009332656860351562, 0.016284942626953125, 0.023237228393554688, 0.03018951416015625, 0.03714179992675781, 0.044094085693359375, 0.05104637145996094, 0.0579986572265625, 0.06495094299316406, 0.07190322875976562, 0.07885551452636719, 0.08580780029296875, 0.09276008605957031, 0.09971237182617188, 0.10666465759277344, 0.113616943359375, 0.12056922912597656, 0.12752151489257812, 0.1344738006591797, 0.14142608642578125, 0.1483783721923828, 0.15533065795898438, 0.16228294372558594, 0.1692352294921875, 0.17618751525878906, 0.18313980102539062, 0.1900920867919922, 0.19704437255859375, 0.2039966583251953, 0.21094894409179688, 0.21790122985839844, 0.224853515625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 6.0, 8.0, 18.0, 14.0, 11.0, 14.0, 17.0, 15.0, 30.0, 28.0, 41.0, 36.0, 34.0, 41.0, 38.0, 39.0, 40.0, 43.0, 45.0, 46.0, 40.0, 53.0, 48.0, 51.0, 46.0, 32.0, 28.0, 28.0, 20.0, 22.0, 17.0, 12.0, 11.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.144073486328125, -0.13836669921875, -0.132659912109375, -0.126953125, -0.121246337890625, -0.11553955078125, -0.109832763671875, -0.1041259765625, -0.098419189453125, -0.09271240234375, -0.087005615234375, -0.081298828125, -0.075592041015625, -0.06988525390625, -0.064178466796875, -0.0584716796875, -0.052764892578125, -0.04705810546875, -0.041351318359375, -0.03564453125, -0.029937744140625, -0.02423095703125, -0.018524169921875, -0.0128173828125, -0.007110595703125, -0.00140380859375, 0.004302978515625, 0.010009765625, 0.015716552734375, 0.02142333984375, 0.027130126953125, 0.0328369140625, 0.038543701171875, 0.04425048828125, 0.049957275390625, 0.0556640625, 0.061370849609375, 0.06707763671875, 0.072784423828125, 0.0784912109375, 0.084197998046875, 0.08990478515625, 0.095611572265625, 0.101318359375, 0.107025146484375, 0.11273193359375, 0.118438720703125, 0.1241455078125, 0.129852294921875, 0.13555908203125, 0.141265869140625, 0.14697265625, 0.152679443359375, 0.15838623046875, 0.164093017578125, 0.1697998046875, 0.175506591796875, 0.18121337890625, 0.186920166015625, 0.192626953125, 0.198333740234375, 0.20404052734375, 0.209747314453125, 0.2154541015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 16.0, 28.0, 26.0, 42.0, 89.0, 116.0, 176.0, 276.0, 458.0, 784.0, 1488.0, 2672.0, 5139.0, 10101.0, 21547.0, 48353.0, 113634.0, 294526.0, 951151.0, 1844581.0, 558157.0, 195997.0, 78889.0, 34062.0, 15741.0, 7557.0, 3826.0, 2039.0, 1108.0, 611.0, 388.0, 225.0, 172.0, 109.0, 62.0, 41.0, 35.0, 19.0, 9.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389404296875, -0.3773460388183594, -0.36528778076171875, -0.3532295227050781, -0.3411712646484375, -0.3291130065917969, -0.31705474853515625, -0.3049964904785156, -0.292938232421875, -0.2808799743652344, -0.26882171630859375, -0.2567634582519531, -0.2447052001953125, -0.23264694213867188, -0.22058868408203125, -0.20853042602539062, -0.19647216796875, -0.18441390991210938, -0.17235565185546875, -0.16029739379882812, -0.1482391357421875, -0.13618087768554688, -0.12412261962890625, -0.11206436157226562, -0.100006103515625, -0.08794784545898438, -0.07588958740234375, -0.06383132934570312, -0.0517730712890625, -0.039714813232421875, -0.02765655517578125, -0.015598297119140625, -0.0035400390625, 0.008518218994140625, 0.02057647705078125, 0.032634735107421875, 0.0446929931640625, 0.056751251220703125, 0.06880950927734375, 0.08086776733398438, 0.092926025390625, 0.10498428344726562, 0.11704254150390625, 0.12910079956054688, 0.1411590576171875, 0.15321731567382812, 0.16527557373046875, 0.17733383178710938, 0.18939208984375, 0.20145034790039062, 0.21350860595703125, 0.22556686401367188, 0.2376251220703125, 0.24968338012695312, 0.26174163818359375, 0.2737998962402344, 0.285858154296875, 0.2979164123535156, 0.30997467041015625, 0.3220329284667969, 0.3340911865234375, 0.3461494445800781, 0.35820770263671875, 0.3702659606933594, 0.38232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 12.0, 11.0, 17.0, 24.0, 34.0, 43.0, 60.0, 102.0, 133.0, 159.0, 233.0, 373.0, 557.0, 734.0, 544.0, 309.0, 216.0, 147.0, 114.0, 71.0, 39.0, 37.0, 26.0, 23.0, 12.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.4130859375, -0.39794921875, -0.3828125, -0.36767578125, -0.3525390625, -0.33740234375, -0.322265625, -0.30712890625, -0.2919921875, -0.27685546875, -0.26171875, -0.24658203125, -0.2314453125, -0.21630859375, -0.201171875, -0.18603515625, -0.1708984375, -0.15576171875, -0.140625, -0.12548828125, -0.1103515625, -0.09521484375, -0.080078125, -0.06494140625, -0.0498046875, -0.03466796875, -0.01953125, -0.00439453125, 0.0107421875, 0.02587890625, 0.041015625, 0.05615234375, 0.0712890625, 0.08642578125, 0.1015625, 0.11669921875, 0.1318359375, 0.14697265625, 0.162109375, 0.17724609375, 0.1923828125, 0.20751953125, 0.22265625, 0.23779296875, 0.2529296875, 0.26806640625, 0.283203125, 0.29833984375, 0.3134765625, 0.32861328125, 0.34375, 0.35888671875, 0.3740234375, 0.38916015625, 0.404296875, 0.41943359375, 0.4345703125, 0.44970703125, 0.46484375, 0.47998046875, 0.4951171875, 0.51025390625, 0.525390625, 0.54052734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 12.0, 15.0, 27.0, 39.0, 52.0, 64.0, 75.0, 84.0, 120.0, 112.0, 91.0, 84.0, 63.0, 64.0, 35.0, 21.0, 15.0, 7.0, 11.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2121691703796387, -2.129901647567749, -2.0476343631744385, -1.9653668403625488, -1.8830993175506592, -1.800831913948059, -1.718564510345459, -1.6362969875335693, -1.5540295839309692, -1.4717621803283691, -1.3894946575164795, -1.3072272539138794, -1.2249598503112793, -1.1426923274993896, -1.0604249238967896, -0.9781574606895447, -0.8958899974822998, -0.8136225342750549, -0.7313550710678101, -0.64908766746521, -0.5668202042579651, -0.4845527410507202, -0.40228530764579773, -0.32001787424087524, -0.23775041103363037, -0.1554829627275467, -0.07321551442146301, 0.009051933884620667, 0.09131938219070435, 0.17358684539794922, 0.2558542788028717, 0.3381217122077942, 0.42038917541503906, 0.5026566386222839, 0.5849241018295288, 0.6671915054321289, 0.7494589686393738, 0.8317264318466187, 0.9139938354492188, 0.9962612986564636, 1.0785287618637085, 1.1607961654663086, 1.2430636882781982, 1.3253310918807983, 1.4075984954833984, 1.489866018295288, 1.5721334218978882, 1.6544008255004883, 1.736668348312378, 1.818935751914978, 1.9012032747268677, 1.9834706783294678, 2.0657382011413574, 2.148005485534668, 2.2302730083465576, 2.3125405311584473, 2.394807815551758, 2.4770753383636475, 2.559342622756958, 2.6416101455688477, 2.7238776683807373, 2.806145191192627, 2.8884124755859375, 2.970679998397827, 3.052947521209717]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 3.0, 8.0, 7.0, 7.0, 13.0, 12.0, 9.0, 10.0, 23.0, 18.0, 26.0, 19.0, 25.0, 18.0, 33.0, 34.0, 40.0, 50.0, 31.0, 41.0, 34.0, 27.0, 36.0, 39.0, 48.0, 37.0, 41.0, 40.0, 26.0, 30.0, 28.0, 24.0, 27.0, 31.0, 14.0, 14.0, 17.0, 15.0, 6.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1867331266403198, -1.146103024482727, -1.1054729223251343, -1.064842939376831, -1.0242128372192383, -0.9835827350616455, -0.9429526329040527, -0.90232253074646, -0.861692488193512, -0.8210623860359192, -0.7804323434829712, -0.7398022413253784, -0.6991721391677856, -0.6585420966148376, -0.6179119944572449, -0.5772819519042969, -0.5366518497467041, -0.4960217773914337, -0.45539170503616333, -0.41476160287857056, -0.37413153052330017, -0.3335014581680298, -0.292871356010437, -0.2522412836551666, -0.21161121129989624, -0.17098113894462585, -0.13035105168819427, -0.08972097188234329, -0.04909089207649231, -0.008460819721221924, 0.032169267535209656, 0.07279935479164124, 0.11342930793762207, 0.15405938029289246, 0.19468946754932404, 0.23531955480575562, 0.275949627161026, 0.3165796995162964, 0.35720980167388916, 0.39783987402915955, 0.43846994638442993, 0.4791000187397003, 0.5197300910949707, 0.5603601932525635, 0.6009902954101562, 0.6416203379631042, 0.682250440120697, 0.722880482673645, 0.7635105848312378, 0.8041406869888306, 0.8447707295417786, 0.8854008316993713, 0.9260308742523193, 0.9666609764099121, 1.0072910785675049, 1.0479211807250977, 1.0885512828826904, 1.1291813850402832, 1.169811487197876, 1.2104414701461792, 1.251071572303772, 1.2917016744613647, 1.3323317766189575, 1.3729618787765503, 1.4135918617248535]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 15.0, 16.0, 21.0, 18.0, 50.0, 58.0, 80.0, 134.0, 192.0, 296.0, 441.0, 536.0, 816.0, 1233.0, 1838.0, 2790.0, 4187.0, 6414.0, 10138.0, 16107.0, 27638.0, 50192.0, 103849.0, 235368.0, 288095.0, 144463.0, 65076.0, 34205.0, 19815.0, 12064.0, 7454.0, 4846.0, 3327.0, 2103.0, 1448.0, 997.0, 711.0, 489.0, 336.0, 218.0, 156.0, 102.0, 66.0, 51.0, 34.0, 22.0, 19.0, 11.0, 10.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.304443359375, -0.2949867248535156, -0.28553009033203125, -0.2760734558105469, -0.2666168212890625, -0.2571601867675781, -0.24770355224609375, -0.23824691772460938, -0.228790283203125, -0.21933364868164062, -0.20987701416015625, -0.20042037963867188, -0.1909637451171875, -0.18150711059570312, -0.17205047607421875, -0.16259384155273438, -0.15313720703125, -0.14368057250976562, -0.13422393798828125, -0.12476730346679688, -0.1153106689453125, -0.10585403442382812, -0.09639739990234375, -0.08694076538085938, -0.077484130859375, -0.06802749633789062, -0.05857086181640625, -0.049114227294921875, -0.0396575927734375, -0.030200958251953125, -0.02074432373046875, -0.011287689208984375, -0.0018310546875, 0.007625579833984375, 0.01708221435546875, 0.026538848876953125, 0.0359954833984375, 0.045452117919921875, 0.05490875244140625, 0.06436538696289062, 0.073822021484375, 0.08327865600585938, 0.09273529052734375, 0.10219192504882812, 0.1116485595703125, 0.12110519409179688, 0.13056182861328125, 0.14001846313476562, 0.14947509765625, 0.15893173217773438, 0.16838836669921875, 0.17784500122070312, 0.1873016357421875, 0.19675827026367188, 0.20621490478515625, 0.21567153930664062, 0.225128173828125, 0.23458480834960938, 0.24404144287109375, 0.2534980773925781, 0.2629547119140625, 0.2724113464355469, 0.28186798095703125, 0.2913246154785156, 0.30078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 6.0, 1.0, 2.0, 7.0, 2.0, 13.0, 9.0, 6.0, 12.0, 13.0, 21.0, 19.0, 20.0, 30.0, 19.0, 30.0, 37.0, 34.0, 44.0, 28.0, 32.0, 40.0, 39.0, 40.0, 40.0, 35.0, 51.0, 36.0, 43.0, 33.0, 28.0, 30.0, 22.0, 33.0, 26.0, 25.0, 20.0, 13.0, 21.0, 18.0, 8.0, 4.0, 6.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.162353515625, -0.15653228759765625, -0.1507110595703125, -0.14488983154296875, -0.139068603515625, -0.13324737548828125, -0.1274261474609375, -0.12160491943359375, -0.11578369140625, -0.10996246337890625, -0.1041412353515625, -0.09832000732421875, -0.092498779296875, -0.08667755126953125, -0.0808563232421875, -0.07503509521484375, -0.0692138671875, -0.06339263916015625, -0.0575714111328125, -0.05175018310546875, -0.045928955078125, -0.04010772705078125, -0.0342864990234375, -0.02846527099609375, -0.02264404296875, -0.01682281494140625, -0.0110015869140625, -0.00518035888671875, 0.000640869140625, 0.00646209716796875, 0.0122833251953125, 0.01810455322265625, 0.02392578125, 0.02974700927734375, 0.0355682373046875, 0.04138946533203125, 0.047210693359375, 0.05303192138671875, 0.0588531494140625, 0.06467437744140625, 0.07049560546875, 0.07631683349609375, 0.0821380615234375, 0.08795928955078125, 0.093780517578125, 0.09960174560546875, 0.1054229736328125, 0.11124420166015625, 0.1170654296875, 0.12288665771484375, 0.1287078857421875, 0.13452911376953125, 0.140350341796875, 0.14617156982421875, 0.1519927978515625, 0.15781402587890625, 0.16363525390625, 0.16945648193359375, 0.1752777099609375, 0.18109893798828125, 0.186920166015625, 0.19274139404296875, 0.1985626220703125, 0.20438385009765625, 0.210205078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 4.0, 17.0, 27.0, 32.0, 77.0, 117.0, 310.0, 575.0, 1106.0, 2540.0, 5614.0, 12924.0, 29043.0, 75276.0, 282311.0, 438623.0, 125656.0, 41711.0, 17912.0, 7827.0, 3683.0, 1676.0, 720.0, 360.0, 198.0, 87.0, 51.0, 24.0, 20.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65380859375, -0.6371345520019531, -0.6204605102539062, -0.6037864685058594, -0.5871124267578125, -0.5704383850097656, -0.5537643432617188, -0.5370903015136719, -0.520416259765625, -0.5037422180175781, -0.48706817626953125, -0.4703941345214844, -0.4537200927734375, -0.4370460510253906, -0.42037200927734375, -0.4036979675292969, -0.38702392578125, -0.3703498840332031, -0.35367584228515625, -0.3370018005371094, -0.3203277587890625, -0.3036537170410156, -0.28697967529296875, -0.2703056335449219, -0.253631591796875, -0.23695755004882812, -0.22028350830078125, -0.20360946655273438, -0.1869354248046875, -0.17026138305664062, -0.15358734130859375, -0.13691329956054688, -0.1202392578125, -0.10356521606445312, -0.08689117431640625, -0.07021713256835938, -0.0535430908203125, -0.036869049072265625, -0.02019500732421875, -0.003520965576171875, 0.013153076171875, 0.029827117919921875, 0.04650115966796875, 0.06317520141601562, 0.0798492431640625, 0.09652328491210938, 0.11319732666015625, 0.12987136840820312, 0.14654541015625, 0.16321945190429688, 0.17989349365234375, 0.19656753540039062, 0.2132415771484375, 0.22991561889648438, 0.24658966064453125, 0.2632637023925781, 0.279937744140625, 0.2966117858886719, 0.31328582763671875, 0.3299598693847656, 0.3466339111328125, 0.3633079528808594, 0.37998199462890625, 0.3966560363769531, 0.413330078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 6.0, 7.0, 6.0, 9.0, 1.0, 8.0, 18.0, 9.0, 13.0, 20.0, 25.0, 21.0, 27.0, 26.0, 30.0, 42.0, 38.0, 52.0, 38.0, 42.0, 46.0, 34.0, 39.0, 33.0, 38.0, 37.0, 48.0, 36.0, 32.0, 24.0, 26.0, 23.0, 16.0, 18.0, 13.0, 14.0, 12.0, 13.0, 11.0, 12.0, 5.0, 2.0, 7.0, 7.0, 8.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.5771484375, -0.5598907470703125, -0.542633056640625, -0.5253753662109375, -0.50811767578125, -0.4908599853515625, -0.473602294921875, -0.4563446044921875, -0.4390869140625, -0.4218292236328125, -0.404571533203125, -0.3873138427734375, -0.37005615234375, -0.3527984619140625, -0.335540771484375, -0.3182830810546875, -0.301025390625, -0.2837677001953125, -0.266510009765625, -0.2492523193359375, -0.23199462890625, -0.2147369384765625, -0.197479248046875, -0.1802215576171875, -0.1629638671875, -0.1457061767578125, -0.128448486328125, -0.1111907958984375, -0.09393310546875, -0.0766754150390625, -0.059417724609375, -0.0421600341796875, -0.02490234375, -0.0076446533203125, 0.009613037109375, 0.0268707275390625, 0.04412841796875, 0.0613861083984375, 0.078643798828125, 0.0959014892578125, 0.1131591796875, 0.1304168701171875, 0.147674560546875, 0.1649322509765625, 0.18218994140625, 0.1994476318359375, 0.216705322265625, 0.2339630126953125, 0.251220703125, 0.2684783935546875, 0.285736083984375, 0.3029937744140625, 0.32025146484375, 0.3375091552734375, 0.354766845703125, 0.3720245361328125, 0.3892822265625, 0.4065399169921875, 0.423797607421875, 0.4410552978515625, 0.45831298828125, 0.4755706787109375, 0.492828369140625, 0.5100860595703125, 0.52734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 17.0, 19.0, 17.0, 47.0, 67.0, 124.0, 181.0, 296.0, 553.0, 883.0, 1583.0, 2764.0, 4783.0, 8484.0, 14869.0, 26375.0, 47069.0, 89651.0, 210704.0, 324708.0, 154211.0, 71467.0, 39116.0, 21691.0, 12259.0, 7169.0, 3953.0, 2289.0, 1329.0, 764.0, 451.0, 251.0, 133.0, 91.0, 58.0, 48.0, 26.0, 21.0, 7.0, 11.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11358642578125, -0.10927295684814453, -0.10495948791503906, -0.1006460189819336, -0.09633255004882812, -0.09201908111572266, -0.08770561218261719, -0.08339214324951172, -0.07907867431640625, -0.07476520538330078, -0.07045173645019531, -0.06613826751708984, -0.061824798583984375, -0.057511329650878906, -0.05319786071777344, -0.04888439178466797, -0.0445709228515625, -0.04025745391845703, -0.03594398498535156, -0.031630516052246094, -0.027317047119140625, -0.023003578186035156, -0.018690109252929688, -0.014376640319824219, -0.01006317138671875, -0.005749702453613281, -0.0014362335205078125, 0.0028772354125976562, 0.007190704345703125, 0.011504173278808594, 0.015817642211914062, 0.02013111114501953, 0.024444580078125, 0.02875804901123047, 0.03307151794433594, 0.037384986877441406, 0.041698455810546875, 0.046011924743652344, 0.05032539367675781, 0.05463886260986328, 0.05895233154296875, 0.06326580047607422, 0.06757926940917969, 0.07189273834228516, 0.07620620727539062, 0.0805196762084961, 0.08483314514160156, 0.08914661407470703, 0.0934600830078125, 0.09777355194091797, 0.10208702087402344, 0.1064004898071289, 0.11071395874023438, 0.11502742767333984, 0.11934089660644531, 0.12365436553955078, 0.12796783447265625, 0.13228130340576172, 0.1365947723388672, 0.14090824127197266, 0.14522171020507812, 0.1495351791381836, 0.15384864807128906, 0.15816211700439453, 0.1624755859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 8.0, 3.0, 10.0, 4.0, 7.0, 9.0, 9.0, 11.0, 9.0, 26.0, 31.0, 40.0, 57.0, 106.0, 167.0, 149.0, 126.0, 62.0, 47.0, 39.0, 15.0, 11.0, 14.0, 9.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.435943603515625e-05, -5.260482430458069e-05, -5.085021257400513e-05, -4.9095600843429565e-05, -4.7340989112854004e-05, -4.558637738227844e-05, -4.383176565170288e-05, -4.207715392112732e-05, -4.032254219055176e-05, -3.8567930459976196e-05, -3.6813318729400635e-05, -3.505870699882507e-05, -3.330409526824951e-05, -3.154948353767395e-05, -2.979487180709839e-05, -2.8040260076522827e-05, -2.6285648345947266e-05, -2.4531036615371704e-05, -2.2776424884796143e-05, -2.102181315422058e-05, -1.926720142364502e-05, -1.7512589693069458e-05, -1.5757977962493896e-05, -1.4003366231918335e-05, -1.2248754501342773e-05, -1.0494142770767212e-05, -8.73953104019165e-06, -6.984919309616089e-06, -5.230307579040527e-06, -3.475695848464966e-06, -1.7210841178894043e-06, 3.3527612686157227e-08, 1.7881393432617188e-06, 3.5427510738372803e-06, 5.297362804412842e-06, 7.051974534988403e-06, 8.806586265563965e-06, 1.0561197996139526e-05, 1.2315809726715088e-05, 1.407042145729065e-05, 1.582503318786621e-05, 1.7579644918441772e-05, 1.9334256649017334e-05, 2.1088868379592896e-05, 2.2843480110168457e-05, 2.459809184074402e-05, 2.635270357131958e-05, 2.810731530189514e-05, 2.9861927032470703e-05, 3.1616538763046265e-05, 3.3371150493621826e-05, 3.512576222419739e-05, 3.688037395477295e-05, 3.863498568534851e-05, 4.038959741592407e-05, 4.2144209146499634e-05, 4.3898820877075195e-05, 4.565343260765076e-05, 4.740804433822632e-05, 4.916265606880188e-05, 5.091726779937744e-05, 5.2671879529953e-05, 5.4426491260528564e-05, 5.6181102991104126e-05, 5.793571472167969e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 16.0, 28.0, 46.0, 75.0, 107.0, 189.0, 416.0, 781.0, 1590.0, 3659.0, 7730.0, 17536.0, 40967.0, 103022.0, 319666.0, 355804.0, 115994.0, 45632.0, 19222.0, 8565.0, 3900.0, 1837.0, 844.0, 441.0, 205.0, 109.0, 67.0, 47.0, 27.0, 17.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2052001953125, -0.1991748809814453, -0.19314956665039062, -0.18712425231933594, -0.18109893798828125, -0.17507362365722656, -0.16904830932617188, -0.1630229949951172, -0.1569976806640625, -0.1509723663330078, -0.14494705200195312, -0.13892173767089844, -0.13289642333984375, -0.12687110900878906, -0.12084579467773438, -0.11482048034667969, -0.108795166015625, -0.10276985168457031, -0.09674453735351562, -0.09071922302246094, -0.08469390869140625, -0.07866859436035156, -0.07264328002929688, -0.06661796569824219, -0.0605926513671875, -0.05456733703613281, -0.048542022705078125, -0.04251670837402344, -0.03649139404296875, -0.030466079711914062, -0.024440765380859375, -0.018415451049804688, -0.01239013671875, -0.0063648223876953125, -0.000339508056640625, 0.0056858062744140625, 0.01171112060546875, 0.017736434936523438, 0.023761749267578125, 0.029787063598632812, 0.0358123779296875, 0.04183769226074219, 0.047863006591796875, 0.05388832092285156, 0.05991363525390625, 0.06593894958496094, 0.07196426391601562, 0.07798957824707031, 0.084014892578125, 0.09004020690917969, 0.09606552124023438, 0.10209083557128906, 0.10811614990234375, 0.11414146423339844, 0.12016677856445312, 0.1261920928955078, 0.1322174072265625, 0.1382427215576172, 0.14426803588867188, 0.15029335021972656, 0.15631866455078125, 0.16234397888183594, 0.16836929321289062, 0.1743946075439453, 0.180419921875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 15.0, 6.0, 19.0, 17.0, 21.0, 25.0, 35.0, 42.0, 46.0, 81.0, 75.0, 103.0, 101.0, 88.0, 61.0, 50.0, 36.0, 35.0, 18.0, 21.0, 20.0, 7.0, 8.0, 13.0, 6.0, 7.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1878662109375, -0.18215179443359375, -0.1764373779296875, -0.17072296142578125, -0.165008544921875, -0.15929412841796875, -0.1535797119140625, -0.14786529541015625, -0.14215087890625, -0.13643646240234375, -0.1307220458984375, -0.12500762939453125, -0.119293212890625, -0.11357879638671875, -0.1078643798828125, -0.10214996337890625, -0.096435546875, -0.09072113037109375, -0.0850067138671875, -0.07929229736328125, -0.073577880859375, -0.06786346435546875, -0.0621490478515625, -0.05643463134765625, -0.05072021484375, -0.04500579833984375, -0.0392913818359375, -0.03357696533203125, -0.027862548828125, -0.02214813232421875, -0.0164337158203125, -0.01071929931640625, -0.0050048828125, 0.00070953369140625, 0.0064239501953125, 0.01213836669921875, 0.017852783203125, 0.02356719970703125, 0.0292816162109375, 0.03499603271484375, 0.04071044921875, 0.04642486572265625, 0.0521392822265625, 0.05785369873046875, 0.063568115234375, 0.06928253173828125, 0.0749969482421875, 0.08071136474609375, 0.08642578125, 0.09214019775390625, 0.0978546142578125, 0.10356903076171875, 0.109283447265625, 0.11499786376953125, 0.1207122802734375, 0.12642669677734375, 0.13214111328125, 0.13785552978515625, 0.1435699462890625, 0.14928436279296875, 0.154998779296875, 0.16071319580078125, 0.1664276123046875, 0.17214202880859375, 0.1778564453125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 11.0, 11.0, 22.0, 29.0, 29.0, 74.0, 78.0, 102.0, 120.0, 125.0, 107.0, 87.0, 67.0, 45.0, 33.0, 26.0, 9.0, 16.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5914758443832397, -1.517104148864746, -1.442732334136963, -1.3683606386184692, -1.2939889430999756, -1.2196171283721924, -1.1452454328536987, -1.070873737335205, -0.9965019822120667, -0.9221302270889282, -0.8477585315704346, -0.7733867764472961, -0.6990150213241577, -0.6246433258056641, -0.5502715706825256, -0.475899875164032, -0.40152812004089355, -0.3271563947200775, -0.2527846693992615, -0.17841291427612305, -0.104041188955307, -0.029669463634490967, 0.04470229148864746, 0.11907398700714111, 0.19344574213027954, 0.2678174674510956, 0.3421891927719116, 0.41656094789505005, 0.4909326732158661, 0.5653043985366821, 0.6396761536598206, 0.7140478491783142, 0.7884194850921631, 0.8627912402153015, 0.9371629357337952, 1.0115346908569336, 1.0859063863754272, 1.160278081893921, 1.234649896621704, 1.3090215921401978, 1.3833932876586914, 1.457764983177185, 1.5321367979049683, 1.606508493423462, 1.6808801889419556, 1.7552518844604492, 1.8296236991882324, 1.903995394706726, 1.9783672094345093, 2.052738904953003, 2.127110719680786, 2.2014822959899902, 2.2758541107177734, 2.3502259254455566, 2.42459774017334, 2.498969316482544, 2.573341131210327, 2.6477129459381104, 2.7220845222473145, 2.7964563369750977, 2.870828151702881, 2.945199728012085, 3.019571542739868, 3.0939431190490723, 3.1683149337768555]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 7.0, 2.0, 2.0, 4.0, 10.0, 7.0, 5.0, 15.0, 11.0, 18.0, 15.0, 27.0, 30.0, 30.0, 30.0, 30.0, 30.0, 33.0, 33.0, 40.0, 46.0, 40.0, 39.0, 42.0, 33.0, 39.0, 48.0, 37.0, 37.0, 36.0, 30.0, 31.0, 29.0, 28.0, 14.0, 18.0, 17.0, 18.0, 19.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5477862358093262, -1.5011661052703857, -1.4545459747314453, -1.4079258441925049, -1.361305832862854, -1.3146857023239136, -1.2680655717849731, -1.2214454412460327, -1.1748254299163818, -1.1282052993774414, -1.081585168838501, -1.0349650382995605, -0.9883450269699097, -0.9417248964309692, -0.8951047658920288, -0.8484846353530884, -0.801864504814148, -0.7552443742752075, -0.7086243033409119, -0.6620041728019714, -0.6153841018676758, -0.5687639713287354, -0.5221438407897949, -0.4755237400531769, -0.42890363931655884, -0.3822835385799408, -0.33566343784332275, -0.2890433073043823, -0.24242320656776428, -0.19580310583114624, -0.1491829752922058, -0.10256287455558777, -0.05594289302825928, -0.009322784841060638, 0.037297323346138, 0.08391743898391724, 0.13053753972053528, 0.17715764045715332, 0.22377777099609375, 0.2703978717327118, 0.31701797246932983, 0.3636380732059479, 0.4102581739425659, 0.45687830448150635, 0.5034984350204468, 0.5501185059547424, 0.5967386364936829, 0.6433587074279785, 0.689978837966919, 0.7365989685058594, 0.783219039440155, 0.8298391699790955, 0.8764592409133911, 0.9230793714523315, 0.969699501991272, 1.0163196325302124, 1.0629396438598633, 1.1095597743988037, 1.1561799049377441, 1.2028000354766846, 1.2494200468063354, 1.2960401773452759, 1.3426603078842163, 1.3892804384231567, 1.4359005689620972]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 8.0, 5.0, 11.0, 21.0, 23.0, 27.0, 50.0, 71.0, 120.0, 189.0, 296.0, 476.0, 798.0, 1389.0, 2221.0, 4104.0, 7431.0, 13439.0, 26063.0, 52191.0, 112308.0, 284336.0, 1165929.0, 1848822.0, 398302.0, 142822.0, 64174.0, 31483.0, 16368.0, 8935.0, 4931.0, 2848.0, 1594.0, 1015.0, 576.0, 304.0, 221.0, 142.0, 89.0, 59.0, 27.0, 23.0, 15.0, 15.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.23386383056640625, -0.2245635986328125, -0.21526336669921875, -0.205963134765625, -0.19666290283203125, -0.1873626708984375, -0.17806243896484375, -0.16876220703125, -0.15946197509765625, -0.1501617431640625, -0.14086151123046875, -0.131561279296875, -0.12226104736328125, -0.1129608154296875, -0.10366058349609375, -0.0943603515625, -0.08506011962890625, -0.0757598876953125, -0.06645965576171875, -0.057159423828125, -0.04785919189453125, -0.0385589599609375, -0.02925872802734375, -0.01995849609375, -0.01065826416015625, -0.0013580322265625, 0.00794219970703125, 0.017242431640625, 0.02654266357421875, 0.0358428955078125, 0.04514312744140625, 0.054443359375, 0.06374359130859375, 0.0730438232421875, 0.08234405517578125, 0.091644287109375, 0.10094451904296875, 0.1102447509765625, 0.11954498291015625, 0.12884521484375, 0.13814544677734375, 0.1474456787109375, 0.15674591064453125, 0.166046142578125, 0.17534637451171875, 0.1846466064453125, 0.19394683837890625, 0.2032470703125, 0.21254730224609375, 0.2218475341796875, 0.23114776611328125, 0.240447998046875, 0.24974822998046875, 0.2590484619140625, 0.26834869384765625, 0.27764892578125, 0.28694915771484375, 0.2962493896484375, 0.30554962158203125, 0.314849853515625, 0.32415008544921875, 0.3334503173828125, 0.34275054931640625, 0.35205078125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 7.0, 4.0, 15.0, 5.0, 15.0, 15.0, 10.0, 8.0, 8.0, 19.0, 23.0, 28.0, 25.0, 30.0, 25.0, 46.0, 45.0, 42.0, 36.0, 42.0, 37.0, 38.0, 49.0, 26.0, 26.0, 39.0, 40.0, 29.0, 38.0, 34.0, 36.0, 18.0, 23.0, 20.0, 17.0, 23.0, 13.0, 14.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.16259765625, -0.15688133239746094, -0.15116500854492188, -0.1454486846923828, -0.13973236083984375, -0.1340160369873047, -0.12829971313476562, -0.12258338928222656, -0.1168670654296875, -0.11115074157714844, -0.10543441772460938, -0.09971809387207031, -0.09400177001953125, -0.08828544616699219, -0.08256912231445312, -0.07685279846191406, -0.071136474609375, -0.06542015075683594, -0.059703826904296875, -0.05398750305175781, -0.04827117919921875, -0.04255485534667969, -0.036838531494140625, -0.031122207641601562, -0.0254058837890625, -0.019689559936523438, -0.013973236083984375, -0.008256912231445312, -0.00254058837890625, 0.0031757354736328125, 0.008892059326171875, 0.014608383178710938, 0.02032470703125, 0.026041030883789062, 0.031757354736328125, 0.03747367858886719, 0.04319000244140625, 0.04890632629394531, 0.054622650146484375, 0.06033897399902344, 0.0660552978515625, 0.07177162170410156, 0.07748794555664062, 0.08320426940917969, 0.08892059326171875, 0.09463691711425781, 0.10035324096679688, 0.10606956481933594, 0.111785888671875, 0.11750221252441406, 0.12321853637695312, 0.1289348602294922, 0.13465118408203125, 0.1403675079345703, 0.14608383178710938, 0.15180015563964844, 0.1575164794921875, 0.16323280334472656, 0.16894912719726562, 0.1746654510498047, 0.18038177490234375, 0.1860980987548828, 0.19181442260742188, 0.19753074645996094, 0.2032470703125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 11.0, 17.0, 21.0, 22.0, 49.0, 71.0, 134.0, 206.0, 377.0, 522.0, 921.0, 1622.0, 2781.0, 4959.0, 9256.0, 17475.0, 34203.0, 69954.0, 150748.0, 368608.0, 1351184.0, 1479493.0, 393931.0, 159926.0, 72549.0, 35599.0, 18001.0, 9597.0, 5184.0, 2900.0, 1613.0, 949.0, 565.0, 335.0, 179.0, 117.0, 67.0, 50.0, 45.0, 10.0, 11.0, 10.0, 6.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.3676719665527344, -0.35619354248046875, -0.3447151184082031, -0.3332366943359375, -0.3217582702636719, -0.31027984619140625, -0.2988014221191406, -0.287322998046875, -0.2758445739746094, -0.26436614990234375, -0.2528877258300781, -0.2414093017578125, -0.22993087768554688, -0.21845245361328125, -0.20697402954101562, -0.19549560546875, -0.18401718139648438, -0.17253875732421875, -0.16106033325195312, -0.1495819091796875, -0.13810348510742188, -0.12662506103515625, -0.11514663696289062, -0.103668212890625, -0.09218978881835938, -0.08071136474609375, -0.06923294067382812, -0.0577545166015625, -0.046276092529296875, -0.03479766845703125, -0.023319244384765625, -0.0118408203125, -0.000362396240234375, 0.01111602783203125, 0.022594451904296875, 0.0340728759765625, 0.045551300048828125, 0.05702972412109375, 0.06850814819335938, 0.079986572265625, 0.09146499633789062, 0.10294342041015625, 0.11442184448242188, 0.1259002685546875, 0.13737869262695312, 0.14885711669921875, 0.16033554077148438, 0.17181396484375, 0.18329238891601562, 0.19477081298828125, 0.20624923706054688, 0.2177276611328125, 0.22920608520507812, 0.24068450927734375, 0.2521629333496094, 0.263641357421875, 0.2751197814941406, 0.28659820556640625, 0.2980766296386719, 0.3095550537109375, 0.3210334777832031, 0.33251190185546875, 0.3439903259277344, 0.35546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 6.0, 3.0, 10.0, 19.0, 19.0, 24.0, 32.0, 32.0, 43.0, 58.0, 94.0, 114.0, 190.0, 228.0, 379.0, 683.0, 757.0, 458.0, 283.0, 164.0, 138.0, 101.0, 62.0, 42.0, 29.0, 22.0, 25.0, 24.0, 13.0, 9.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416015625, -0.40006256103515625, -0.3841094970703125, -0.36815643310546875, -0.352203369140625, -0.33625030517578125, -0.3202972412109375, -0.30434417724609375, -0.28839111328125, -0.27243804931640625, -0.2564849853515625, -0.24053192138671875, -0.224578857421875, -0.20862579345703125, -0.1926727294921875, -0.17671966552734375, -0.1607666015625, -0.14481353759765625, -0.1288604736328125, -0.11290740966796875, -0.096954345703125, -0.08100128173828125, -0.0650482177734375, -0.04909515380859375, -0.03314208984375, -0.01718902587890625, -0.0012359619140625, 0.01471710205078125, 0.030670166015625, 0.04662322998046875, 0.0625762939453125, 0.07852935791015625, 0.094482421875, 0.11043548583984375, 0.1263885498046875, 0.14234161376953125, 0.158294677734375, 0.17424774169921875, 0.1902008056640625, 0.20615386962890625, 0.22210693359375, 0.23805999755859375, 0.2540130615234375, 0.26996612548828125, 0.285919189453125, 0.30187225341796875, 0.3178253173828125, 0.33377838134765625, 0.3497314453125, 0.36568450927734375, 0.3816375732421875, 0.39759063720703125, 0.413543701171875, 0.42949676513671875, 0.4454498291015625, 0.46140289306640625, 0.47735595703125, 0.49330902099609375, 0.5092620849609375, 0.5252151489257812, 0.541168212890625, 0.5571212768554688, 0.5730743408203125, 0.5890274047851562, 0.60498046875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 15.0, 17.0, 43.0, 45.0, 75.0, 100.0, 126.0, 139.0, 112.0, 119.0, 68.0, 56.0, 37.0, 27.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9155347347259521, -1.808927297592163, -1.702319860458374, -1.595712423324585, -1.489104986190796, -1.3824975490570068, -1.2758902311325073, -1.1692827939987183, -1.0626753568649292, -0.9560679197311401, -0.8494604825973511, -0.7428531050682068, -0.6362456679344177, -0.5296382308006287, -0.4230308532714844, -0.3164234161376953, -0.20981597900390625, -0.10320855677127838, 0.0033988654613494873, 0.11000627279281616, 0.21661370992660522, 0.3232211470603943, 0.4298285245895386, 0.5364359617233276, 0.6430433988571167, 0.7496508359909058, 0.8562582731246948, 0.9628656506538391, 1.0694730281829834, 1.1760804653167725, 1.2826879024505615, 1.3892953395843506, 1.4959025382995605, 1.6025099754333496, 1.7091174125671387, 1.8157248497009277, 1.9223322868347168, 2.028939723968506, 2.135547161102295, 2.242154598236084, 2.348762035369873, 2.455369472503662, 2.561976909637451, 2.6685843467712402, 2.7751917839050293, 2.8817992210388184, 2.9884066581726074, 3.0950140953063965, 3.2016212940216064, 3.3082287311553955, 3.4148361682891846, 3.5214436054229736, 3.6280510425567627, 3.7346584796905518, 3.8412656784057617, 3.947873115539551, 4.05448055267334, 4.161087989807129, 4.267695426940918, 4.374302864074707, 4.480910301208496, 4.587517738342285, 4.694125175476074, 4.800732612609863, 4.907340049743652]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 11.0, 3.0, 9.0, 7.0, 11.0, 20.0, 20.0, 21.0, 27.0, 35.0, 24.0, 24.0, 37.0, 40.0, 39.0, 50.0, 48.0, 37.0, 45.0, 44.0, 52.0, 49.0, 50.0, 21.0, 33.0, 28.0, 27.0, 35.0, 23.0, 19.0, 22.0, 14.0, 12.0, 6.0, 9.0, 10.0, 4.0, 7.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.650313377380371, -1.6048355102539062, -1.5593576431274414, -1.5138797760009766, -1.4684019088745117, -1.4229241609573364, -1.3774462938308716, -1.3319684267044067, -1.286490559577942, -1.241012692451477, -1.1955348253250122, -1.1500569581985474, -1.104579210281372, -1.0591013431549072, -1.0136234760284424, -0.9681456089019775, -0.9226677417755127, -0.8771898746490479, -0.831712007522583, -0.7862342000007629, -0.7407563328742981, -0.6952784657478333, -0.6498006582260132, -0.6043227910995483, -0.5588449239730835, -0.5133670568466187, -0.4678892195224762, -0.42241138219833374, -0.3769335150718689, -0.33145564794540405, -0.2859778106212616, -0.24049997329711914, -0.19502222537994385, -0.1495443731546402, -0.10406652092933655, -0.0585886687040329, -0.013110816478729248, 0.0323670357465744, 0.07784488797187805, 0.12332272529602051, 0.16880059242248535, 0.214278444647789, 0.25975629687309265, 0.3052341341972351, 0.35071200132369995, 0.3961898684501648, 0.44166770577430725, 0.4871455430984497, 0.5326234102249146, 0.5781012773513794, 0.6235791444778442, 0.6690569519996643, 0.7145348191261292, 0.760012686252594, 0.8054904937744141, 0.8509683609008789, 0.8964462280273438, 0.9419240951538086, 0.9874019622802734, 1.0328798294067383, 1.0783576965332031, 1.1238354444503784, 1.1693133115768433, 1.214791178703308, 1.260269045829773]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 10.0, 4.0, 5.0, 19.0, 32.0, 39.0, 56.0, 117.0, 137.0, 219.0, 352.0, 550.0, 852.0, 1275.0, 2068.0, 3244.0, 5019.0, 8698.0, 14597.0, 26270.0, 53375.0, 117249.0, 235056.0, 272600.0, 156582.0, 71105.0, 33901.0, 18064.0, 10396.0, 6055.0, 3887.0, 2373.0, 1589.0, 961.0, 639.0, 407.0, 261.0, 184.0, 116.0, 63.0, 40.0, 24.0, 22.0, 18.0, 9.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.334716796875, -0.3246307373046875, -0.314544677734375, -0.3044586181640625, -0.29437255859375, -0.2842864990234375, -0.274200439453125, -0.2641143798828125, -0.2540283203125, -0.2439422607421875, -0.233856201171875, -0.2237701416015625, -0.21368408203125, -0.2035980224609375, -0.193511962890625, -0.1834259033203125, -0.17333984375, -0.1632537841796875, -0.153167724609375, -0.1430816650390625, -0.13299560546875, -0.1229095458984375, -0.112823486328125, -0.1027374267578125, -0.0926513671875, -0.0825653076171875, -0.072479248046875, -0.0623931884765625, -0.05230712890625, -0.0422210693359375, -0.032135009765625, -0.0220489501953125, -0.011962890625, -0.0018768310546875, 0.008209228515625, 0.0182952880859375, 0.02838134765625, 0.0384674072265625, 0.048553466796875, 0.0586395263671875, 0.0687255859375, 0.0788116455078125, 0.088897705078125, 0.0989837646484375, 0.10906982421875, 0.1191558837890625, 0.129241943359375, 0.1393280029296875, 0.1494140625, 0.1595001220703125, 0.169586181640625, 0.1796722412109375, 0.18975830078125, 0.1998443603515625, 0.209930419921875, 0.2200164794921875, 0.2301025390625, 0.2401885986328125, 0.250274658203125, 0.2603607177734375, 0.27044677734375, 0.2805328369140625, 0.290618896484375, 0.3007049560546875, 0.310791015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 5.0, 6.0, 2.0, 11.0, 14.0, 13.0, 12.0, 18.0, 20.0, 16.0, 23.0, 32.0, 31.0, 37.0, 28.0, 38.0, 39.0, 41.0, 42.0, 41.0, 50.0, 40.0, 42.0, 40.0, 54.0, 41.0, 25.0, 31.0, 36.0, 25.0, 27.0, 28.0, 15.0, 15.0, 12.0, 9.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.2099609375, -0.20343589782714844, -0.19691085815429688, -0.1903858184814453, -0.18386077880859375, -0.1773357391357422, -0.17081069946289062, -0.16428565979003906, -0.1577606201171875, -0.15123558044433594, -0.14471054077148438, -0.1381855010986328, -0.13166046142578125, -0.1251354217529297, -0.11861038208007812, -0.11208534240722656, -0.105560302734375, -0.09903526306152344, -0.09251022338867188, -0.08598518371582031, -0.07946014404296875, -0.07293510437011719, -0.06641006469726562, -0.05988502502441406, -0.0533599853515625, -0.04683494567871094, -0.040309906005859375, -0.03378486633300781, -0.02725982666015625, -0.020734786987304688, -0.014209747314453125, -0.0076847076416015625, -0.00115966796875, 0.0053653717041015625, 0.011890411376953125, 0.018415451049804688, 0.02494049072265625, 0.03146553039550781, 0.037990570068359375, 0.04451560974121094, 0.0510406494140625, 0.05756568908691406, 0.06409072875976562, 0.07061576843261719, 0.07714080810546875, 0.08366584777832031, 0.09019088745117188, 0.09671592712402344, 0.103240966796875, 0.10976600646972656, 0.11629104614257812, 0.12281608581542969, 0.12934112548828125, 0.1358661651611328, 0.14239120483398438, 0.14891624450683594, 0.1554412841796875, 0.16196632385253906, 0.16849136352539062, 0.1750164031982422, 0.18154144287109375, 0.1880664825439453, 0.19459152221679688, 0.20111656188964844, 0.2076416015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 14.0, 28.0, 30.0, 60.0, 105.0, 167.0, 402.0, 879.0, 2149.0, 5420.0, 13867.0, 39467.0, 137298.0, 435619.0, 295228.0, 77170.0, 24939.0, 9244.0, 3672.0, 1508.0, 616.0, 290.0, 121.0, 88.0, 53.0, 40.0, 19.0, 13.0, 13.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6494140625, -0.6317596435546875, -0.614105224609375, -0.5964508056640625, -0.57879638671875, -0.5611419677734375, -0.543487548828125, -0.5258331298828125, -0.5081787109375, -0.4905242919921875, -0.472869873046875, -0.4552154541015625, -0.43756103515625, -0.4199066162109375, -0.402252197265625, -0.3845977783203125, -0.366943359375, -0.3492889404296875, -0.331634521484375, -0.3139801025390625, -0.29632568359375, -0.2786712646484375, -0.261016845703125, -0.2433624267578125, -0.2257080078125, -0.2080535888671875, -0.190399169921875, -0.1727447509765625, -0.15509033203125, -0.1374359130859375, -0.119781494140625, -0.1021270751953125, -0.08447265625, -0.0668182373046875, -0.049163818359375, -0.0315093994140625, -0.01385498046875, 0.0037994384765625, 0.021453857421875, 0.0391082763671875, 0.0567626953125, 0.0744171142578125, 0.092071533203125, 0.1097259521484375, 0.12738037109375, 0.1450347900390625, 0.162689208984375, 0.1803436279296875, 0.197998046875, 0.2156524658203125, 0.233306884765625, 0.2509613037109375, 0.26861572265625, 0.2862701416015625, 0.303924560546875, 0.3215789794921875, 0.3392333984375, 0.3568878173828125, 0.374542236328125, 0.3921966552734375, 0.40985107421875, 0.4275054931640625, 0.445159912109375, 0.4628143310546875, 0.48046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 9.0, 9.0, 5.0, 9.0, 13.0, 16.0, 19.0, 16.0, 26.0, 23.0, 25.0, 37.0, 35.0, 46.0, 40.0, 38.0, 44.0, 46.0, 52.0, 41.0, 43.0, 48.0, 37.0, 40.0, 34.0, 41.0, 39.0, 26.0, 24.0, 22.0, 15.0, 14.0, 18.0, 10.0, 8.0, 8.0, 10.0, 5.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.67822265625, -0.6588134765625, -0.639404296875, -0.6199951171875, -0.6005859375, -0.5811767578125, -0.561767578125, -0.5423583984375, -0.52294921875, -0.5035400390625, -0.484130859375, -0.4647216796875, -0.4453125, -0.4259033203125, -0.406494140625, -0.3870849609375, -0.36767578125, -0.3482666015625, -0.328857421875, -0.3094482421875, -0.2900390625, -0.2706298828125, -0.251220703125, -0.2318115234375, -0.21240234375, -0.1929931640625, -0.173583984375, -0.1541748046875, -0.134765625, -0.1153564453125, -0.095947265625, -0.0765380859375, -0.05712890625, -0.0377197265625, -0.018310546875, 0.0010986328125, 0.0205078125, 0.0399169921875, 0.059326171875, 0.0787353515625, 0.09814453125, 0.1175537109375, 0.136962890625, 0.1563720703125, 0.17578125, 0.1951904296875, 0.214599609375, 0.2340087890625, 0.25341796875, 0.2728271484375, 0.292236328125, 0.3116455078125, 0.3310546875, 0.3504638671875, 0.369873046875, 0.3892822265625, 0.40869140625, 0.4281005859375, 0.447509765625, 0.4669189453125, 0.486328125, 0.5057373046875, 0.525146484375, 0.5445556640625, 0.56396484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 15.0, 21.0, 35.0, 48.0, 70.0, 119.0, 169.0, 306.0, 506.0, 971.0, 1844.0, 3608.0, 7151.0, 15089.0, 32620.0, 71192.0, 164916.0, 310309.0, 240949.0, 108055.0, 47624.0, 22055.0, 10332.0, 5025.0, 2486.0, 1335.0, 665.0, 372.0, 223.0, 140.0, 109.0, 52.0, 36.0, 36.0, 15.0, 12.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.17333984375, -0.16820335388183594, -0.16306686401367188, -0.1579303741455078, -0.15279388427734375, -0.1476573944091797, -0.14252090454101562, -0.13738441467285156, -0.1322479248046875, -0.12711143493652344, -0.12197494506835938, -0.11683845520019531, -0.11170196533203125, -0.10656547546386719, -0.10142898559570312, -0.09629249572753906, -0.091156005859375, -0.08601951599121094, -0.08088302612304688, -0.07574653625488281, -0.07061004638671875, -0.06547355651855469, -0.060337066650390625, -0.05520057678222656, -0.0500640869140625, -0.04492759704589844, -0.039791107177734375, -0.03465461730957031, -0.02951812744140625, -0.024381637573242188, -0.019245147705078125, -0.014108657836914062, -0.00897216796875, -0.0038356781005859375, 0.001300811767578125, 0.0064373016357421875, 0.01157379150390625, 0.016710281372070312, 0.021846771240234375, 0.026983261108398438, 0.0321197509765625, 0.03725624084472656, 0.042392730712890625, 0.04752922058105469, 0.05266571044921875, 0.05780220031738281, 0.06293869018554688, 0.06807518005371094, 0.073211669921875, 0.07834815979003906, 0.08348464965820312, 0.08862113952636719, 0.09375762939453125, 0.09889411926269531, 0.10403060913085938, 0.10916709899902344, 0.1143035888671875, 0.11944007873535156, 0.12457656860351562, 0.1297130584716797, 0.13484954833984375, 0.1399860382080078, 0.14512252807617188, 0.15025901794433594, 0.1553955078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 7.0, 8.0, 12.0, 13.0, 12.0, 26.0, 24.0, 68.0, 76.0, 109.0, 140.0, 146.0, 121.0, 58.0, 40.0, 34.0, 34.0, 13.0, 8.0, 8.0, 4.0, 3.0, 11.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7637691497802734e-05, -5.577504634857178e-05, -5.391240119934082e-05, -5.204975605010986e-05, -5.0187110900878906e-05, -4.832446575164795e-05, -4.646182060241699e-05, -4.4599175453186035e-05, -4.273653030395508e-05, -4.087388515472412e-05, -3.9011240005493164e-05, -3.714859485626221e-05, -3.528594970703125e-05, -3.342330455780029e-05, -3.1560659408569336e-05, -2.969801425933838e-05, -2.7835369110107422e-05, -2.5972723960876465e-05, -2.4110078811645508e-05, -2.224743366241455e-05, -2.0384788513183594e-05, -1.8522143363952637e-05, -1.665949821472168e-05, -1.4796853065490723e-05, -1.2934207916259766e-05, -1.1071562767028809e-05, -9.208917617797852e-06, -7.3462724685668945e-06, -5.4836273193359375e-06, -3.6209821701049805e-06, -1.7583370208740234e-06, 1.043081283569336e-07, 1.9669532775878906e-06, 3.829598426818848e-06, 5.692243576049805e-06, 7.554888725280762e-06, 9.417533874511719e-06, 1.1280179023742676e-05, 1.3142824172973633e-05, 1.500546932220459e-05, 1.6868114471435547e-05, 1.8730759620666504e-05, 2.059340476989746e-05, 2.2456049919128418e-05, 2.4318695068359375e-05, 2.6181340217590332e-05, 2.804398536682129e-05, 2.9906630516052246e-05, 3.17692756652832e-05, 3.363192081451416e-05, 3.549456596374512e-05, 3.7357211112976074e-05, 3.921985626220703e-05, 4.108250141143799e-05, 4.2945146560668945e-05, 4.48077917098999e-05, 4.667043685913086e-05, 4.8533082008361816e-05, 5.0395727157592773e-05, 5.225837230682373e-05, 5.412101745605469e-05, 5.5983662605285645e-05, 5.78463077545166e-05, 5.970895290374756e-05, 6.157159805297852e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 5.0, 9.0, 16.0, 24.0, 45.0, 71.0, 106.0, 164.0, 321.0, 602.0, 1084.0, 2124.0, 4580.0, 10466.0, 26325.0, 69021.0, 188991.0, 360267.0, 237548.0, 89252.0, 33358.0, 13131.0, 5726.0, 2605.0, 1170.0, 640.0, 367.0, 193.0, 135.0, 79.0, 43.0, 30.0, 21.0, 12.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.1690654754638672, -0.16271591186523438, -0.15636634826660156, -0.15001678466796875, -0.14366722106933594, -0.13731765747070312, -0.1309680938720703, -0.1246185302734375, -0.11826896667480469, -0.11191940307617188, -0.10556983947753906, -0.09922027587890625, -0.09287071228027344, -0.08652114868164062, -0.08017158508300781, -0.073822021484375, -0.06747245788574219, -0.061122894287109375, -0.05477333068847656, -0.04842376708984375, -0.04207420349121094, -0.035724639892578125, -0.029375076293945312, -0.0230255126953125, -0.016675949096679688, -0.010326385498046875, -0.0039768218994140625, 0.00237274169921875, 0.008722305297851562, 0.015071868896484375, 0.021421432495117188, 0.02777099609375, 0.03412055969238281, 0.040470123291015625, 0.04681968688964844, 0.05316925048828125, 0.05951881408691406, 0.06586837768554688, 0.07221794128417969, 0.0785675048828125, 0.08491706848144531, 0.09126663208007812, 0.09761619567871094, 0.10396575927734375, 0.11031532287597656, 0.11666488647460938, 0.12301445007324219, 0.129364013671875, 0.1357135772705078, 0.14206314086914062, 0.14841270446777344, 0.15476226806640625, 0.16111183166503906, 0.16746139526367188, 0.1738109588623047, 0.1801605224609375, 0.1865100860595703, 0.19285964965820312, 0.19920921325683594, 0.20555877685546875, 0.21190834045410156, 0.21825790405273438, 0.2246074676513672, 0.23095703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 14.0, 11.0, 21.0, 23.0, 31.0, 40.0, 52.0, 48.0, 70.0, 96.0, 100.0, 74.0, 79.0, 59.0, 38.0, 55.0, 36.0, 33.0, 26.0, 13.0, 16.0, 17.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2095947265625, -0.20334815979003906, -0.19710159301757812, -0.1908550262451172, -0.18460845947265625, -0.1783618927001953, -0.17211532592773438, -0.16586875915527344, -0.1596221923828125, -0.15337562561035156, -0.14712905883789062, -0.1408824920654297, -0.13463592529296875, -0.1283893585205078, -0.12214279174804688, -0.11589622497558594, -0.109649658203125, -0.10340309143066406, -0.09715652465820312, -0.09090995788574219, -0.08466339111328125, -0.07841682434082031, -0.07217025756835938, -0.06592369079589844, -0.0596771240234375, -0.05343055725097656, -0.047183990478515625, -0.04093742370605469, -0.03469085693359375, -0.028444290161132812, -0.022197723388671875, -0.015951156616210938, -0.00970458984375, -0.0034580230712890625, 0.002788543701171875, 0.009035110473632812, 0.01528167724609375, 0.021528244018554688, 0.027774810791015625, 0.03402137756347656, 0.0402679443359375, 0.04651451110839844, 0.052761077880859375, 0.05900764465332031, 0.06525421142578125, 0.07150077819824219, 0.07774734497070312, 0.08399391174316406, 0.090240478515625, 0.09648704528808594, 0.10273361206054688, 0.10898017883300781, 0.11522674560546875, 0.12147331237792969, 0.12771987915039062, 0.13396644592285156, 0.1402130126953125, 0.14645957946777344, 0.15270614624023438, 0.1589527130126953, 0.16519927978515625, 0.1714458465576172, 0.17769241333007812, 0.18393898010253906, 0.190185546875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 11.0, 21.0, 31.0, 43.0, 71.0, 102.0, 134.0, 145.0, 135.0, 113.0, 85.0, 47.0, 20.0, 23.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9292144775390625, -2.8419816493988037, -2.754748821258545, -2.667515993118286, -2.5802831649780273, -2.4930505752563477, -2.405817747116089, -2.31858491897583, -2.2313520908355713, -2.1441192626953125, -2.0568864345550537, -1.9696537256240845, -1.8824208974838257, -1.795188069343567, -1.7079553604125977, -1.6207225322723389, -1.53348970413208, -1.4462568759918213, -1.3590240478515625, -1.2717913389205933, -1.1845585107803345, -1.0973256826400757, -1.0100929737091064, -0.9228601455688477, -0.8356273174285889, -0.7483944892883301, -0.6611617207527161, -0.573928952217102, -0.48669612407684326, -0.39946332573890686, -0.31223052740097046, -0.22499775886535645, -0.13776516914367676, -0.050532370805740356, 0.036700427532196045, 0.12393322587013245, 0.21116602420806885, 0.29839882254600525, 0.38563162088394165, 0.47286438941955566, 0.5600972175598145, 0.6473300457000732, 0.7345628142356873, 0.8217955827713013, 0.9090284109115601, 0.9962612390518188, 1.083493947982788, 1.1707267761230469, 1.2579596042633057, 1.3451924324035645, 1.4324252605438232, 1.5196579694747925, 1.6068907976150513, 1.69412362575531, 1.7813563346862793, 1.868589162826538, 1.9558219909667969, 2.0430548191070557, 2.1302876472473145, 2.2175204753875732, 2.304753303527832, 2.3919858932495117, 2.4792187213897705, 2.5664515495300293, 2.653684377670288]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 6.0, 5.0, 3.0, 12.0, 14.0, 10.0, 11.0, 15.0, 19.0, 26.0, 15.0, 24.0, 29.0, 21.0, 40.0, 37.0, 30.0, 35.0, 50.0, 44.0, 29.0, 33.0, 41.0, 39.0, 48.0, 50.0, 36.0, 33.0, 39.0, 33.0, 33.0, 17.0, 19.0, 18.0, 17.0, 8.0, 11.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4986697435379028, -1.4501937627792358, -1.4017176628112793, -1.3532416820526123, -1.3047655820846558, -1.2562896013259888, -1.2078135013580322, -1.1593375205993652, -1.1108615398406982, -1.0623855590820312, -1.0139094591140747, -0.9654334783554077, -0.9169573783874512, -0.8684813976287842, -0.8200053572654724, -0.7715293169021606, -0.7230532169342041, -0.6745771765708923, -0.6261011362075806, -0.5776251554489136, -0.529149055480957, -0.48067304491996765, -0.43219703435897827, -0.3837209939956665, -0.33524495363235474, -0.28676891326904297, -0.2382928878068924, -0.18981686234474182, -0.14134082198143005, -0.09286478161811829, -0.044388771057128906, 0.004087269306182861, 0.05256319046020508, 0.10103922337293625, 0.14951525628566742, 0.197991281747818, 0.24646732211112976, 0.29494336247444153, 0.3434193730354309, 0.3918954133987427, 0.44037145376205444, 0.4888474941253662, 0.537323534488678, 0.5857995748519897, 0.6342755556106567, 0.6827516555786133, 0.7312276363372803, 0.779703676700592, 0.8281797170639038, 0.8766557574272156, 0.9251317977905273, 0.9736077785491943, 1.0220838785171509, 1.0705598592758179, 1.1190359592437744, 1.1675119400024414, 1.2159879207611084, 1.2644639015197754, 1.312940001487732, 1.361415982246399, 1.4098920822143555, 1.4583680629730225, 1.5068440437316895, 1.555320143699646, 1.6037962436676025]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 7.0, 4.0, 13.0, 14.0, 37.0, 46.0, 86.0, 152.0, 280.0, 557.0, 1205.0, 2498.0, 5504.0, 13562.0, 34655.0, 98162.0, 333721.0, 1727240.0, 1531983.0, 299338.0, 90327.0, 32559.0, 12626.0, 5258.0, 2314.0, 1085.0, 499.0, 253.0, 144.0, 70.0, 43.0, 17.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302978515625, -0.2885246276855469, -0.27407073974609375, -0.2596168518066406, -0.2451629638671875, -0.23070907592773438, -0.21625518798828125, -0.20180130004882812, -0.187347412109375, -0.17289352416992188, -0.15843963623046875, -0.14398574829101562, -0.1295318603515625, -0.11507797241210938, -0.10062408447265625, -0.08617019653320312, -0.07171630859375, -0.057262420654296875, -0.04280853271484375, -0.028354644775390625, -0.0139007568359375, 0.000553131103515625, 0.01500701904296875, 0.029460906982421875, 0.043914794921875, 0.058368682861328125, 0.07282257080078125, 0.08727645874023438, 0.1017303466796875, 0.11618423461914062, 0.13063812255859375, 0.14509201049804688, 0.1595458984375, 0.17399978637695312, 0.18845367431640625, 0.20290756225585938, 0.2173614501953125, 0.23181533813476562, 0.24626922607421875, 0.2607231140136719, 0.275177001953125, 0.2896308898925781, 0.30408477783203125, 0.3185386657714844, 0.3329925537109375, 0.3474464416503906, 0.36190032958984375, 0.3763542175292969, 0.39080810546875, 0.4052619934082031, 0.41971588134765625, 0.4341697692871094, 0.4486236572265625, 0.4630775451660156, 0.47753143310546875, 0.4919853210449219, 0.506439208984375, 0.5208930969238281, 0.5353469848632812, 0.5498008728027344, 0.5642547607421875, 0.5787086486816406, 0.5931625366210938, 0.6076164245605469, 0.6220703125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 14.0, 6.0, 8.0, 19.0, 20.0, 23.0, 32.0, 22.0, 22.0, 29.0, 28.0, 38.0, 35.0, 45.0, 52.0, 41.0, 43.0, 40.0, 37.0, 43.0, 48.0, 36.0, 33.0, 33.0, 48.0, 28.0, 23.0, 16.0, 16.0, 21.0, 17.0, 12.0, 14.0, 12.0, 9.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2109375, -0.20439720153808594, -0.19785690307617188, -0.1913166046142578, -0.18477630615234375, -0.1782360076904297, -0.17169570922851562, -0.16515541076660156, -0.1586151123046875, -0.15207481384277344, -0.14553451538085938, -0.1389942169189453, -0.13245391845703125, -0.1259136199951172, -0.11937332153320312, -0.11283302307128906, -0.106292724609375, -0.09975242614746094, -0.09321212768554688, -0.08667182922363281, -0.08013153076171875, -0.07359123229980469, -0.06705093383789062, -0.06051063537597656, -0.0539703369140625, -0.04743003845214844, -0.040889739990234375, -0.03434944152832031, -0.02780914306640625, -0.021268844604492188, -0.014728546142578125, -0.008188247680664062, -0.00164794921875, 0.0048923492431640625, 0.011432647705078125, 0.017972946166992188, 0.02451324462890625, 0.031053543090820312, 0.037593841552734375, 0.04413414001464844, 0.0506744384765625, 0.05721473693847656, 0.06375503540039062, 0.07029533386230469, 0.07683563232421875, 0.08337593078613281, 0.08991622924804688, 0.09645652770996094, 0.102996826171875, 0.10953712463378906, 0.11607742309570312, 0.12261772155761719, 0.12915802001953125, 0.1356983184814453, 0.14223861694335938, 0.14877891540527344, 0.1553192138671875, 0.16185951232910156, 0.16839981079101562, 0.1749401092529297, 0.18148040771484375, 0.1880207061767578, 0.19456100463867188, 0.20110130310058594, 0.2076416015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 12.0, 18.0, 18.0, 29.0, 39.0, 70.0, 105.0, 180.0, 260.0, 390.0, 626.0, 971.0, 1671.0, 2777.0, 4819.0, 8580.0, 15861.0, 29616.0, 58013.0, 117262.0, 255245.0, 644477.0, 1653106.0, 817601.0, 303061.0, 137127.0, 66672.0, 34300.0, 17972.0, 9854.0, 5457.0, 3173.0, 1907.0, 1157.0, 678.0, 399.0, 277.0, 176.0, 114.0, 69.0, 50.0, 28.0, 23.0, 15.0, 10.0, 9.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.309326171875, -0.2998390197753906, -0.29035186767578125, -0.2808647155761719, -0.2713775634765625, -0.2618904113769531, -0.25240325927734375, -0.24291610717773438, -0.233428955078125, -0.22394180297851562, -0.21445465087890625, -0.20496749877929688, -0.1954803466796875, -0.18599319458007812, -0.17650604248046875, -0.16701889038085938, -0.15753173828125, -0.14804458618164062, -0.13855743408203125, -0.12907028198242188, -0.1195831298828125, -0.11009597778320312, -0.10060882568359375, -0.09112167358398438, -0.081634521484375, -0.07214736938476562, -0.06266021728515625, -0.053173065185546875, -0.0436859130859375, -0.034198760986328125, -0.02471160888671875, -0.015224456787109375, -0.0057373046875, 0.003749847412109375, 0.01323699951171875, 0.022724151611328125, 0.0322113037109375, 0.041698455810546875, 0.05118560791015625, 0.060672760009765625, 0.070159912109375, 0.07964706420898438, 0.08913421630859375, 0.09862136840820312, 0.1081085205078125, 0.11759567260742188, 0.12708282470703125, 0.13656997680664062, 0.14605712890625, 0.15554428100585938, 0.16503143310546875, 0.17451858520507812, 0.1840057373046875, 0.19349288940429688, 0.20298004150390625, 0.21246719360351562, 0.221954345703125, 0.23144149780273438, 0.24092864990234375, 0.2504158020019531, 0.2599029541015625, 0.2693901062011719, 0.27887725830078125, 0.2883644104003906, 0.2978515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 9.0, 4.0, 11.0, 16.0, 19.0, 14.0, 18.0, 30.0, 32.0, 44.0, 49.0, 77.0, 71.0, 124.0, 164.0, 199.0, 270.0, 383.0, 506.0, 513.0, 405.0, 242.0, 189.0, 171.0, 94.0, 106.0, 60.0, 56.0, 48.0, 24.0, 37.0, 17.0, 14.0, 11.0, 7.0, 8.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.413330078125, -0.4004058837890625, -0.387481689453125, -0.3745574951171875, -0.36163330078125, -0.3487091064453125, -0.335784912109375, -0.3228607177734375, -0.3099365234375, -0.2970123291015625, -0.284088134765625, -0.2711639404296875, -0.25823974609375, -0.2453155517578125, -0.232391357421875, -0.2194671630859375, -0.20654296875, -0.1936187744140625, -0.180694580078125, -0.1677703857421875, -0.15484619140625, -0.1419219970703125, -0.128997802734375, -0.1160736083984375, -0.1031494140625, -0.0902252197265625, -0.077301025390625, -0.0643768310546875, -0.05145263671875, -0.0385284423828125, -0.025604248046875, -0.0126800537109375, 0.000244140625, 0.0131683349609375, 0.026092529296875, 0.0390167236328125, 0.05194091796875, 0.0648651123046875, 0.077789306640625, 0.0907135009765625, 0.1036376953125, 0.1165618896484375, 0.129486083984375, 0.1424102783203125, 0.15533447265625, 0.1682586669921875, 0.181182861328125, 0.1941070556640625, 0.20703125, 0.2199554443359375, 0.232879638671875, 0.2458038330078125, 0.25872802734375, 0.2716522216796875, 0.284576416015625, 0.2975006103515625, 0.3104248046875, 0.3233489990234375, 0.336273193359375, 0.3491973876953125, 0.36212158203125, 0.3750457763671875, 0.387969970703125, 0.4008941650390625, 0.413818359375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 10.0, 19.0, 28.0, 45.0, 52.0, 71.0, 86.0, 104.0, 111.0, 108.0, 91.0, 86.0, 46.0, 41.0, 37.0, 19.0, 9.0, 13.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.197746515274048, -2.1109507083892822, -2.0241551399230957, -1.93735933303833, -1.8505635261535645, -1.7637677192687988, -1.6769720315933228, -1.5901763439178467, -1.503380537033081, -1.4165847301483154, -1.3297890424728394, -1.2429933547973633, -1.1561975479125977, -1.069401741027832, -0.982606053352356, -0.8958103060722351, -0.8090145587921143, -0.7222188115119934, -0.6354230642318726, -0.5486273169517517, -0.46183156967163086, -0.37503582239151, -0.28824007511138916, -0.2014443278312683, -0.11464858055114746, -0.02785283327102661, 0.05894291400909424, 0.1457386612892151, 0.23253440856933594, 0.3193301558494568, 0.40612590312957764, 0.4929216504096985, 0.5797173976898193, 0.6665131449699402, 0.753308892250061, 0.8401046395301819, 0.9269003868103027, 1.0136961936950684, 1.1004918813705444, 1.1872875690460205, 1.2740833759307861, 1.3608791828155518, 1.4476748704910278, 1.534470558166504, 1.6212663650512695, 1.7080621719360352, 1.7948578596115112, 1.8816535472869873, 1.968449354171753, 2.0552451610565186, 2.142040729522705, 2.2288365364074707, 2.3156323432922363, 2.402428150177002, 2.4892239570617676, 2.576019525527954, 2.6628153324127197, 2.7496111392974854, 2.836406707763672, 2.9232025146484375, 3.009998321533203, 3.0967941284179688, 3.1835899353027344, 3.270385503768921, 3.3571813106536865]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 5.0, 5.0, 11.0, 8.0, 11.0, 8.0, 13.0, 12.0, 23.0, 18.0, 18.0, 22.0, 23.0, 23.0, 38.0, 32.0, 45.0, 32.0, 36.0, 35.0, 48.0, 42.0, 39.0, 29.0, 45.0, 38.0, 30.0, 44.0, 31.0, 23.0, 30.0, 35.0, 32.0, 16.0, 10.0, 14.0, 16.0, 12.0, 8.0, 13.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4809997081756592, -1.435689091682434, -1.3903785943984985, -1.3450679779052734, -1.299757480621338, -1.2544468641281128, -1.2091363668441772, -1.1638257503509521, -1.1185152530670166, -1.0732046365737915, -1.027894139289856, -0.9825835824012756, -0.9372730255126953, -0.891962468624115, -0.8466519117355347, -0.8013412952423096, -0.7560307383537292, -0.7107201814651489, -0.6654096245765686, -0.6200990676879883, -0.574788510799408, -0.5294779539108276, -0.4841673672199249, -0.4388568103313446, -0.3935462534427643, -0.34823569655418396, -0.30292513966560364, -0.2576145529747009, -0.2123040109872818, -0.16699345409870148, -0.12168288230895996, -0.07637232542037964, -0.031061768531799316, 0.014248792082071304, 0.059559352695941925, 0.10486991703510284, 0.15018047392368317, 0.1954910308122635, 0.240801602602005, 0.2861121594905853, 0.33142271637916565, 0.37673327326774597, 0.4220438301563263, 0.467354416847229, 0.5126649737358093, 0.5579755306243896, 0.60328608751297, 0.6485966444015503, 0.6939072012901306, 0.7392177581787109, 0.7845283150672913, 0.8298388719558716, 0.8751494288444519, 0.9204599857330322, 0.9657706022262573, 1.0110810995101929, 1.056391716003418, 1.101702332496643, 1.1470128297805786, 1.1923234462738037, 1.2376339435577393, 1.2829445600509644, 1.3282550573349, 1.373565673828125, 1.4188761711120605]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 17.0, 16.0, 27.0, 35.0, 102.0, 126.0, 160.0, 256.0, 453.0, 599.0, 839.0, 1257.0, 1839.0, 2667.0, 3816.0, 5422.0, 8403.0, 13210.0, 22587.0, 44179.0, 105154.0, 257661.0, 306881.0, 143294.0, 57211.0, 27384.0, 15533.0, 9405.0, 6205.0, 4301.0, 3001.0, 2065.0, 1484.0, 967.0, 654.0, 496.0, 284.0, 195.0, 130.0, 77.0, 53.0, 46.0, 28.0, 9.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0], "bins": [-0.44775390625, -0.43537139892578125, -0.4229888916015625, -0.41060638427734375, -0.398223876953125, -0.38584136962890625, -0.3734588623046875, -0.36107635498046875, -0.34869384765625, -0.33631134033203125, -0.3239288330078125, -0.31154632568359375, -0.299163818359375, -0.28678131103515625, -0.2743988037109375, -0.26201629638671875, -0.2496337890625, -0.23725128173828125, -0.2248687744140625, -0.21248626708984375, -0.200103759765625, -0.18772125244140625, -0.1753387451171875, -0.16295623779296875, -0.15057373046875, -0.13819122314453125, -0.1258087158203125, -0.11342620849609375, -0.101043701171875, -0.08866119384765625, -0.0762786865234375, -0.06389617919921875, -0.051513671875, -0.03913116455078125, -0.0267486572265625, -0.01436614990234375, -0.001983642578125, 0.01039886474609375, 0.0227813720703125, 0.03516387939453125, 0.04754638671875, 0.05992889404296875, 0.0723114013671875, 0.08469390869140625, 0.097076416015625, 0.10945892333984375, 0.1218414306640625, 0.13422393798828125, 0.1466064453125, 0.15898895263671875, 0.1713714599609375, 0.18375396728515625, 0.196136474609375, 0.20851898193359375, 0.2209014892578125, 0.23328399658203125, 0.24566650390625, 0.25804901123046875, 0.2704315185546875, 0.28281402587890625, 0.295196533203125, 0.30757904052734375, 0.3199615478515625, 0.33234405517578125, 0.3447265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 12.0, 7.0, 8.0, 10.0, 8.0, 18.0, 18.0, 18.0, 22.0, 19.0, 24.0, 38.0, 35.0, 33.0, 38.0, 37.0, 35.0, 42.0, 35.0, 30.0, 39.0, 42.0, 40.0, 39.0, 49.0, 35.0, 37.0, 36.0, 28.0, 20.0, 26.0, 27.0, 18.0, 15.0, 17.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.204833984375, -0.19839096069335938, -0.19194793701171875, -0.18550491333007812, -0.1790618896484375, -0.17261886596679688, -0.16617584228515625, -0.15973281860351562, -0.153289794921875, -0.14684677124023438, -0.14040374755859375, -0.13396072387695312, -0.1275177001953125, -0.12107467651367188, -0.11463165283203125, -0.10818862915039062, -0.10174560546875, -0.09530258178710938, -0.08885955810546875, -0.08241653442382812, -0.0759735107421875, -0.06953048706054688, -0.06308746337890625, -0.056644439697265625, -0.050201416015625, -0.043758392333984375, -0.03731536865234375, -0.030872344970703125, -0.0244293212890625, -0.017986297607421875, -0.01154327392578125, -0.005100250244140625, 0.0013427734375, 0.007785797119140625, 0.01422882080078125, 0.020671844482421875, 0.0271148681640625, 0.033557891845703125, 0.04000091552734375, 0.046443939208984375, 0.052886962890625, 0.059329986572265625, 0.06577301025390625, 0.07221603393554688, 0.0786590576171875, 0.08510208129882812, 0.09154510498046875, 0.09798812866210938, 0.10443115234375, 0.11087417602539062, 0.11731719970703125, 0.12376022338867188, 0.1302032470703125, 0.13664627075195312, 0.14308929443359375, 0.14953231811523438, 0.155975341796875, 0.16241836547851562, 0.16886138916015625, 0.17530441284179688, 0.1817474365234375, 0.18819046020507812, 0.19463348388671875, 0.20107650756835938, 0.20751953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 12.0, 13.0, 17.0, 17.0, 38.0, 58.0, 81.0, 109.0, 182.0, 262.0, 545.0, 1092.0, 2226.0, 4922.0, 11396.0, 25914.0, 68499.0, 267720.0, 464745.0, 128306.0, 41023.0, 17099.0, 7417.0, 3465.0, 1575.0, 760.0, 390.0, 200.0, 141.0, 88.0, 64.0, 52.0, 27.0, 25.0, 14.0, 21.0, 7.0, 7.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.70654296875, -0.6865005493164062, -0.6664581298828125, -0.6464157104492188, -0.626373291015625, -0.6063308715820312, -0.5862884521484375, -0.5662460327148438, -0.54620361328125, -0.5261611938476562, -0.5061187744140625, -0.48607635498046875, -0.466033935546875, -0.44599151611328125, -0.4259490966796875, -0.40590667724609375, -0.3858642578125, -0.36582183837890625, -0.3457794189453125, -0.32573699951171875, -0.305694580078125, -0.28565216064453125, -0.2656097412109375, -0.24556732177734375, -0.22552490234375, -0.20548248291015625, -0.1854400634765625, -0.16539764404296875, -0.145355224609375, -0.12531280517578125, -0.1052703857421875, -0.08522796630859375, -0.065185546875, -0.04514312744140625, -0.0251007080078125, -0.00505828857421875, 0.014984130859375, 0.03502655029296875, 0.0550689697265625, 0.07511138916015625, 0.09515380859375, 0.11519622802734375, 0.1352386474609375, 0.15528106689453125, 0.175323486328125, 0.19536590576171875, 0.2154083251953125, 0.23545074462890625, 0.2554931640625, 0.27553558349609375, 0.2955780029296875, 0.31562042236328125, 0.335662841796875, 0.35570526123046875, 0.3757476806640625, 0.39579010009765625, 0.41583251953125, 0.43587493896484375, 0.4559173583984375, 0.47595977783203125, 0.496002197265625, 0.5160446166992188, 0.5360870361328125, 0.5561294555664062, 0.576171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 7.0, 6.0, 6.0, 9.0, 9.0, 12.0, 10.0, 17.0, 25.0, 35.0, 27.0, 40.0, 28.0, 32.0, 34.0, 31.0, 56.0, 42.0, 46.0, 32.0, 44.0, 42.0, 38.0, 42.0, 47.0, 28.0, 35.0, 34.0, 36.0, 16.0, 23.0, 16.0, 19.0, 12.0, 11.0, 9.0, 11.0, 4.0, 6.0, 5.0, 2.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57568359375, -0.5565032958984375, -0.537322998046875, -0.5181427001953125, -0.49896240234375, -0.4797821044921875, -0.460601806640625, -0.4414215087890625, -0.4222412109375, -0.4030609130859375, -0.383880615234375, -0.3647003173828125, -0.34552001953125, -0.3263397216796875, -0.307159423828125, -0.2879791259765625, -0.268798828125, -0.2496185302734375, -0.230438232421875, -0.2112579345703125, -0.19207763671875, -0.1728973388671875, -0.153717041015625, -0.1345367431640625, -0.1153564453125, -0.0961761474609375, -0.076995849609375, -0.0578155517578125, -0.03863525390625, -0.0194549560546875, -0.000274658203125, 0.0189056396484375, 0.0380859375, 0.0572662353515625, 0.076446533203125, 0.0956268310546875, 0.11480712890625, 0.1339874267578125, 0.153167724609375, 0.1723480224609375, 0.1915283203125, 0.2107086181640625, 0.229888916015625, 0.2490692138671875, 0.26824951171875, 0.2874298095703125, 0.306610107421875, 0.3257904052734375, 0.344970703125, 0.3641510009765625, 0.383331298828125, 0.4025115966796875, 0.42169189453125, 0.4408721923828125, 0.460052490234375, 0.4792327880859375, 0.4984130859375, 0.5175933837890625, 0.536773681640625, 0.5559539794921875, 0.57513427734375, 0.5943145751953125, 0.613494873046875, 0.6326751708984375, 0.65185546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 7.0, 7.0, 4.0, 16.0, 20.0, 29.0, 27.0, 45.0, 82.0, 121.0, 195.0, 310.0, 516.0, 858.0, 1359.0, 2040.0, 3258.0, 5313.0, 9259.0, 17039.0, 36104.0, 83861.0, 212199.0, 337122.0, 191449.0, 76356.0, 33076.0, 15713.0, 8600.0, 5079.0, 3124.0, 2031.0, 1239.0, 742.0, 506.0, 293.0, 187.0, 126.0, 87.0, 57.0, 29.0, 21.0, 13.0, 14.0, 3.0, 6.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.144775390625, -0.14017105102539062, -0.13556671142578125, -0.13096237182617188, -0.1263580322265625, -0.12175369262695312, -0.11714935302734375, -0.11254501342773438, -0.107940673828125, -0.10333633422851562, -0.09873199462890625, -0.09412765502929688, -0.0895233154296875, -0.08491897583007812, -0.08031463623046875, -0.07571029663085938, -0.07110595703125, -0.06650161743164062, -0.06189727783203125, -0.057292938232421875, -0.0526885986328125, -0.048084259033203125, -0.04347991943359375, -0.038875579833984375, -0.034271240234375, -0.029666900634765625, -0.02506256103515625, -0.020458221435546875, -0.0158538818359375, -0.011249542236328125, -0.00664520263671875, -0.002040863037109375, 0.0025634765625, 0.007167816162109375, 0.01177215576171875, 0.016376495361328125, 0.0209808349609375, 0.025585174560546875, 0.03018951416015625, 0.034793853759765625, 0.039398193359375, 0.044002532958984375, 0.04860687255859375, 0.053211212158203125, 0.0578155517578125, 0.062419891357421875, 0.06702423095703125, 0.07162857055664062, 0.07623291015625, 0.08083724975585938, 0.08544158935546875, 0.09004592895507812, 0.0946502685546875, 0.09925460815429688, 0.10385894775390625, 0.10846328735351562, 0.113067626953125, 0.11767196655273438, 0.12227630615234375, 0.12688064575195312, 0.1314849853515625, 0.13608932495117188, 0.14069366455078125, 0.14529800415039062, 0.14990234375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 10.0, 30.0, 21.0, 42.0, 70.0, 155.0, 250.0, 184.0, 83.0, 39.0, 31.0, 9.0, 11.0, 10.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.202957153320312e-05, -8.91275703907013e-05, -8.622556924819946e-05, -8.332356810569763e-05, -8.04215669631958e-05, -7.751956582069397e-05, -7.461756467819214e-05, -7.171556353569031e-05, -6.881356239318848e-05, -6.591156125068665e-05, -6.300956010818481e-05, -6.0107558965682983e-05, -5.720555782318115e-05, -5.430355668067932e-05, -5.140155553817749e-05, -4.849955439567566e-05, -4.559755325317383e-05, -4.2695552110672e-05, -3.9793550968170166e-05, -3.6891549825668335e-05, -3.3989548683166504e-05, -3.108754754066467e-05, -2.8185546398162842e-05, -2.528354525566101e-05, -2.238154411315918e-05, -1.947954297065735e-05, -1.6577541828155518e-05, -1.3675540685653687e-05, -1.0773539543151855e-05, -7.871538400650024e-06, -4.969537258148193e-06, -2.0675361156463623e-06, 8.344650268554688e-07, 3.7364661693573e-06, 6.638467311859131e-06, 9.540468454360962e-06, 1.2442469596862793e-05, 1.5344470739364624e-05, 1.8246471881866455e-05, 2.1148473024368286e-05, 2.4050474166870117e-05, 2.6952475309371948e-05, 2.985447645187378e-05, 3.275647759437561e-05, 3.565847873687744e-05, 3.856047987937927e-05, 4.1462481021881104e-05, 4.4364482164382935e-05, 4.7266483306884766e-05, 5.01684844493866e-05, 5.307048559188843e-05, 5.597248673439026e-05, 5.887448787689209e-05, 6.177648901939392e-05, 6.467849016189575e-05, 6.758049130439758e-05, 7.048249244689941e-05, 7.338449358940125e-05, 7.628649473190308e-05, 7.918849587440491e-05, 8.209049701690674e-05, 8.499249815940857e-05, 8.78944993019104e-05, 9.079650044441223e-05, 9.369850158691406e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 1.0, 5.0, 9.0, 10.0, 15.0, 10.0, 16.0, 23.0, 28.0, 45.0, 59.0, 73.0, 121.0, 222.0, 339.0, 531.0, 980.0, 1841.0, 3415.0, 6898.0, 13962.0, 31131.0, 75787.0, 187912.0, 323670.0, 230435.0, 97139.0, 39221.0, 17121.0, 8376.0, 4085.0, 2181.0, 1113.0, 680.0, 394.0, 243.0, 144.0, 90.0, 72.0, 40.0, 38.0, 22.0, 21.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1424560546875, -0.13780593872070312, -0.13315582275390625, -0.12850570678710938, -0.1238555908203125, -0.11920547485351562, -0.11455535888671875, -0.10990524291992188, -0.105255126953125, -0.10060501098632812, -0.09595489501953125, -0.09130477905273438, -0.0866546630859375, -0.08200454711914062, -0.07735443115234375, -0.07270431518554688, -0.06805419921875, -0.06340408325195312, -0.05875396728515625, -0.054103851318359375, -0.0494537353515625, -0.044803619384765625, -0.04015350341796875, -0.035503387451171875, -0.030853271484375, -0.026203155517578125, -0.02155303955078125, -0.016902923583984375, -0.0122528076171875, -0.007602691650390625, -0.00295257568359375, 0.001697540283203125, 0.00634765625, 0.010997772216796875, 0.01564788818359375, 0.020298004150390625, 0.0249481201171875, 0.029598236083984375, 0.03424835205078125, 0.038898468017578125, 0.043548583984375, 0.048198699951171875, 0.05284881591796875, 0.057498931884765625, 0.0621490478515625, 0.06679916381835938, 0.07144927978515625, 0.07609939575195312, 0.08074951171875, 0.08539962768554688, 0.09004974365234375, 0.09469985961914062, 0.0993499755859375, 0.10400009155273438, 0.10865020751953125, 0.11330032348632812, 0.117950439453125, 0.12260055541992188, 0.12725067138671875, 0.13190078735351562, 0.1365509033203125, 0.14120101928710938, 0.14585113525390625, 0.15050125122070312, 0.1551513671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 10.0, 15.0, 14.0, 11.0, 23.0, 35.0, 36.0, 48.0, 77.0, 83.0, 107.0, 107.0, 93.0, 84.0, 61.0, 53.0, 37.0, 24.0, 14.0, 22.0, 9.0, 9.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2103271484375, -0.20372772216796875, -0.1971282958984375, -0.19052886962890625, -0.183929443359375, -0.17733001708984375, -0.1707305908203125, -0.16413116455078125, -0.15753173828125, -0.15093231201171875, -0.1443328857421875, -0.13773345947265625, -0.131134033203125, -0.12453460693359375, -0.1179351806640625, -0.11133575439453125, -0.104736328125, -0.09813690185546875, -0.0915374755859375, -0.08493804931640625, -0.078338623046875, -0.07173919677734375, -0.0651397705078125, -0.05854034423828125, -0.05194091796875, -0.04534149169921875, -0.0387420654296875, -0.03214263916015625, -0.025543212890625, -0.01894378662109375, -0.0123443603515625, -0.00574493408203125, 0.0008544921875, 0.00745391845703125, 0.0140533447265625, 0.02065277099609375, 0.027252197265625, 0.03385162353515625, 0.0404510498046875, 0.04705047607421875, 0.05364990234375, 0.06024932861328125, 0.0668487548828125, 0.07344818115234375, 0.080047607421875, 0.08664703369140625, 0.0932464599609375, 0.09984588623046875, 0.1064453125, 0.11304473876953125, 0.1196441650390625, 0.12624359130859375, 0.132843017578125, 0.13944244384765625, 0.1460418701171875, 0.15264129638671875, 0.15924072265625, 0.16584014892578125, 0.1724395751953125, 0.17903900146484375, 0.185638427734375, 0.19223785400390625, 0.1988372802734375, 0.20543670654296875, 0.2120361328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 17.0, 21.0, 33.0, 51.0, 68.0, 88.0, 70.0, 81.0, 103.0, 79.0, 90.0, 81.0, 56.0, 42.0, 36.0, 25.0, 11.0, 12.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.058450222015381, -1.9919641017913818, -1.9254779815673828, -1.8589919805526733, -1.7925058603286743, -1.7260197401046753, -1.6595337390899658, -1.5930476188659668, -1.5265614986419678, -1.4600753784179688, -1.3935892581939697, -1.3271032571792603, -1.2606171369552612, -1.1941310167312622, -1.1276450157165527, -1.0611588954925537, -0.9946727752685547, -0.9281866550445557, -0.8617005944252014, -0.7952145338058472, -0.7287284135818481, -0.6622422933578491, -0.5957562327384949, -0.5292701721191406, -0.4627840518951416, -0.39629796147346497, -0.32981187105178833, -0.2633257806301117, -0.19683969020843506, -0.13035359978675842, -0.06386750936508179, 0.0026185810565948486, 0.06910467147827148, 0.13559076189994812, 0.20207685232162476, 0.2685629427433014, 0.335049033164978, 0.40153512358665466, 0.4680212140083313, 0.5345072746276855, 0.6009933948516846, 0.6674795150756836, 0.7339655756950378, 0.8004516363143921, 0.8669377565383911, 0.9334238767623901, 0.9999099373817444, 1.0663959980010986, 1.1328821182250977, 1.1993682384490967, 1.2658543586730957, 1.3323403596878052, 1.3988264799118042, 1.4653126001358032, 1.5317986011505127, 1.5982847213745117, 1.6647708415985107, 1.7312569618225098, 1.7977430820465088, 1.8642290830612183, 1.9307152032852173, 1.9972013235092163, 2.063687324523926, 2.130173444747925, 2.196659564971924]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 8.0, 5.0, 11.0, 12.0, 7.0, 16.0, 19.0, 16.0, 17.0, 17.0, 19.0, 25.0, 37.0, 28.0, 30.0, 45.0, 31.0, 40.0, 43.0, 38.0, 60.0, 50.0, 38.0, 35.0, 35.0, 43.0, 35.0, 33.0, 24.0, 28.0, 29.0, 20.0, 16.0, 18.0, 12.0, 7.0, 9.0, 7.0, 6.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4276683330535889, -1.3805620670318604, -1.3334559202194214, -1.2863496541976929, -1.2392433881759644, -1.1921372413635254, -1.1450309753417969, -1.0979247093200684, -1.0508184432983398, -1.0037121772766113, -0.9566059708595276, -0.9094997644424438, -0.8623934984207153, -0.8152872920036316, -0.7681810855865479, -0.7210748195648193, -0.6739686727523804, -0.6268624663352966, -0.5797562003135681, -0.5326499938964844, -0.48554375767707825, -0.4384375214576721, -0.3913313150405884, -0.34422507882118225, -0.2971188426017761, -0.25001260638237, -0.20290638506412506, -0.15580016374588013, -0.108693927526474, -0.06158769130706787, -0.01448148488998413, 0.032624751329422, 0.07973098754882812, 0.12683722376823425, 0.1739434450864792, 0.22104966640472412, 0.26815590262413025, 0.3152621388435364, 0.3623683452606201, 0.40947458148002625, 0.4565808176994324, 0.5036870241165161, 0.5507932901382446, 0.5978994965553284, 0.6450057029724121, 0.6921119689941406, 0.7392181754112244, 0.7863243818283081, 0.8334306478500366, 0.8805368542671204, 0.9276431202888489, 0.9747493267059326, 1.0218555927276611, 1.0689618587493896, 1.1160680055618286, 1.1631742715835571, 1.210280418395996, 1.2573866844177246, 1.3044928312301636, 1.351599097251892, 1.3987053632736206, 1.4458115100860596, 1.492917776107788, 1.5400240421295166, 1.5871303081512451]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 8.0, 13.0, 20.0, 37.0, 54.0, 78.0, 154.0, 236.0, 414.0, 867.0, 1632.0, 3209.0, 7231.0, 16718.0, 40968.0, 108778.0, 354673.0, 1707446.0, 1481594.0, 307568.0, 97087.0, 37012.0, 15480.0, 6618.0, 3043.0, 1526.0, 821.0, 437.0, 217.0, 124.0, 79.0, 55.0, 40.0, 25.0, 6.0, 11.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.266845703125, -0.2546882629394531, -0.24253082275390625, -0.23037338256835938, -0.2182159423828125, -0.20605850219726562, -0.19390106201171875, -0.18174362182617188, -0.169586181640625, -0.15742874145507812, -0.14527130126953125, -0.13311386108398438, -0.1209564208984375, -0.10879898071289062, -0.09664154052734375, -0.08448410034179688, -0.07232666015625, -0.060169219970703125, -0.04801177978515625, -0.035854339599609375, -0.0236968994140625, -0.011539459228515625, 0.00061798095703125, 0.012775421142578125, 0.024932861328125, 0.037090301513671875, 0.04924774169921875, 0.061405181884765625, 0.0735626220703125, 0.08572006225585938, 0.09787750244140625, 0.11003494262695312, 0.1221923828125, 0.13434982299804688, 0.14650726318359375, 0.15866470336914062, 0.1708221435546875, 0.18297958374023438, 0.19513702392578125, 0.20729446411132812, 0.219451904296875, 0.23160934448242188, 0.24376678466796875, 0.2559242248535156, 0.2680816650390625, 0.2802391052246094, 0.29239654541015625, 0.3045539855957031, 0.31671142578125, 0.3288688659667969, 0.34102630615234375, 0.3531837463378906, 0.3653411865234375, 0.3774986267089844, 0.38965606689453125, 0.4018135070800781, 0.413970947265625, 0.4261283874511719, 0.43828582763671875, 0.4504432678222656, 0.4626007080078125, 0.4747581481933594, 0.48691558837890625, 0.4990730285644531, 0.51123046875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 4.0, 11.0, 7.0, 13.0, 11.0, 15.0, 11.0, 17.0, 15.0, 22.0, 23.0, 22.0, 19.0, 34.0, 36.0, 39.0, 41.0, 29.0, 45.0, 41.0, 38.0, 32.0, 44.0, 39.0, 48.0, 34.0, 34.0, 33.0, 20.0, 24.0, 20.0, 23.0, 28.0, 16.0, 12.0, 17.0, 19.0, 6.0, 11.0, 12.0, 7.0, 6.0, 4.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.16796875, -0.16219329833984375, -0.1564178466796875, -0.15064239501953125, -0.144866943359375, -0.13909149169921875, -0.1333160400390625, -0.12754058837890625, -0.12176513671875, -0.11598968505859375, -0.1102142333984375, -0.10443878173828125, -0.098663330078125, -0.09288787841796875, -0.0871124267578125, -0.08133697509765625, -0.0755615234375, -0.06978607177734375, -0.0640106201171875, -0.05823516845703125, -0.052459716796875, -0.04668426513671875, -0.0409088134765625, -0.03513336181640625, -0.02935791015625, -0.02358245849609375, -0.0178070068359375, -0.01203155517578125, -0.006256103515625, -0.00048065185546875, 0.0052947998046875, 0.01107025146484375, 0.016845703125, 0.02262115478515625, 0.0283966064453125, 0.03417205810546875, 0.039947509765625, 0.04572296142578125, 0.0514984130859375, 0.05727386474609375, 0.06304931640625, 0.06882476806640625, 0.0746002197265625, 0.08037567138671875, 0.086151123046875, 0.09192657470703125, 0.0977020263671875, 0.10347747802734375, 0.1092529296875, 0.11502838134765625, 0.1208038330078125, 0.12657928466796875, 0.132354736328125, 0.13813018798828125, 0.1439056396484375, 0.14968109130859375, 0.15545654296875, 0.16123199462890625, 0.1670074462890625, 0.17278289794921875, 0.178558349609375, 0.18433380126953125, 0.1901092529296875, 0.19588470458984375, 0.20166015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 17.0, 24.0, 35.0, 54.0, 105.0, 127.0, 229.0, 355.0, 601.0, 1220.0, 2417.0, 5924.0, 15520.0, 46205.0, 153358.0, 692175.0, 2538330.0, 544356.0, 129757.0, 39734.0, 13636.0, 5265.0, 2297.0, 1114.0, 562.0, 328.0, 205.0, 114.0, 89.0, 37.0, 28.0, 24.0, 6.0, 6.0, 4.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.56982421875, -0.5527801513671875, -0.535736083984375, -0.5186920166015625, -0.50164794921875, -0.4846038818359375, -0.467559814453125, -0.4505157470703125, -0.4334716796875, -0.4164276123046875, -0.399383544921875, -0.3823394775390625, -0.36529541015625, -0.3482513427734375, -0.331207275390625, -0.3141632080078125, -0.297119140625, -0.2800750732421875, -0.263031005859375, -0.2459869384765625, -0.22894287109375, -0.2118988037109375, -0.194854736328125, -0.1778106689453125, -0.1607666015625, -0.1437225341796875, -0.126678466796875, -0.1096343994140625, -0.09259033203125, -0.0755462646484375, -0.058502197265625, -0.0414581298828125, -0.0244140625, -0.0073699951171875, 0.009674072265625, 0.0267181396484375, 0.04376220703125, 0.0608062744140625, 0.077850341796875, 0.0948944091796875, 0.1119384765625, 0.1289825439453125, 0.146026611328125, 0.1630706787109375, 0.18011474609375, 0.1971588134765625, 0.214202880859375, 0.2312469482421875, 0.248291015625, 0.2653350830078125, 0.282379150390625, 0.2994232177734375, 0.31646728515625, 0.3335113525390625, 0.350555419921875, 0.3675994873046875, 0.3846435546875, 0.4016876220703125, 0.418731689453125, 0.4357757568359375, 0.45281982421875, 0.4698638916015625, 0.486907958984375, 0.5039520263671875, 0.52099609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 10.0, 6.0, 13.0, 13.0, 19.0, 24.0, 34.0, 49.0, 61.0, 64.0, 88.0, 148.0, 188.0, 308.0, 465.0, 628.0, 626.0, 378.0, 262.0, 156.0, 126.0, 100.0, 77.0, 56.0, 31.0, 31.0, 26.0, 16.0, 13.0, 13.0, 12.0, 6.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.552734375, -0.536865234375, -0.52099609375, -0.505126953125, -0.4892578125, -0.473388671875, -0.45751953125, -0.441650390625, -0.42578125, -0.409912109375, -0.39404296875, -0.378173828125, -0.3623046875, -0.346435546875, -0.33056640625, -0.314697265625, -0.298828125, -0.282958984375, -0.26708984375, -0.251220703125, -0.2353515625, -0.219482421875, -0.20361328125, -0.187744140625, -0.171875, -0.156005859375, -0.14013671875, -0.124267578125, -0.1083984375, -0.092529296875, -0.07666015625, -0.060791015625, -0.044921875, -0.029052734375, -0.01318359375, 0.002685546875, 0.0185546875, 0.034423828125, 0.05029296875, 0.066162109375, 0.08203125, 0.097900390625, 0.11376953125, 0.129638671875, 0.1455078125, 0.161376953125, 0.17724609375, 0.193115234375, 0.208984375, 0.224853515625, 0.24072265625, 0.256591796875, 0.2724609375, 0.288330078125, 0.30419921875, 0.320068359375, 0.3359375, 0.351806640625, 0.36767578125, 0.383544921875, 0.3994140625, 0.415283203125, 0.43115234375, 0.447021484375, 0.462890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 18.0, 30.0, 64.0, 92.0, 136.0, 153.0, 153.0, 141.0, 89.0, 50.0, 33.0, 19.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.621156692504883, -5.490445613861084, -5.359734535217285, -5.229023456573486, -5.0983123779296875, -4.967601776123047, -4.83689022064209, -4.706179618835449, -4.57546854019165, -4.444757461547852, -4.314046382904053, -4.183335304260254, -4.052624225616455, -3.9219133853912354, -3.7912023067474365, -3.6604912281036377, -3.529780149459839, -3.39906907081604, -3.268357992172241, -3.1376471519470215, -3.0069360733032227, -2.876224994659424, -2.745513916015625, -2.614802837371826, -2.4840917587280273, -2.3533806800842285, -2.2226696014404297, -2.091958522796631, -1.9612476825714111, -1.8305366039276123, -1.6998255252838135, -1.5691144466400146, -1.4384033679962158, -1.307692289352417, -1.1769813299179077, -1.0462702512741089, -0.9155592322349548, -0.7848482131958008, -0.654137134552002, -0.5234261155128479, -0.39271509647369385, -0.2620040774345398, -0.13129302859306335, -0.0005819797515869141, 0.13012903928756714, 0.2608400583267212, 0.39155113697052, 0.5222621560096741, 0.6529731750488281, 0.7836841940879822, 0.9143952131271362, 1.045106291770935, 1.1758172512054443, 1.3065283298492432, 1.437239408493042, 1.5679504871368408, 1.69866144657135, 1.829372525215149, 1.9600834846496582, 2.090794563293457, 2.221505641937256, 2.3522167205810547, 2.4829277992248535, 2.6136386394500732, 2.744349718093872]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 9.0, 7.0, 7.0, 11.0, 7.0, 12.0, 14.0, 18.0, 19.0, 31.0, 28.0, 28.0, 28.0, 27.0, 43.0, 46.0, 43.0, 45.0, 51.0, 35.0, 29.0, 42.0, 42.0, 53.0, 34.0, 43.0, 39.0, 32.0, 33.0, 14.0, 21.0, 14.0, 12.0, 15.0, 6.0, 19.0, 9.0, 8.0, 11.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5673120021820068, -1.5174849033355713, -1.4676578044891357, -1.4178305864334106, -1.368003487586975, -1.3181763887405396, -1.2683491706848145, -1.218522071838379, -1.1686949729919434, -1.1188678741455078, -1.0690407752990723, -1.0192135572433472, -0.9693864583969116, -0.9195593595504761, -0.8697322010993958, -0.8199050426483154, -0.7700779438018799, -0.7202508449554443, -0.670423686504364, -0.6205965280532837, -0.5707694292068481, -0.5209423303604126, -0.4711151719093323, -0.42128804326057434, -0.3714609146118164, -0.32163378596305847, -0.27180665731430054, -0.2219795286655426, -0.17215240001678467, -0.12232527136802673, -0.0724981427192688, -0.022671014070510864, 0.02715611457824707, 0.076983243227005, 0.12681037187576294, 0.17663750052452087, 0.2264646291732788, 0.27629175782203674, 0.3261188864707947, 0.3759460151195526, 0.42577314376831055, 0.4756002724170685, 0.5254274010658264, 0.5752545595169067, 0.6250816583633423, 0.6749087572097778, 0.7247359156608582, 0.7745630741119385, 0.824390172958374, 0.8742172718048096, 0.9240444302558899, 0.9738715887069702, 1.0236986875534058, 1.0735257863998413, 1.1233530044555664, 1.173180103302002, 1.2230072021484375, 1.272834300994873, 1.3226613998413086, 1.3724886178970337, 1.4223157167434692, 1.4721428155899048, 1.5219700336456299, 1.5717971324920654, 1.621624231338501]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 9.0, 11.0, 20.0, 34.0, 46.0, 87.0, 126.0, 215.0, 285.0, 535.0, 816.0, 1253.0, 2042.0, 2976.0, 4698.0, 7168.0, 11502.0, 18714.0, 33136.0, 68169.0, 162104.0, 296028.0, 230345.0, 100438.0, 45011.0, 23682.0, 14027.0, 9014.0, 5738.0, 3733.0, 2395.0, 1554.0, 947.0, 608.0, 437.0, 244.0, 166.0, 96.0, 66.0, 29.0, 11.0, 17.0, 9.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34375, -0.3317832946777344, -0.31981658935546875, -0.3078498840332031, -0.2958831787109375, -0.2839164733886719, -0.27194976806640625, -0.2599830627441406, -0.248016357421875, -0.23604965209960938, -0.22408294677734375, -0.21211624145507812, -0.2001495361328125, -0.18818283081054688, -0.17621612548828125, -0.16424942016601562, -0.15228271484375, -0.14031600952148438, -0.12834930419921875, -0.11638259887695312, -0.1044158935546875, -0.09244918823242188, -0.08048248291015625, -0.06851577758789062, -0.056549072265625, -0.044582366943359375, -0.03261566162109375, -0.020648956298828125, -0.0086822509765625, 0.003284454345703125, 0.01525115966796875, 0.027217864990234375, 0.0391845703125, 0.051151275634765625, 0.06311798095703125, 0.07508468627929688, 0.0870513916015625, 0.09901809692382812, 0.11098480224609375, 0.12295150756835938, 0.134918212890625, 0.14688491821289062, 0.15885162353515625, 0.17081832885742188, 0.1827850341796875, 0.19475173950195312, 0.20671844482421875, 0.21868515014648438, 0.23065185546875, 0.24261856079101562, 0.25458526611328125, 0.2665519714355469, 0.2785186767578125, 0.2904853820800781, 0.30245208740234375, 0.3144187927246094, 0.326385498046875, 0.3383522033691406, 0.35031890869140625, 0.3622856140136719, 0.3742523193359375, 0.3862190246582031, 0.39818572998046875, 0.4101524353027344, 0.422119140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 11.0, 16.0, 14.0, 18.0, 16.0, 21.0, 21.0, 26.0, 26.0, 33.0, 33.0, 37.0, 42.0, 42.0, 33.0, 43.0, 36.0, 45.0, 42.0, 41.0, 39.0, 44.0, 36.0, 35.0, 30.0, 27.0, 25.0, 27.0, 17.0, 16.0, 16.0, 16.0, 16.0, 8.0, 6.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2113037109375, -0.2046833038330078, -0.19806289672851562, -0.19144248962402344, -0.18482208251953125, -0.17820167541503906, -0.17158126831054688, -0.1649608612060547, -0.1583404541015625, -0.1517200469970703, -0.14509963989257812, -0.13847923278808594, -0.13185882568359375, -0.12523841857910156, -0.11861801147460938, -0.11199760437011719, -0.105377197265625, -0.09875679016113281, -0.09213638305664062, -0.08551597595214844, -0.07889556884765625, -0.07227516174316406, -0.06565475463867188, -0.05903434753417969, -0.0524139404296875, -0.04579353332519531, -0.039173126220703125, -0.03255271911621094, -0.02593231201171875, -0.019311904907226562, -0.012691497802734375, -0.0060710906982421875, 0.00054931640625, 0.0071697235107421875, 0.013790130615234375, 0.020410537719726562, 0.02703094482421875, 0.03365135192871094, 0.040271759033203125, 0.04689216613769531, 0.0535125732421875, 0.06013298034667969, 0.06675338745117188, 0.07337379455566406, 0.07999420166015625, 0.08661460876464844, 0.09323501586914062, 0.09985542297363281, 0.106475830078125, 0.11309623718261719, 0.11971664428710938, 0.12633705139160156, 0.13295745849609375, 0.13957786560058594, 0.14619827270507812, 0.1528186798095703, 0.1594390869140625, 0.1660594940185547, 0.17267990112304688, 0.17930030822753906, 0.18592071533203125, 0.19254112243652344, 0.19916152954101562, 0.2057819366455078, 0.21240234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 7.0, 7.0, 8.0, 11.0, 10.0, 18.0, 37.0, 25.0, 50.0, 63.0, 90.0, 128.0, 208.0, 345.0, 627.0, 1252.0, 2535.0, 5695.0, 13849.0, 36563.0, 121051.0, 476892.0, 281936.0, 66568.0, 23310.0, 9378.0, 3973.0, 1796.0, 877.0, 463.0, 259.0, 166.0, 102.0, 66.0, 49.0, 38.0, 28.0, 25.0, 13.0, 19.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.8447265625, -0.8217544555664062, -0.7987823486328125, -0.7758102416992188, -0.752838134765625, -0.7298660278320312, -0.7068939208984375, -0.6839218139648438, -0.66094970703125, -0.6379776000976562, -0.6150054931640625, -0.5920333862304688, -0.569061279296875, -0.5460891723632812, -0.5231170654296875, -0.5001449584960938, -0.4771728515625, -0.45420074462890625, -0.4312286376953125, -0.40825653076171875, -0.385284423828125, -0.36231231689453125, -0.3393402099609375, -0.31636810302734375, -0.29339599609375, -0.27042388916015625, -0.2474517822265625, -0.22447967529296875, -0.201507568359375, -0.17853546142578125, -0.1555633544921875, -0.13259124755859375, -0.109619140625, -0.08664703369140625, -0.0636749267578125, -0.04070281982421875, -0.017730712890625, 0.00524139404296875, 0.0282135009765625, 0.05118560791015625, 0.07415771484375, 0.09712982177734375, 0.1201019287109375, 0.14307403564453125, 0.166046142578125, 0.18901824951171875, 0.2119903564453125, 0.23496246337890625, 0.2579345703125, 0.28090667724609375, 0.3038787841796875, 0.32685089111328125, 0.349822998046875, 0.37279510498046875, 0.3957672119140625, 0.41873931884765625, 0.44171142578125, 0.46468353271484375, 0.4876556396484375, 0.5106277465820312, 0.533599853515625, 0.5565719604492188, 0.5795440673828125, 0.6025161743164062, 0.62548828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 8.0, 9.0, 17.0, 12.0, 23.0, 29.0, 31.0, 43.0, 40.0, 54.0, 51.0, 60.0, 67.0, 68.0, 62.0, 63.0, 53.0, 59.0, 52.0, 33.0, 33.0, 31.0, 20.0, 26.0, 15.0, 13.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.224609375, -1.1919937133789062, -1.1593780517578125, -1.1267623901367188, -1.094146728515625, -1.0615310668945312, -1.0289154052734375, -0.9962997436523438, -0.96368408203125, -0.9310684204101562, -0.8984527587890625, -0.8658370971679688, -0.833221435546875, -0.8006057739257812, -0.7679901123046875, -0.7353744506835938, -0.7027587890625, -0.6701431274414062, -0.6375274658203125, -0.6049118041992188, -0.572296142578125, -0.5396804809570312, -0.5070648193359375, -0.47444915771484375, -0.44183349609375, -0.40921783447265625, -0.3766021728515625, -0.34398651123046875, -0.311370849609375, -0.27875518798828125, -0.2461395263671875, -0.21352386474609375, -0.180908203125, -0.14829254150390625, -0.1156768798828125, -0.08306121826171875, -0.050445556640625, -0.01782989501953125, 0.0147857666015625, 0.04740142822265625, 0.08001708984375, 0.11263275146484375, 0.1452484130859375, 0.17786407470703125, 0.210479736328125, 0.24309539794921875, 0.2757110595703125, 0.30832672119140625, 0.3409423828125, 0.37355804443359375, 0.4061737060546875, 0.43878936767578125, 0.471405029296875, 0.5040206909179688, 0.5366363525390625, 0.5692520141601562, 0.60186767578125, 0.6344833374023438, 0.6670989990234375, 0.6997146606445312, 0.732330322265625, 0.7649459838867188, 0.7975616455078125, 0.8301773071289062, 0.86279296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 8.0, 2.0, 8.0, 6.0, 7.0, 7.0, 29.0, 17.0, 39.0, 57.0, 92.0, 165.0, 247.0, 427.0, 708.0, 1307.0, 2413.0, 4724.0, 9615.0, 19942.0, 44618.0, 114098.0, 342489.0, 321636.0, 105531.0, 42368.0, 19090.0, 9163.0, 4408.0, 2359.0, 1236.0, 713.0, 365.0, 243.0, 133.0, 85.0, 56.0, 34.0, 26.0, 21.0, 17.0, 14.0, 6.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.20068359375, -0.1945953369140625, -0.188507080078125, -0.1824188232421875, -0.17633056640625, -0.1702423095703125, -0.164154052734375, -0.1580657958984375, -0.1519775390625, -0.1458892822265625, -0.139801025390625, -0.1337127685546875, -0.12762451171875, -0.1215362548828125, -0.115447998046875, -0.1093597412109375, -0.103271484375, -0.0971832275390625, -0.091094970703125, -0.0850067138671875, -0.07891845703125, -0.0728302001953125, -0.066741943359375, -0.0606536865234375, -0.0545654296875, -0.0484771728515625, -0.042388916015625, -0.0363006591796875, -0.03021240234375, -0.0241241455078125, -0.018035888671875, -0.0119476318359375, -0.005859375, 0.0002288818359375, 0.006317138671875, 0.0124053955078125, 0.01849365234375, 0.0245819091796875, 0.030670166015625, 0.0367584228515625, 0.0428466796875, 0.0489349365234375, 0.055023193359375, 0.0611114501953125, 0.06719970703125, 0.0732879638671875, 0.079376220703125, 0.0854644775390625, 0.091552734375, 0.0976409912109375, 0.103729248046875, 0.1098175048828125, 0.11590576171875, 0.1219940185546875, 0.128082275390625, 0.1341705322265625, 0.1402587890625, 0.1463470458984375, 0.152435302734375, 0.1585235595703125, 0.16461181640625, 0.1707000732421875, 0.176788330078125, 0.1828765869140625, 0.18896484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 9.0, 2.0, 16.0, 10.0, 22.0, 26.0, 38.0, 80.0, 139.0, 186.0, 178.0, 104.0, 54.0, 27.0, 13.0, 19.0, 16.0, 9.0, 11.0, 10.0, 0.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00010943412780761719, -0.00010660570114850998, -0.00010377727448940277, -0.00010094884783029556, -9.812042117118835e-05, -9.529199451208115e-05, -9.246356785297394e-05, -8.963514119386673e-05, -8.680671453475952e-05, -8.397828787565231e-05, -8.11498612165451e-05, -7.83214345574379e-05, -7.549300789833069e-05, -7.266458123922348e-05, -6.983615458011627e-05, -6.700772792100906e-05, -6.417930126190186e-05, -6.135087460279465e-05, -5.852244794368744e-05, -5.569402128458023e-05, -5.286559462547302e-05, -5.0037167966365814e-05, -4.7208741307258606e-05, -4.43803146481514e-05, -4.155188798904419e-05, -3.872346132993698e-05, -3.589503467082977e-05, -3.3066608011722565e-05, -3.0238181352615356e-05, -2.7409754693508148e-05, -2.458132803440094e-05, -2.175290137529373e-05, -1.8924474716186523e-05, -1.6096048057079315e-05, -1.3267621397972107e-05, -1.0439194738864899e-05, -7.6107680797576904e-06, -4.782341420650482e-06, -1.953914761543274e-06, 8.745118975639343e-07, 3.7029385566711426e-06, 6.531365215778351e-06, 9.359791874885559e-06, 1.2188218533992767e-05, 1.5016645193099976e-05, 1.7845071852207184e-05, 2.0673498511314392e-05, 2.35019251704216e-05, 2.633035182952881e-05, 2.9158778488636017e-05, 3.1987205147743225e-05, 3.481563180685043e-05, 3.764405846595764e-05, 4.047248512506485e-05, 4.330091178417206e-05, 4.6129338443279266e-05, 4.8957765102386475e-05, 5.178619176149368e-05, 5.461461842060089e-05, 5.74430450797081e-05, 6.027147173881531e-05, 6.309989839792252e-05, 6.592832505702972e-05, 6.875675171613693e-05, 7.158517837524414e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 6.0, 9.0, 13.0, 16.0, 21.0, 24.0, 33.0, 50.0, 65.0, 92.0, 142.0, 198.0, 320.0, 465.0, 893.0, 1681.0, 3525.0, 7903.0, 18641.0, 45373.0, 116221.0, 321300.0, 329039.0, 120657.0, 46512.0, 19540.0, 8040.0, 3732.0, 1700.0, 883.0, 490.0, 292.0, 206.0, 138.0, 84.0, 62.0, 62.0, 41.0, 28.0, 23.0, 13.0, 11.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20263671875, -0.19684982299804688, -0.19106292724609375, -0.18527603149414062, -0.1794891357421875, -0.17370223999023438, -0.16791534423828125, -0.16212844848632812, -0.156341552734375, -0.15055465698242188, -0.14476776123046875, -0.13898086547851562, -0.1331939697265625, -0.12740707397460938, -0.12162017822265625, -0.11583328247070312, -0.11004638671875, -0.10425949096679688, -0.09847259521484375, -0.09268569946289062, -0.0868988037109375, -0.08111190795898438, -0.07532501220703125, -0.06953811645507812, -0.063751220703125, -0.057964324951171875, -0.05217742919921875, -0.046390533447265625, -0.0406036376953125, -0.034816741943359375, -0.02902984619140625, -0.023242950439453125, -0.0174560546875, -0.011669158935546875, -0.00588226318359375, -9.5367431640625e-05, 0.0056915283203125, 0.011478424072265625, 0.01726531982421875, 0.023052215576171875, 0.028839111328125, 0.034626007080078125, 0.04041290283203125, 0.046199798583984375, 0.0519866943359375, 0.057773590087890625, 0.06356048583984375, 0.06934738159179688, 0.07513427734375, 0.08092117309570312, 0.08670806884765625, 0.09249496459960938, 0.0982818603515625, 0.10406875610351562, 0.10985565185546875, 0.11564254760742188, 0.121429443359375, 0.12721633911132812, 0.13300323486328125, 0.13879013061523438, 0.1445770263671875, 0.15036392211914062, 0.15615081787109375, 0.16193771362304688, 0.167724609375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 10.0, 7.0, 12.0, 14.0, 22.0, 25.0, 25.0, 28.0, 38.0, 41.0, 55.0, 62.0, 75.0, 78.0, 86.0, 73.0, 53.0, 49.0, 34.0, 34.0, 32.0, 14.0, 20.0, 15.0, 13.0, 11.0, 15.0, 7.0, 8.0, 5.0, 5.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.1500244140625, -0.14404296875, -0.1380615234375, -0.132080078125, -0.1260986328125, -0.1201171875, -0.1141357421875, -0.108154296875, -0.1021728515625, -0.09619140625, -0.0902099609375, -0.084228515625, -0.0782470703125, -0.072265625, -0.0662841796875, -0.060302734375, -0.0543212890625, -0.04833984375, -0.0423583984375, -0.036376953125, -0.0303955078125, -0.0244140625, -0.0184326171875, -0.012451171875, -0.0064697265625, -0.00048828125, 0.0054931640625, 0.011474609375, 0.0174560546875, 0.0234375, 0.0294189453125, 0.035400390625, 0.0413818359375, 0.04736328125, 0.0533447265625, 0.059326171875, 0.0653076171875, 0.0712890625, 0.0772705078125, 0.083251953125, 0.0892333984375, 0.09521484375, 0.1011962890625, 0.107177734375, 0.1131591796875, 0.119140625, 0.1251220703125, 0.131103515625, 0.1370849609375, 0.14306640625, 0.1490478515625, 0.155029296875, 0.1610107421875, 0.1669921875, 0.1729736328125, 0.178955078125, 0.1849365234375, 0.19091796875, 0.1968994140625, 0.202880859375, 0.2088623046875, 0.21484375, 0.2208251953125, 0.226806640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 14.0, 19.0, 62.0, 146.0, 217.0, 230.0, 159.0, 91.0, 34.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.352656841278076, -6.17669153213501, -6.000726222991943, -5.824760913848877, -5.6487956047058105, -5.472830295562744, -5.2968645095825195, -5.120899200439453, -4.944933891296387, -4.76896858215332, -4.593003273010254, -4.4170379638671875, -4.241072654724121, -4.065107345581055, -3.889141798019409, -3.7131764888763428, -3.5372114181518555, -3.361246109008789, -3.1852807998657227, -3.0093154907226562, -2.83335018157959, -2.6573848724365234, -2.481419324874878, -2.3054540157318115, -2.129488706588745, -1.9535233974456787, -1.7775580883026123, -1.6015926599502563, -1.42562735080719, -1.2496620416641235, -1.0736966133117676, -0.8977313041687012, -0.7217655181884766, -0.5458002090454102, -0.369834840297699, -0.1938694715499878, -0.017904162406921387, 0.15806114673614502, 0.334026575088501, 0.5099918842315674, 0.6859571933746338, 0.8619225025177002, 1.0378878116607666, 1.2138532400131226, 1.389818549156189, 1.5657838582992554, 1.7417492866516113, 1.9177145957946777, 2.093679904937744, 2.2696452140808105, 2.445610523223877, 2.6215758323669434, 2.7975411415100098, 2.973506450653076, 3.1494719982147217, 3.325437307357788, 3.5014026165008545, 3.677367925643921, 3.8533332347869873, 4.029298782348633, 4.205264091491699, 4.381229400634766, 4.557194709777832, 4.733160018920898, 4.909125328063965]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 0.0, 4.0, 5.0, 5.0, 13.0, 10.0, 10.0, 13.0, 17.0, 9.0, 25.0, 19.0, 22.0, 34.0, 14.0, 37.0, 25.0, 25.0, 42.0, 39.0, 49.0, 35.0, 31.0, 32.0, 51.0, 34.0, 42.0, 37.0, 36.0, 40.0, 25.0, 29.0, 19.0, 27.0, 19.0, 27.0, 20.0, 16.0, 16.0, 12.0, 11.0, 9.0, 1.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7826440334320068, -1.7286403179168701, -1.674636721611023, -1.6206330060958862, -1.5666292905807495, -1.5126256942749023, -1.4586219787597656, -1.404618263244629, -1.3506145477294922, -1.2966108322143555, -1.2426072359085083, -1.1886035203933716, -1.1345998048782349, -1.0805962085723877, -1.026592493057251, -0.9725887775421143, -0.9185851812362671, -0.8645815253257751, -0.8105778098106384, -0.7565741539001465, -0.7025704383850098, -0.6485667824745178, -0.5945631265640259, -0.5405594110488892, -0.4865557551383972, -0.4325520694255829, -0.37854838371276855, -0.3245447278022766, -0.2705410420894623, -0.21653735637664795, -0.162533700466156, -0.10853001475334167, -0.054526329040527344, -0.0005226507782936096, 0.053481027483940125, 0.10748469829559326, 0.1614883840084076, 0.21549206972122192, 0.26949572563171387, 0.3234994113445282, 0.37750309705734253, 0.43150678277015686, 0.4855104684829712, 0.5395141243934631, 0.5935177803039551, 0.6475214958190918, 0.7015251517295837, 0.7555288076400757, 0.8095325231552124, 0.8635361790657043, 0.9175398945808411, 0.971543550491333, 1.0255472660064697, 1.0795509815216064, 1.1335545778274536, 1.1875582933425903, 1.2415618896484375, 1.2955656051635742, 1.3495692014694214, 1.403572916984558, 1.4575766324996948, 1.511580228805542, 1.5655839443206787, 1.6195876598358154, 1.6735913753509521]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 6.0, 8.0, 13.0, 20.0, 27.0, 29.0, 52.0, 88.0, 138.0, 202.0, 311.0, 493.0, 850.0, 1440.0, 2452.0, 4335.0, 8095.0, 15054.0, 29420.0, 59536.0, 131706.0, 329281.0, 942850.0, 1533463.0, 684014.0, 246965.0, 103852.0, 48384.0, 23998.0, 12197.0, 6481.0, 3484.0, 2015.0, 1200.0, 724.0, 377.0, 259.0, 161.0, 114.0, 65.0, 45.0, 31.0, 25.0, 8.0, 5.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2435302734375, -0.2355060577392578, -0.22748184204101562, -0.21945762634277344, -0.21143341064453125, -0.20340919494628906, -0.19538497924804688, -0.1873607635498047, -0.1793365478515625, -0.1713123321533203, -0.16328811645507812, -0.15526390075683594, -0.14723968505859375, -0.13921546936035156, -0.13119125366210938, -0.12316703796386719, -0.115142822265625, -0.10711860656738281, -0.09909439086914062, -0.09107017517089844, -0.08304595947265625, -0.07502174377441406, -0.06699752807617188, -0.05897331237792969, -0.0509490966796875, -0.04292488098144531, -0.034900665283203125, -0.026876449584960938, -0.01885223388671875, -0.010828018188476562, -0.002803802490234375, 0.0052204132080078125, 0.01324462890625, 0.021268844604492188, 0.029293060302734375, 0.03731727600097656, 0.04534149169921875, 0.05336570739746094, 0.061389923095703125, 0.06941413879394531, 0.0774383544921875, 0.08546257019042969, 0.09348678588867188, 0.10151100158691406, 0.10953521728515625, 0.11755943298339844, 0.12558364868164062, 0.1336078643798828, 0.141632080078125, 0.1496562957763672, 0.15768051147460938, 0.16570472717285156, 0.17372894287109375, 0.18175315856933594, 0.18977737426757812, 0.1978015899658203, 0.2058258056640625, 0.2138500213623047, 0.22187423706054688, 0.22989845275878906, 0.23792266845703125, 0.24594688415527344, 0.2539710998535156, 0.2619953155517578, 0.27001953125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 1.0, 5.0, 2.0, 6.0, 3.0, 8.0, 6.0, 9.0, 6.0, 12.0, 12.0, 11.0, 17.0, 16.0, 20.0, 27.0, 33.0, 26.0, 37.0, 32.0, 27.0, 28.0, 32.0, 31.0, 43.0, 49.0, 51.0, 47.0, 42.0, 30.0, 45.0, 28.0, 31.0, 25.0, 30.0, 21.0, 23.0, 17.0, 20.0, 16.0, 18.0, 12.0, 10.0, 6.0, 6.0, 5.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1776123046875, -0.17143630981445312, -0.16526031494140625, -0.15908432006835938, -0.1529083251953125, -0.14673233032226562, -0.14055633544921875, -0.13438034057617188, -0.128204345703125, -0.12202835083007812, -0.11585235595703125, -0.10967636108398438, -0.1035003662109375, -0.09732437133789062, -0.09114837646484375, -0.08497238159179688, -0.07879638671875, -0.07262039184570312, -0.06644439697265625, -0.060268402099609375, -0.0540924072265625, -0.047916412353515625, -0.04174041748046875, -0.035564422607421875, -0.029388427734375, -0.023212432861328125, -0.01703643798828125, -0.010860443115234375, -0.0046844482421875, 0.001491546630859375, 0.00766754150390625, 0.013843536376953125, 0.02001953125, 0.026195526123046875, 0.03237152099609375, 0.038547515869140625, 0.0447235107421875, 0.050899505615234375, 0.05707550048828125, 0.06325149536132812, 0.069427490234375, 0.07560348510742188, 0.08177947998046875, 0.08795547485351562, 0.0941314697265625, 0.10030746459960938, 0.10648345947265625, 0.11265945434570312, 0.11883544921875, 0.12501144409179688, 0.13118743896484375, 0.13736343383789062, 0.1435394287109375, 0.14971542358398438, 0.15589141845703125, 0.16206741333007812, 0.168243408203125, 0.17441940307617188, 0.18059539794921875, 0.18677139282226562, 0.1929473876953125, 0.19912338256835938, 0.20529937744140625, 0.21147537231445312, 0.2176513671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 8.0, 14.0, 31.0, 30.0, 46.0, 87.0, 127.0, 193.0, 250.0, 457.0, 791.0, 1408.0, 2954.0, 6689.0, 16404.0, 46557.0, 141669.0, 493585.0, 2103897.0, 1012044.0, 245004.0, 76432.0, 26308.0, 10120.0, 4304.0, 2005.0, 1121.0, 625.0, 352.0, 254.0, 169.0, 107.0, 56.0, 38.0, 32.0, 21.0, 15.0, 21.0, 12.0, 8.0, 6.0, 1.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.43994140625, -0.42462921142578125, -0.4093170166015625, -0.39400482177734375, -0.378692626953125, -0.36338043212890625, -0.3480682373046875, -0.33275604248046875, -0.31744384765625, -0.30213165283203125, -0.2868194580078125, -0.27150726318359375, -0.256195068359375, -0.24088287353515625, -0.2255706787109375, -0.21025848388671875, -0.1949462890625, -0.17963409423828125, -0.1643218994140625, -0.14900970458984375, -0.133697509765625, -0.11838531494140625, -0.1030731201171875, -0.08776092529296875, -0.07244873046875, -0.05713653564453125, -0.0418243408203125, -0.02651214599609375, -0.011199951171875, 0.00411224365234375, 0.0194244384765625, 0.03473663330078125, 0.050048828125, 0.06536102294921875, 0.0806732177734375, 0.09598541259765625, 0.111297607421875, 0.12660980224609375, 0.1419219970703125, 0.15723419189453125, 0.17254638671875, 0.18785858154296875, 0.2031707763671875, 0.21848297119140625, 0.233795166015625, 0.24910736083984375, 0.2644195556640625, 0.27973175048828125, 0.2950439453125, 0.31035614013671875, 0.3256683349609375, 0.34098052978515625, 0.356292724609375, 0.37160491943359375, 0.3869171142578125, 0.40222930908203125, 0.41754150390625, 0.43285369873046875, 0.4481658935546875, 0.46347808837890625, 0.478790283203125, 0.49410247802734375, 0.5094146728515625, 0.5247268676757812, 0.5400390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 13.0, 19.0, 28.0, 46.0, 66.0, 90.0, 122.0, 156.0, 237.0, 348.0, 527.0, 693.0, 588.0, 341.0, 225.0, 147.0, 102.0, 81.0, 60.0, 54.0, 35.0, 23.0, 18.0, 9.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5140228271484375, -0.493865966796875, -0.4737091064453125, -0.45355224609375, -0.4333953857421875, -0.413238525390625, -0.3930816650390625, -0.3729248046875, -0.3527679443359375, -0.332611083984375, -0.3124542236328125, -0.29229736328125, -0.2721405029296875, -0.251983642578125, -0.2318267822265625, -0.211669921875, -0.1915130615234375, -0.171356201171875, -0.1511993408203125, -0.13104248046875, -0.1108856201171875, -0.090728759765625, -0.0705718994140625, -0.0504150390625, -0.0302581787109375, -0.010101318359375, 0.0100555419921875, 0.03021240234375, 0.0503692626953125, 0.070526123046875, 0.0906829833984375, 0.11083984375, 0.1309967041015625, 0.151153564453125, 0.1713104248046875, 0.19146728515625, 0.2116241455078125, 0.231781005859375, 0.2519378662109375, 0.2720947265625, 0.2922515869140625, 0.312408447265625, 0.3325653076171875, 0.35272216796875, 0.3728790283203125, 0.393035888671875, 0.4131927490234375, 0.433349609375, 0.4535064697265625, 0.473663330078125, 0.4938201904296875, 0.51397705078125, 0.5341339111328125, 0.554290771484375, 0.5744476318359375, 0.5946044921875, 0.6147613525390625, 0.634918212890625, 0.6550750732421875, 0.67523193359375, 0.6953887939453125, 0.715545654296875, 0.7357025146484375, 0.755859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 13.0, 23.0, 63.0, 74.0, 121.0, 129.0, 145.0, 138.0, 104.0, 83.0, 39.0, 25.0, 15.0, 5.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9223976135253906, -3.7934978008270264, -3.664597988128662, -3.535698413848877, -3.4067986011505127, -3.2778987884521484, -3.1489992141723633, -3.020099401473999, -2.8911995887756348, -2.7622997760772705, -2.6333999633789062, -2.504500389099121, -2.375600576400757, -2.2467007637023926, -2.1178011894226074, -1.9889013767242432, -1.860001564025879, -1.7311017513275146, -1.60220205783844, -1.4733023643493652, -1.344402551651001, -1.2155027389526367, -1.086603045463562, -0.9577032923698425, -0.828803539276123, -0.6999037861824036, -0.5710040330886841, -0.4421042799949646, -0.3132045269012451, -0.18430477380752563, -0.05540502071380615, 0.07349473237991333, 0.2023940086364746, 0.3312937617301941, 0.4601935148239136, 0.5890932679176331, 0.7179930210113525, 0.846892774105072, 0.9757925271987915, 1.1046922206878662, 1.2335920333862305, 1.3624918460845947, 1.4913915395736694, 1.6202912330627441, 1.7491910457611084, 1.8780908584594727, 2.006990432739258, 2.135890245437622, 2.2647900581359863, 2.3936898708343506, 2.522589683532715, 2.6514892578125, 2.7803890705108643, 2.9092888832092285, 3.0381884574890137, 3.167088270187378, 3.295988082885742, 3.4248878955841064, 3.5537877082824707, 3.682687282562256, 3.81158709526062, 3.9404869079589844, 4.0693864822387695, 4.198286533355713, 4.327186107635498]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 9.0, 8.0, 14.0, 12.0, 14.0, 13.0, 19.0, 19.0, 20.0, 35.0, 38.0, 23.0, 32.0, 35.0, 45.0, 40.0, 45.0, 47.0, 46.0, 39.0, 46.0, 51.0, 32.0, 39.0, 30.0, 29.0, 29.0, 25.0, 35.0, 19.0, 17.0, 17.0, 11.0, 13.0, 8.0, 9.0, 13.0, 8.0, 1.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.1739280223846436, -2.1132686138153076, -2.0526092052459717, -1.9919497966766357, -1.9312903881072998, -1.8706309795379639, -1.809971570968628, -1.7493120431900024, -1.6886526346206665, -1.6279932260513306, -1.5673338174819946, -1.5066744089126587, -1.4460150003433228, -1.3853554725646973, -1.3246960639953613, -1.2640366554260254, -1.2033772468566895, -1.1427178382873535, -1.0820584297180176, -1.0213990211486816, -0.9607395529747009, -0.900080144405365, -0.839420735836029, -0.7787612676620483, -0.718101978302002, -0.657442569732666, -0.5967831611633301, -0.5361237525939941, -0.4754642844200134, -0.4148048758506775, -0.35414546728134155, -0.2934860289096832, -0.2328265905380249, -0.17216716706752777, -0.11150775104761124, -0.0508483350276947, 0.00981108844280243, 0.07047051191329956, 0.1311299204826355, 0.19178935885429382, 0.25244876742362976, 0.3131081759929657, 0.373767614364624, 0.43442702293395996, 0.4950864315032959, 0.5557458400726318, 0.6164052486419678, 0.6770647168159485, 0.7377241253852844, 0.7983835339546204, 0.8590429425239563, 0.919702410697937, 0.980361819267273, 1.0410212278366089, 1.1016806364059448, 1.1623400449752808, 1.2229994535446167, 1.2836588621139526, 1.3443182706832886, 1.4049776792526245, 1.4656370878219604, 1.526296615600586, 1.5869560241699219, 1.6476154327392578, 1.7082748413085938]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 8.0, 3.0, 7.0, 14.0, 12.0, 13.0, 18.0, 40.0, 57.0, 72.0, 107.0, 172.0, 254.0, 384.0, 501.0, 826.0, 1262.0, 1891.0, 2827.0, 4252.0, 6505.0, 10039.0, 15177.0, 23480.0, 37822.0, 65282.0, 119097.0, 198675.0, 216936.0, 142443.0, 77853.0, 44726.0, 27253.0, 17297.0, 11388.0, 7449.0, 4933.0, 3221.0, 2087.0, 1447.0, 912.0, 626.0, 392.0, 267.0, 187.0, 108.0, 90.0, 50.0, 38.0, 26.0, 13.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.287841796875, -0.27860260009765625, -0.2693634033203125, -0.26012420654296875, -0.250885009765625, -0.24164581298828125, -0.2324066162109375, -0.22316741943359375, -0.21392822265625, -0.20468902587890625, -0.1954498291015625, -0.18621063232421875, -0.176971435546875, -0.16773223876953125, -0.1584930419921875, -0.14925384521484375, -0.1400146484375, -0.13077545166015625, -0.1215362548828125, -0.11229705810546875, -0.103057861328125, -0.09381866455078125, -0.0845794677734375, -0.07534027099609375, -0.06610107421875, -0.05686187744140625, -0.0476226806640625, -0.03838348388671875, -0.029144287109375, -0.01990509033203125, -0.0106658935546875, -0.00142669677734375, 0.0078125, 0.01705169677734375, 0.0262908935546875, 0.03553009033203125, 0.044769287109375, 0.05400848388671875, 0.0632476806640625, 0.07248687744140625, 0.08172607421875, 0.09096527099609375, 0.1002044677734375, 0.10944366455078125, 0.118682861328125, 0.12792205810546875, 0.1371612548828125, 0.14640045166015625, 0.1556396484375, 0.16487884521484375, 0.1741180419921875, 0.18335723876953125, 0.192596435546875, 0.20183563232421875, 0.2110748291015625, 0.22031402587890625, 0.22955322265625, 0.23879241943359375, 0.2480316162109375, 0.25727081298828125, 0.266510009765625, 0.27574920654296875, 0.2849884033203125, 0.29422760009765625, 0.303466796875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 4.0, 10.0, 15.0, 18.0, 17.0, 20.0, 20.0, 32.0, 25.0, 38.0, 47.0, 34.0, 34.0, 43.0, 45.0, 42.0, 46.0, 43.0, 40.0, 43.0, 44.0, 45.0, 25.0, 31.0, 22.0, 30.0, 27.0, 13.0, 19.0, 23.0, 18.0, 17.0, 18.0, 4.0, 7.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2196044921875, -0.21258544921875, -0.20556640625, -0.19854736328125, -0.1915283203125, -0.18450927734375, -0.177490234375, -0.17047119140625, -0.1634521484375, -0.15643310546875, -0.1494140625, -0.14239501953125, -0.1353759765625, -0.12835693359375, -0.121337890625, -0.11431884765625, -0.1072998046875, -0.10028076171875, -0.09326171875, -0.08624267578125, -0.0792236328125, -0.07220458984375, -0.065185546875, -0.05816650390625, -0.0511474609375, -0.04412841796875, -0.037109375, -0.03009033203125, -0.0230712890625, -0.01605224609375, -0.009033203125, -0.00201416015625, 0.0050048828125, 0.01202392578125, 0.01904296875, 0.02606201171875, 0.0330810546875, 0.04010009765625, 0.047119140625, 0.05413818359375, 0.0611572265625, 0.06817626953125, 0.0751953125, 0.08221435546875, 0.0892333984375, 0.09625244140625, 0.103271484375, 0.11029052734375, 0.1173095703125, 0.12432861328125, 0.13134765625, 0.13836669921875, 0.1453857421875, 0.15240478515625, 0.159423828125, 0.16644287109375, 0.1734619140625, 0.18048095703125, 0.1875, 0.19451904296875, 0.2015380859375, 0.20855712890625, 0.215576171875, 0.22259521484375, 0.2296142578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 16.0, 19.0, 28.0, 40.0, 77.0, 122.0, 250.0, 488.0, 1004.0, 2812.0, 9748.0, 39841.0, 212664.0, 603277.0, 138179.0, 28794.0, 7348.0, 2165.0, 809.0, 359.0, 213.0, 96.0, 73.0, 42.0, 24.0, 21.0, 11.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7314834594726562, -0.6988067626953125, -0.6661300659179688, -0.633453369140625, -0.6007766723632812, -0.5680999755859375, -0.5354232788085938, -0.50274658203125, -0.47006988525390625, -0.4373931884765625, -0.40471649169921875, -0.372039794921875, -0.33936309814453125, -0.3066864013671875, -0.27400970458984375, -0.2413330078125, -0.20865631103515625, -0.1759796142578125, -0.14330291748046875, -0.110626220703125, -0.07794952392578125, -0.0452728271484375, -0.01259613037109375, 0.02008056640625, 0.05275726318359375, 0.0854339599609375, 0.11811065673828125, 0.150787353515625, 0.18346405029296875, 0.2161407470703125, 0.24881744384765625, 0.281494140625, 0.31417083740234375, 0.3468475341796875, 0.37952423095703125, 0.412200927734375, 0.44487762451171875, 0.4775543212890625, 0.5102310180664062, 0.54290771484375, 0.5755844116210938, 0.6082611083984375, 0.6409378051757812, 0.673614501953125, 0.7062911987304688, 0.7389678955078125, 0.7716445922851562, 0.8043212890625, 0.8369979858398438, 0.8696746826171875, 0.9023513793945312, 0.935028076171875, 0.9677047729492188, 1.0003814697265625, 1.0330581665039062, 1.06573486328125, 1.0984115600585938, 1.1310882568359375, 1.1637649536132812, 1.196441650390625, 1.2291183471679688, 1.2617950439453125, 1.2944717407226562, 1.3271484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 4.0, 1.0, 2.0, 8.0, 4.0, 8.0, 10.0, 7.0, 15.0, 18.0, 22.0, 26.0, 35.0, 26.0, 33.0, 43.0, 29.0, 45.0, 42.0, 59.0, 53.0, 39.0, 47.0, 58.0, 47.0, 34.0, 43.0, 29.0, 19.0, 29.0, 39.0, 15.0, 20.0, 18.0, 10.0, 17.0, 11.0, 11.0, 5.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6632537841796875, -0.640472412109375, -0.6176910400390625, -0.59490966796875, -0.5721282958984375, -0.549346923828125, -0.5265655517578125, -0.5037841796875, -0.4810028076171875, -0.458221435546875, -0.4354400634765625, -0.41265869140625, -0.3898773193359375, -0.367095947265625, -0.3443145751953125, -0.321533203125, -0.2987518310546875, -0.275970458984375, -0.2531890869140625, -0.23040771484375, -0.2076263427734375, -0.184844970703125, -0.1620635986328125, -0.1392822265625, -0.1165008544921875, -0.093719482421875, -0.0709381103515625, -0.04815673828125, -0.0253753662109375, -0.002593994140625, 0.0201873779296875, 0.04296875, 0.0657501220703125, 0.088531494140625, 0.1113128662109375, 0.13409423828125, 0.1568756103515625, 0.179656982421875, 0.2024383544921875, 0.2252197265625, 0.2480010986328125, 0.270782470703125, 0.2935638427734375, 0.31634521484375, 0.3391265869140625, 0.361907958984375, 0.3846893310546875, 0.407470703125, 0.4302520751953125, 0.453033447265625, 0.4758148193359375, 0.49859619140625, 0.5213775634765625, 0.544158935546875, 0.5669403076171875, 0.5897216796875, 0.6125030517578125, 0.635284423828125, 0.6580657958984375, 0.68084716796875, 0.7036285400390625, 0.726409912109375, 0.7491912841796875, 0.77197265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 14.0, 27.0, 36.0, 75.0, 151.0, 279.0, 553.0, 1208.0, 3169.0, 8109.0, 22953.0, 79410.0, 340087.0, 436739.0, 109034.0, 29835.0, 10205.0, 3822.0, 1438.0, 679.0, 327.0, 157.0, 92.0, 50.0, 39.0, 23.0, 12.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2936267852783203, -0.2854957580566406, -0.27736473083496094, -0.26923370361328125, -0.26110267639160156, -0.2529716491699219, -0.2448406219482422, -0.2367095947265625, -0.2285785675048828, -0.22044754028320312, -0.21231651306152344, -0.20418548583984375, -0.19605445861816406, -0.18792343139648438, -0.1797924041748047, -0.171661376953125, -0.1635303497314453, -0.15539932250976562, -0.14726829528808594, -0.13913726806640625, -0.13100624084472656, -0.12287521362304688, -0.11474418640136719, -0.1066131591796875, -0.09848213195800781, -0.09035110473632812, -0.08222007751464844, -0.07408905029296875, -0.06595802307128906, -0.057826995849609375, -0.04969596862792969, -0.04156494140625, -0.03343391418457031, -0.025302886962890625, -0.017171859741210938, -0.00904083251953125, -0.0009098052978515625, 0.007221221923828125, 0.015352249145507812, 0.0234832763671875, 0.03161430358886719, 0.039745330810546875, 0.04787635803222656, 0.05600738525390625, 0.06413841247558594, 0.07226943969726562, 0.08040046691894531, 0.088531494140625, 0.09666252136230469, 0.10479354858398438, 0.11292457580566406, 0.12105560302734375, 0.12918663024902344, 0.13731765747070312, 0.1454486846923828, 0.1535797119140625, 0.1617107391357422, 0.16984176635742188, 0.17797279357910156, 0.18610382080078125, 0.19423484802246094, 0.20236587524414062, 0.2104969024658203, 0.2186279296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 4.0, 14.0, 11.0, 18.0, 32.0, 34.0, 70.0, 99.0, 134.0, 170.0, 124.0, 85.0, 53.0, 34.0, 22.0, 15.0, 17.0, 9.0, 4.0, 5.0, 7.0, 4.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.07046890258789e-05, -7.820315659046173e-05, -7.570162415504456e-05, -7.320009171962738e-05, -7.06985592842102e-05, -6.819702684879303e-05, -6.569549441337585e-05, -6.319396197795868e-05, -6.0692429542541504e-05, -5.819089710712433e-05, -5.568936467170715e-05, -5.318783223628998e-05, -5.06862998008728e-05, -4.818476736545563e-05, -4.568323493003845e-05, -4.318170249462128e-05, -4.06801700592041e-05, -3.8178637623786926e-05, -3.567710518836975e-05, -3.3175572752952576e-05, -3.06740403175354e-05, -2.8172507882118225e-05, -2.567097544670105e-05, -2.3169443011283875e-05, -2.06679105758667e-05, -1.8166378140449524e-05, -1.566484570503235e-05, -1.3163313269615173e-05, -1.0661780834197998e-05, -8.160248398780823e-06, -5.6587159633636475e-06, -3.157183527946472e-06, -6.556510925292969e-07, 1.8458813428878784e-06, 4.347413778305054e-06, 6.848946213722229e-06, 9.350478649139404e-06, 1.185201108455658e-05, 1.4353543519973755e-05, 1.685507595539093e-05, 1.9356608390808105e-05, 2.185814082622528e-05, 2.4359673261642456e-05, 2.686120569705963e-05, 2.9362738132476807e-05, 3.186427056789398e-05, 3.436580300331116e-05, 3.686733543872833e-05, 3.936886787414551e-05, 4.187040030956268e-05, 4.437193274497986e-05, 4.6873465180397034e-05, 4.937499761581421e-05, 5.1876530051231384e-05, 5.437806248664856e-05, 5.6879594922065735e-05, 5.938112735748291e-05, 6.188265979290009e-05, 6.438419222831726e-05, 6.688572466373444e-05, 6.938725709915161e-05, 7.188878953456879e-05, 7.439032196998596e-05, 7.689185440540314e-05, 7.939338684082031e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 7.0, 6.0, 7.0, 5.0, 12.0, 21.0, 28.0, 35.0, 63.0, 76.0, 150.0, 182.0, 299.0, 511.0, 806.0, 1686.0, 3543.0, 8016.0, 19666.0, 53594.0, 146844.0, 343560.0, 289629.0, 111796.0, 40333.0, 15307.0, 6198.0, 2857.0, 1378.0, 728.0, 438.0, 253.0, 160.0, 105.0, 62.0, 59.0, 38.0, 29.0, 18.0, 12.0, 14.0, 5.0, 6.0, 7.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.170654296875, -0.1652984619140625, -0.159942626953125, -0.1545867919921875, -0.14923095703125, -0.1438751220703125, -0.138519287109375, -0.1331634521484375, -0.1278076171875, -0.1224517822265625, -0.117095947265625, -0.1117401123046875, -0.10638427734375, -0.1010284423828125, -0.095672607421875, -0.0903167724609375, -0.0849609375, -0.0796051025390625, -0.074249267578125, -0.0688934326171875, -0.06353759765625, -0.0581817626953125, -0.052825927734375, -0.0474700927734375, -0.0421142578125, -0.0367584228515625, -0.031402587890625, -0.0260467529296875, -0.02069091796875, -0.0153350830078125, -0.009979248046875, -0.0046234130859375, 0.000732421875, 0.0060882568359375, 0.011444091796875, 0.0167999267578125, 0.02215576171875, 0.0275115966796875, 0.032867431640625, 0.0382232666015625, 0.0435791015625, 0.0489349365234375, 0.054290771484375, 0.0596466064453125, 0.06500244140625, 0.0703582763671875, 0.075714111328125, 0.0810699462890625, 0.08642578125, 0.0917816162109375, 0.097137451171875, 0.1024932861328125, 0.10784912109375, 0.1132049560546875, 0.118560791015625, 0.1239166259765625, 0.1292724609375, 0.1346282958984375, 0.139984130859375, 0.1453399658203125, 0.15069580078125, 0.1560516357421875, 0.161407470703125, 0.1667633056640625, 0.172119140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 6.0, 13.0, 15.0, 19.0, 31.0, 38.0, 55.0, 61.0, 85.0, 72.0, 110.0, 94.0, 91.0, 66.0, 36.0, 42.0, 34.0, 35.0, 14.0, 18.0, 12.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.21875, -0.21225357055664062, -0.20575714111328125, -0.19926071166992188, -0.1927642822265625, -0.18626785278320312, -0.17977142333984375, -0.17327499389648438, -0.166778564453125, -0.16028213500976562, -0.15378570556640625, -0.14728927612304688, -0.1407928466796875, -0.13429641723632812, -0.12779998779296875, -0.12130355834960938, -0.11480712890625, -0.10831069946289062, -0.10181427001953125, -0.09531784057617188, -0.0888214111328125, -0.08232498168945312, -0.07582855224609375, -0.06933212280273438, -0.062835693359375, -0.056339263916015625, -0.04984283447265625, -0.043346405029296875, -0.0368499755859375, -0.030353546142578125, -0.02385711669921875, -0.017360687255859375, -0.0108642578125, -0.004367828369140625, 0.00212860107421875, 0.008625030517578125, 0.0151214599609375, 0.021617889404296875, 0.02811431884765625, 0.034610748291015625, 0.041107177734375, 0.047603607177734375, 0.05410003662109375, 0.060596466064453125, 0.0670928955078125, 0.07358932495117188, 0.08008575439453125, 0.08658218383789062, 0.09307861328125, 0.09957504272460938, 0.10607147216796875, 0.11256790161132812, 0.1190643310546875, 0.12556076049804688, 0.13205718994140625, 0.13855361938476562, 0.145050048828125, 0.15154647827148438, 0.15804290771484375, 0.16453933715820312, 0.1710357666015625, 0.17753219604492188, 0.18402862548828125, 0.19052505493164062, 0.197021484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 10.0, 25.0, 35.0, 49.0, 71.0, 138.0, 137.0, 156.0, 123.0, 79.0, 69.0, 40.0, 17.0, 12.0, 10.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.483091354370117, -3.380591630935669, -3.2780919075012207, -3.1755921840667725, -3.073092460632324, -2.970592975616455, -2.868093252182007, -2.7655935287475586, -2.6630938053131104, -2.560594081878662, -2.458094358444214, -2.3555946350097656, -2.2530951499938965, -2.150595188140869, -2.048095703125, -1.9455959796905518, -1.8430962562561035, -1.7405965328216553, -1.638096809387207, -1.5355972051620483, -1.4330974817276, -1.3305977582931519, -1.2280981540679932, -1.125598430633545, -1.0230987071990967, -0.9205989837646484, -0.818099319934845, -0.7155996561050415, -0.6130999326705933, -0.510600209236145, -0.40810054540634155, -0.3056008815765381, -0.20310115814208984, -0.10060146450996399, 0.0018982291221618652, 0.10439792275428772, 0.20689761638641357, 0.3093973398208618, 0.4118970036506653, 0.5143966674804688, 0.616896390914917, 0.7193961143493652, 0.8218957781791687, 0.9243954420089722, 1.0268951654434204, 1.1293948888778687, 1.2318944931030273, 1.3343942165374756, 1.4368939399719238, 1.539393663406372, 1.6418933868408203, 1.744392991065979, 1.8468927145004272, 1.9493924379348755, 2.051892042160034, 2.1543917655944824, 2.2568914890289307, 2.359391212463379, 2.461890935897827, 2.5643906593322754, 2.6668901443481445, 2.769390106201172, 2.871889591217041, 2.9743893146514893, 3.0768890380859375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 8.0, 5.0, 6.0, 6.0, 10.0, 10.0, 14.0, 23.0, 17.0, 15.0, 30.0, 14.0, 21.0, 32.0, 41.0, 28.0, 34.0, 46.0, 31.0, 38.0, 42.0, 43.0, 35.0, 34.0, 44.0, 36.0, 33.0, 34.0, 32.0, 32.0, 28.0, 20.0, 34.0, 20.0, 22.0, 19.0, 15.0, 8.0, 7.0, 11.0, 4.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5926952362060547, -1.5439839363098145, -1.4952726364135742, -1.446561336517334, -1.3978500366210938, -1.3491387367248535, -1.3004274368286133, -1.251716136932373, -1.2030048370361328, -1.1542935371398926, -1.1055822372436523, -1.056870937347412, -1.0081596374511719, -0.9594483375549316, -0.9107370972633362, -0.862025797367096, -0.8133145570755005, -0.7646032571792603, -0.71589195728302, -0.6671806573867798, -0.6184693574905396, -0.5697580575942993, -0.5210468173027039, -0.4723355174064636, -0.4236242175102234, -0.37491291761398315, -0.3262016177177429, -0.2774903476238251, -0.22877904772758484, -0.1800677478313446, -0.13135647773742676, -0.08264517784118652, -0.03393387794494629, 0.014777414500713348, 0.06348870694637299, 0.11219999194145203, 0.16091129183769226, 0.2096225917339325, 0.25833386182785034, 0.3070451617240906, 0.3557564616203308, 0.40446776151657104, 0.4531790614128113, 0.5018903017044067, 0.550601601600647, 0.5993129014968872, 0.6480242013931274, 0.6967355012893677, 0.7454468011856079, 0.7941581010818481, 0.8428694009780884, 0.8915807008743286, 0.9402920007705688, 0.9890033006668091, 1.0377144813537598, 1.08642578125, 1.1351370811462402, 1.1838483810424805, 1.2325596809387207, 1.281270980834961, 1.3299822807312012, 1.3786935806274414, 1.4274048805236816, 1.4761161804199219, 1.524827480316162]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 16.0, 16.0, 35.0, 49.0, 55.0, 97.0, 149.0, 262.0, 363.0, 628.0, 1054.0, 1788.0, 3155.0, 5302.0, 9695.0, 17341.0, 33286.0, 64913.0, 138774.0, 329430.0, 812590.0, 1324185.0, 834153.0, 339431.0, 139769.0, 65273.0, 32890.0, 17243.0, 9412.0, 5251.0, 3051.0, 1781.0, 1110.0, 638.0, 401.0, 239.0, 140.0, 99.0, 69.0, 43.0, 31.0, 26.0, 12.0, 8.0, 6.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.2005615234375, -0.1939868927001953, -0.18741226196289062, -0.18083763122558594, -0.17426300048828125, -0.16768836975097656, -0.16111373901367188, -0.1545391082763672, -0.1479644775390625, -0.1413898468017578, -0.13481521606445312, -0.12824058532714844, -0.12166595458984375, -0.11509132385253906, -0.10851669311523438, -0.10194206237792969, -0.095367431640625, -0.08879280090332031, -0.08221817016601562, -0.07564353942871094, -0.06906890869140625, -0.06249427795410156, -0.055919647216796875, -0.04934501647949219, -0.0427703857421875, -0.03619575500488281, -0.029621124267578125, -0.023046493530273438, -0.01647186279296875, -0.009897232055664062, -0.003322601318359375, 0.0032520294189453125, 0.00982666015625, 0.016401290893554688, 0.022975921630859375, 0.029550552368164062, 0.03612518310546875, 0.04269981384277344, 0.049274444580078125, 0.05584907531738281, 0.0624237060546875, 0.06899833679199219, 0.07557296752929688, 0.08214759826660156, 0.08872222900390625, 0.09529685974121094, 0.10187149047851562, 0.10844612121582031, 0.115020751953125, 0.12159538269042969, 0.12817001342773438, 0.13474464416503906, 0.14131927490234375, 0.14789390563964844, 0.15446853637695312, 0.1610431671142578, 0.1676177978515625, 0.1741924285888672, 0.18076705932617188, 0.18734169006347656, 0.19391632080078125, 0.20049095153808594, 0.20706558227539062, 0.2136402130126953, 0.22021484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 7.0, 5.0, 7.0, 4.0, 12.0, 12.0, 18.0, 24.0, 28.0, 25.0, 25.0, 37.0, 29.0, 22.0, 34.0, 38.0, 27.0, 40.0, 42.0, 37.0, 44.0, 38.0, 40.0, 34.0, 42.0, 44.0, 37.0, 26.0, 26.0, 30.0, 25.0, 25.0, 28.0, 17.0, 8.0, 15.0, 12.0, 7.0, 6.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.170166015625, -0.16399765014648438, -0.15782928466796875, -0.15166091918945312, -0.1454925537109375, -0.13932418823242188, -0.13315582275390625, -0.12698745727539062, -0.120819091796875, -0.11465072631835938, -0.10848236083984375, -0.10231399536132812, -0.0961456298828125, -0.08997726440429688, -0.08380889892578125, -0.07764053344726562, -0.07147216796875, -0.06530380249023438, -0.05913543701171875, -0.052967071533203125, -0.0467987060546875, -0.040630340576171875, -0.03446197509765625, -0.028293609619140625, -0.022125244140625, -0.015956878662109375, -0.00978851318359375, -0.003620147705078125, 0.0025482177734375, 0.008716583251953125, 0.01488494873046875, 0.021053314208984375, 0.0272216796875, 0.033390045166015625, 0.03955841064453125, 0.045726776123046875, 0.0518951416015625, 0.058063507080078125, 0.06423187255859375, 0.07040023803710938, 0.076568603515625, 0.08273696899414062, 0.08890533447265625, 0.09507369995117188, 0.1012420654296875, 0.10741043090820312, 0.11357879638671875, 0.11974716186523438, 0.12591552734375, 0.13208389282226562, 0.13825225830078125, 0.14442062377929688, 0.1505889892578125, 0.15675735473632812, 0.16292572021484375, 0.16909408569335938, 0.175262451171875, 0.18143081665039062, 0.18759918212890625, 0.19376754760742188, 0.1999359130859375, 0.20610427856445312, 0.21227264404296875, 0.21844100952148438, 0.224609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 11.0, 15.0, 27.0, 26.0, 44.0, 58.0, 98.0, 120.0, 163.0, 284.0, 409.0, 703.0, 1188.0, 2456.0, 5112.0, 12398.0, 34283.0, 104178.0, 350703.0, 1561199.0, 1597131.0, 358796.0, 106474.0, 34875.0, 12679.0, 5304.0, 2449.0, 1178.0, 676.0, 414.0, 265.0, 178.0, 129.0, 67.0, 47.0, 41.0, 31.0, 22.0, 14.0, 15.0, 6.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.431884765625, -0.4183921813964844, -0.40489959716796875, -0.3914070129394531, -0.3779144287109375, -0.3644218444824219, -0.35092926025390625, -0.3374366760253906, -0.323944091796875, -0.3104515075683594, -0.29695892333984375, -0.2834663391113281, -0.2699737548828125, -0.2564811706542969, -0.24298858642578125, -0.22949600219726562, -0.21600341796875, -0.20251083374023438, -0.18901824951171875, -0.17552566528320312, -0.1620330810546875, -0.14854049682617188, -0.13504791259765625, -0.12155532836914062, -0.108062744140625, -0.09457015991210938, -0.08107757568359375, -0.06758499145507812, -0.0540924072265625, -0.040599822998046875, -0.02710723876953125, -0.013614654541015625, -0.0001220703125, 0.013370513916015625, 0.02686309814453125, 0.040355682373046875, 0.0538482666015625, 0.06734085083007812, 0.08083343505859375, 0.09432601928710938, 0.107818603515625, 0.12131118774414062, 0.13480377197265625, 0.14829635620117188, 0.1617889404296875, 0.17528152465820312, 0.18877410888671875, 0.20226669311523438, 0.21575927734375, 0.22925186157226562, 0.24274444580078125, 0.2562370300292969, 0.2697296142578125, 0.2832221984863281, 0.29671478271484375, 0.3102073669433594, 0.323699951171875, 0.3371925354003906, 0.35068511962890625, 0.3641777038574219, 0.3776702880859375, 0.3911628723144531, 0.40465545654296875, 0.4181480407714844, 0.431640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 1.0, 3.0, 8.0, 8.0, 8.0, 11.0, 14.0, 11.0, 8.0, 22.0, 35.0, 32.0, 29.0, 33.0, 52.0, 71.0, 79.0, 107.0, 106.0, 141.0, 168.0, 226.0, 283.0, 365.0, 389.0, 325.0, 290.0, 237.0, 179.0, 157.0, 127.0, 97.0, 87.0, 71.0, 50.0, 44.0, 41.0, 31.0, 20.0, 16.0, 22.0, 8.0, 9.0, 12.0, 12.0, 10.0, 5.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.3193359375, -0.30954742431640625, -0.2997589111328125, -0.28997039794921875, -0.280181884765625, -0.27039337158203125, -0.2606048583984375, -0.25081634521484375, -0.24102783203125, -0.23123931884765625, -0.2214508056640625, -0.21166229248046875, -0.201873779296875, -0.19208526611328125, -0.1822967529296875, -0.17250823974609375, -0.1627197265625, -0.15293121337890625, -0.1431427001953125, -0.13335418701171875, -0.123565673828125, -0.11377716064453125, -0.1039886474609375, -0.09420013427734375, -0.08441162109375, -0.07462310791015625, -0.0648345947265625, -0.05504608154296875, -0.045257568359375, -0.03546905517578125, -0.0256805419921875, -0.01589202880859375, -0.006103515625, 0.00368499755859375, 0.0134735107421875, 0.02326202392578125, 0.033050537109375, 0.04283905029296875, 0.0526275634765625, 0.06241607666015625, 0.07220458984375, 0.08199310302734375, 0.0917816162109375, 0.10157012939453125, 0.111358642578125, 0.12114715576171875, 0.1309356689453125, 0.14072418212890625, 0.1505126953125, 0.16030120849609375, 0.1700897216796875, 0.17987823486328125, 0.189666748046875, 0.19945526123046875, 0.2092437744140625, 0.21903228759765625, 0.22882080078125, 0.23860931396484375, 0.2483978271484375, 0.25818634033203125, 0.267974853515625, 0.27776336669921875, 0.2875518798828125, 0.29734039306640625, 0.30712890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 8.0, 28.0, 37.0, 78.0, 117.0, 136.0, 192.0, 138.0, 116.0, 75.0, 28.0, 22.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.516013145446777, -4.381528854370117, -4.247044086456299, -4.112559795379639, -3.9780752658843994, -3.84359073638916, -3.7091064453125, -3.5746219158172607, -3.4401373863220215, -3.3056528568267822, -3.171168565750122, -3.036684036254883, -2.9021995067596436, -2.7677149772644043, -2.633230686187744, -2.498746156692505, -2.3642618656158447, -2.2297773361206055, -2.0952930450439453, -1.960808515548706, -1.8263239860534668, -1.691839575767517, -1.5573551654815674, -1.4228706359863281, -1.2883862257003784, -1.1539018154144287, -1.0194172859191895, -0.8849328756332397, -0.7504484057426453, -0.6159639358520508, -0.4814795255661011, -0.3469950556755066, -0.2125105857849121, -0.07802613079547882, 0.05645832419395447, 0.19094276428222656, 0.32542723417282104, 0.4599117040634155, 0.5943961143493652, 0.7288805842399597, 0.8633650541305542, 0.9978495240211487, 1.1323339939117432, 1.2668184041976929, 1.4013028144836426, 1.5357873439788818, 1.6702717542648315, 1.8047561645507812, 1.9392406940460205, 2.0737252235412598, 2.20820951461792, 2.342694044113159, 2.4771785736083984, 2.6116628646850586, 2.746147394180298, 2.880631923675537, 3.0151162147521973, 3.1496007442474365, 3.2840850353240967, 3.418569564819336, 3.553054094314575, 3.6875386238098145, 3.8220229148864746, 3.956507444381714, 4.090991973876953]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 9.0, 4.0, 7.0, 8.0, 11.0, 16.0, 15.0, 15.0, 20.0, 20.0, 24.0, 25.0, 22.0, 36.0, 31.0, 32.0, 30.0, 30.0, 38.0, 35.0, 44.0, 57.0, 33.0, 43.0, 37.0, 31.0, 29.0, 38.0, 22.0, 40.0, 20.0, 35.0, 22.0, 19.0, 10.0, 22.0, 12.0, 12.0, 7.0, 6.0, 3.0, 6.0, 6.0, 5.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.4504894018173218, -1.4076894521713257, -1.36488938331604, -1.322089433670044, -1.2792894840240479, -1.2364894151687622, -1.1936894655227661, -1.1508893966674805, -1.1080894470214844, -1.0652894973754883, -1.0224894285202026, -0.9796894788742065, -0.9368894696235657, -0.8940894603729248, -0.8512895107269287, -0.8084895014762878, -0.7656895518302917, -0.7228895425796509, -0.6800895929336548, -0.6372895836830139, -0.594489574432373, -0.551689624786377, -0.5088896155357361, -0.4660896062850952, -0.42328962683677673, -0.38048964738845825, -0.3376896381378174, -0.2948896586894989, -0.2520896792411804, -0.20928966999053955, -0.16648969054222107, -0.1236896812915802, -0.08088970184326172, -0.03808971121907234, 0.004710279405117035, 0.04751026630401611, 0.09031026065349579, 0.13311025500297546, 0.17591023445129395, 0.21871024370193481, 0.2615102231502533, 0.3043102025985718, 0.34711021184921265, 0.38991019129753113, 0.4327101707458496, 0.4755101799964905, 0.5183101892471313, 0.5611101388931274, 0.6039101481437683, 0.6467101573944092, 0.6895101070404053, 0.7323101162910461, 0.775110125541687, 0.8179100751876831, 0.860710084438324, 0.9035100936889648, 0.9463100433349609, 0.9891100525856018, 1.0319100618362427, 1.0747100114822388, 1.1175099611282349, 1.1603100299835205, 1.2031099796295166, 1.2459099292755127, 1.2887099981307983]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 14.0, 22.0, 35.0, 63.0, 82.0, 138.0, 194.0, 327.0, 518.0, 925.0, 1622.0, 2916.0, 5078.0, 9421.0, 17713.0, 33509.0, 61700.0, 107216.0, 161197.0, 193751.0, 173283.0, 121252.0, 71924.0, 39145.0, 21061.0, 11280.0, 6134.0, 3361.0, 1919.0, 1072.0, 642.0, 379.0, 228.0, 162.0, 78.0, 62.0, 43.0, 19.0, 12.0, 6.0, 3.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22093772888183594, -0.21348190307617188, -0.2060260772705078, -0.19857025146484375, -0.1911144256591797, -0.18365859985351562, -0.17620277404785156, -0.1687469482421875, -0.16129112243652344, -0.15383529663085938, -0.1463794708251953, -0.13892364501953125, -0.1314678192138672, -0.12401199340820312, -0.11655616760253906, -0.109100341796875, -0.10164451599121094, -0.09418869018554688, -0.08673286437988281, -0.07927703857421875, -0.07182121276855469, -0.06436538696289062, -0.05690956115722656, -0.0494537353515625, -0.04199790954589844, -0.034542083740234375, -0.027086257934570312, -0.01963043212890625, -0.012174606323242188, -0.004718780517578125, 0.0027370452880859375, 0.01019287109375, 0.017648696899414062, 0.025104522705078125, 0.03256034851074219, 0.04001617431640625, 0.04747200012207031, 0.054927825927734375, 0.06238365173339844, 0.0698394775390625, 0.07729530334472656, 0.08475112915039062, 0.09220695495605469, 0.09966278076171875, 0.10711860656738281, 0.11457443237304688, 0.12203025817871094, 0.129486083984375, 0.13694190979003906, 0.14439773559570312, 0.1518535614013672, 0.15930938720703125, 0.1667652130126953, 0.17422103881835938, 0.18167686462402344, 0.1891326904296875, 0.19658851623535156, 0.20404434204101562, 0.2115001678466797, 0.21895599365234375, 0.2264118194580078, 0.23386764526367188, 0.24132347106933594, 0.248779296875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 13.0, 13.0, 17.0, 12.0, 12.0, 25.0, 25.0, 29.0, 37.0, 22.0, 36.0, 34.0, 46.0, 42.0, 33.0, 46.0, 45.0, 46.0, 46.0, 43.0, 33.0, 36.0, 34.0, 37.0, 28.0, 33.0, 30.0, 19.0, 14.0, 15.0, 24.0, 12.0, 17.0, 9.0, 6.0, 2.0, 6.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1800537109375, -0.1735706329345703, -0.16708755493164062, -0.16060447692871094, -0.15412139892578125, -0.14763832092285156, -0.14115524291992188, -0.1346721649169922, -0.1281890869140625, -0.12170600891113281, -0.11522293090820312, -0.10873985290527344, -0.10225677490234375, -0.09577369689941406, -0.08929061889648438, -0.08280754089355469, -0.076324462890625, -0.06984138488769531, -0.06335830688476562, -0.05687522888183594, -0.05039215087890625, -0.04390907287597656, -0.037425994873046875, -0.030942916870117188, -0.0244598388671875, -0.017976760864257812, -0.011493682861328125, -0.0050106048583984375, 0.00147247314453125, 0.007955551147460938, 0.014438629150390625, 0.020921707153320312, 0.02740478515625, 0.03388786315917969, 0.040370941162109375, 0.04685401916503906, 0.05333709716796875, 0.05982017517089844, 0.06630325317382812, 0.07278633117675781, 0.0792694091796875, 0.08575248718261719, 0.09223556518554688, 0.09871864318847656, 0.10520172119140625, 0.11168479919433594, 0.11816787719726562, 0.12465095520019531, 0.131134033203125, 0.1376171112060547, 0.14410018920898438, 0.15058326721191406, 0.15706634521484375, 0.16354942321777344, 0.17003250122070312, 0.1765155792236328, 0.1829986572265625, 0.1894817352294922, 0.19596481323242188, 0.20244789123535156, 0.20893096923828125, 0.21541404724121094, 0.22189712524414062, 0.2283802032470703, 0.23486328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 6.0, 15.0, 20.0, 24.0, 38.0, 65.0, 105.0, 222.0, 504.0, 1119.0, 3552.0, 12621.0, 53089.0, 231107.0, 469576.0, 211662.0, 48124.0, 11421.0, 3288.0, 1111.0, 370.0, 226.0, 102.0, 56.0, 38.0, 32.0, 19.0, 8.0, 6.0, 5.0, 5.0, 4.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.572265625, -0.5534820556640625, -0.534698486328125, -0.5159149169921875, -0.49713134765625, -0.4783477783203125, -0.459564208984375, -0.4407806396484375, -0.4219970703125, -0.4032135009765625, -0.384429931640625, -0.3656463623046875, -0.34686279296875, -0.3280792236328125, -0.309295654296875, -0.2905120849609375, -0.271728515625, -0.2529449462890625, -0.234161376953125, -0.2153778076171875, -0.19659423828125, -0.1778106689453125, -0.159027099609375, -0.1402435302734375, -0.1214599609375, -0.1026763916015625, -0.083892822265625, -0.0651092529296875, -0.04632568359375, -0.0275421142578125, -0.008758544921875, 0.0100250244140625, 0.02880859375, 0.0475921630859375, 0.066375732421875, 0.0851593017578125, 0.10394287109375, 0.1227264404296875, 0.141510009765625, 0.1602935791015625, 0.1790771484375, 0.1978607177734375, 0.216644287109375, 0.2354278564453125, 0.25421142578125, 0.2729949951171875, 0.291778564453125, 0.3105621337890625, 0.329345703125, 0.3481292724609375, 0.366912841796875, 0.3856964111328125, 0.40447998046875, 0.4232635498046875, 0.442047119140625, 0.4608306884765625, 0.4796142578125, 0.4983978271484375, 0.517181396484375, 0.5359649658203125, 0.55474853515625, 0.5735321044921875, 0.592315673828125, 0.6110992431640625, 0.6298828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 4.0, 7.0, 9.0, 9.0, 15.0, 16.0, 21.0, 16.0, 27.0, 32.0, 26.0, 41.0, 32.0, 43.0, 43.0, 40.0, 43.0, 50.0, 49.0, 32.0, 51.0, 41.0, 48.0, 47.0, 25.0, 24.0, 31.0, 31.0, 21.0, 15.0, 29.0, 18.0, 6.0, 7.0, 13.0, 6.0, 4.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.65673828125, -0.6382064819335938, -0.6196746826171875, -0.6011428833007812, -0.582611083984375, -0.5640792846679688, -0.5455474853515625, -0.5270156860351562, -0.50848388671875, -0.48995208740234375, -0.4714202880859375, -0.45288848876953125, -0.434356689453125, -0.41582489013671875, -0.3972930908203125, -0.37876129150390625, -0.3602294921875, -0.34169769287109375, -0.3231658935546875, -0.30463409423828125, -0.286102294921875, -0.26757049560546875, -0.2490386962890625, -0.23050689697265625, -0.21197509765625, -0.19344329833984375, -0.1749114990234375, -0.15637969970703125, -0.137847900390625, -0.11931610107421875, -0.1007843017578125, -0.08225250244140625, -0.063720703125, -0.04518890380859375, -0.0266571044921875, -0.00812530517578125, 0.010406494140625, 0.02893829345703125, 0.0474700927734375, 0.06600189208984375, 0.08453369140625, 0.10306549072265625, 0.1215972900390625, 0.14012908935546875, 0.158660888671875, 0.17719268798828125, 0.1957244873046875, 0.21425628662109375, 0.2327880859375, 0.25131988525390625, 0.2698516845703125, 0.28838348388671875, 0.306915283203125, 0.32544708251953125, 0.3439788818359375, 0.36251068115234375, 0.38104248046875, 0.39957427978515625, 0.4181060791015625, 0.43663787841796875, 0.455169677734375, 0.47370147705078125, 0.4922332763671875, 0.5107650756835938, 0.529296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 18.0, 27.0, 36.0, 35.0, 49.0, 113.0, 142.0, 247.0, 330.0, 604.0, 1057.0, 1818.0, 3542.0, 7103.0, 15579.0, 36163.0, 85685.0, 183725.0, 274149.0, 227294.0, 118487.0, 50960.0, 21529.0, 9552.0, 4707.0, 2306.0, 1259.0, 784.0, 439.0, 282.0, 173.0, 120.0, 89.0, 45.0, 28.0, 26.0, 18.0, 8.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.12944984436035156, -0.12523269653320312, -0.12101554870605469, -0.11679840087890625, -0.11258125305175781, -0.10836410522460938, -0.10414695739746094, -0.0999298095703125, -0.09571266174316406, -0.09149551391601562, -0.08727836608886719, -0.08306121826171875, -0.07884407043457031, -0.07462692260742188, -0.07040977478027344, -0.066192626953125, -0.06197547912597656, -0.057758331298828125, -0.05354118347167969, -0.04932403564453125, -0.04510688781738281, -0.040889739990234375, -0.03667259216308594, -0.0324554443359375, -0.028238296508789062, -0.024021148681640625, -0.019804000854492188, -0.01558685302734375, -0.011369705200195312, -0.007152557373046875, -0.0029354095458984375, 0.00128173828125, 0.0054988861083984375, 0.009716033935546875, 0.013933181762695312, 0.01815032958984375, 0.022367477416992188, 0.026584625244140625, 0.030801773071289062, 0.0350189208984375, 0.03923606872558594, 0.043453216552734375, 0.04767036437988281, 0.05188751220703125, 0.05610466003417969, 0.060321807861328125, 0.06453895568847656, 0.068756103515625, 0.07297325134277344, 0.07719039916992188, 0.08140754699707031, 0.08562469482421875, 0.08984184265136719, 0.09405899047851562, 0.09827613830566406, 0.1024932861328125, 0.10671043395996094, 0.11092758178710938, 0.11514472961425781, 0.11936187744140625, 0.12357902526855469, 0.12779617309570312, 0.13201332092285156, 0.13623046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 13.0, 11.0, 12.0, 25.0, 26.0, 38.0, 42.0, 43.0, 53.0, 66.0, 75.0, 70.0, 77.0, 72.0, 68.0, 60.0, 47.0, 47.0, 36.0, 23.0, 21.0, 16.0, 16.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3511390686035156e-05, -4.224199801683426e-05, -4.097260534763336e-05, -3.9703212678432465e-05, -3.843382000923157e-05, -3.716442734003067e-05, -3.589503467082977e-05, -3.4625642001628876e-05, -3.335624933242798e-05, -3.208685666322708e-05, -3.0817463994026184e-05, -2.9548071324825287e-05, -2.827867865562439e-05, -2.7009285986423492e-05, -2.5739893317222595e-05, -2.4470500648021698e-05, -2.32011079788208e-05, -2.1931715309619904e-05, -2.0662322640419006e-05, -1.939292997121811e-05, -1.8123537302017212e-05, -1.6854144632816315e-05, -1.5584751963615417e-05, -1.431535929441452e-05, -1.3045966625213623e-05, -1.1776573956012726e-05, -1.0507181286811829e-05, -9.237788617610931e-06, -7.968395948410034e-06, -6.699003279209137e-06, -5.42961061000824e-06, -4.1602179408073425e-06, -2.8908252716064453e-06, -1.621432602405548e-06, -3.520399332046509e-07, 9.173527359962463e-07, 2.1867454051971436e-06, 3.4561380743980408e-06, 4.725530743598938e-06, 5.994923412799835e-06, 7.264316082000732e-06, 8.53370875120163e-06, 9.803101420402527e-06, 1.1072494089603424e-05, 1.2341886758804321e-05, 1.3611279428005219e-05, 1.4880672097206116e-05, 1.6150064766407013e-05, 1.741945743560791e-05, 1.8688850104808807e-05, 1.9958242774009705e-05, 2.1227635443210602e-05, 2.24970281124115e-05, 2.3766420781612396e-05, 2.5035813450813293e-05, 2.630520612001419e-05, 2.7574598789215088e-05, 2.8843991458415985e-05, 3.0113384127616882e-05, 3.138277679681778e-05, 3.265216946601868e-05, 3.3921562135219574e-05, 3.519095480442047e-05, 3.646034747362137e-05, 3.7729740142822266e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 17.0, 24.0, 30.0, 38.0, 63.0, 98.0, 162.0, 308.0, 675.0, 1413.0, 3324.0, 9105.0, 26822.0, 86008.0, 238657.0, 358824.0, 213041.0, 73382.0, 23179.0, 7844.0, 2860.0, 1323.0, 594.0, 293.0, 167.0, 102.0, 55.0, 44.0, 33.0, 13.0, 13.0, 6.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1790771484375, -0.17337989807128906, -0.16768264770507812, -0.1619853973388672, -0.15628814697265625, -0.1505908966064453, -0.14489364624023438, -0.13919639587402344, -0.1334991455078125, -0.12780189514160156, -0.12210464477539062, -0.11640739440917969, -0.11071014404296875, -0.10501289367675781, -0.09931564331054688, -0.09361839294433594, -0.087921142578125, -0.08222389221191406, -0.07652664184570312, -0.07082939147949219, -0.06513214111328125, -0.05943489074707031, -0.053737640380859375, -0.04804039001464844, -0.0423431396484375, -0.03664588928222656, -0.030948638916015625, -0.025251388549804688, -0.01955413818359375, -0.013856887817382812, -0.008159637451171875, -0.0024623870849609375, 0.00323486328125, 0.008932113647460938, 0.014629364013671875, 0.020326614379882812, 0.02602386474609375, 0.03172111511230469, 0.037418365478515625, 0.04311561584472656, 0.0488128662109375, 0.05451011657714844, 0.060207366943359375, 0.06590461730957031, 0.07160186767578125, 0.07729911804199219, 0.08299636840820312, 0.08869361877441406, 0.094390869140625, 0.10008811950683594, 0.10578536987304688, 0.11148262023925781, 0.11717987060546875, 0.12287712097167969, 0.12857437133789062, 0.13427162170410156, 0.1399688720703125, 0.14566612243652344, 0.15136337280273438, 0.1570606231689453, 0.16275787353515625, 0.1684551239013672, 0.17415237426757812, 0.17984962463378906, 0.185546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 4.0, 7.0, 11.0, 14.0, 20.0, 30.0, 43.0, 65.0, 65.0, 94.0, 95.0, 116.0, 102.0, 72.0, 73.0, 49.0, 39.0, 35.0, 28.0, 17.0, 7.0, 4.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.147125244140625, -0.13995361328125, -0.132781982421875, -0.1256103515625, -0.118438720703125, -0.11126708984375, -0.104095458984375, -0.096923828125, -0.089752197265625, -0.08258056640625, -0.075408935546875, -0.0682373046875, -0.061065673828125, -0.05389404296875, -0.046722412109375, -0.03955078125, -0.032379150390625, -0.02520751953125, -0.018035888671875, -0.0108642578125, -0.003692626953125, 0.00347900390625, 0.010650634765625, 0.017822265625, 0.024993896484375, 0.03216552734375, 0.039337158203125, 0.0465087890625, 0.053680419921875, 0.06085205078125, 0.068023681640625, 0.0751953125, 0.082366943359375, 0.08953857421875, 0.096710205078125, 0.1038818359375, 0.111053466796875, 0.11822509765625, 0.125396728515625, 0.132568359375, 0.139739990234375, 0.14691162109375, 0.154083251953125, 0.1612548828125, 0.168426513671875, 0.17559814453125, 0.182769775390625, 0.18994140625, 0.197113037109375, 0.20428466796875, 0.211456298828125, 0.2186279296875, 0.225799560546875, 0.23297119140625, 0.240142822265625, 0.247314453125, 0.254486083984375, 0.26165771484375, 0.268829345703125, 0.2760009765625, 0.283172607421875, 0.29034423828125, 0.297515869140625, 0.3046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 9.0, 24.0, 41.0, 81.0, 132.0, 162.0, 201.0, 149.0, 99.0, 41.0, 22.0, 13.0, 8.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5538761615753174, -2.4527816772460938, -2.35168719291687, -2.2505927085876465, -2.1494979858398438, -2.048403739929199, -1.9473090171813965, -1.8462145328521729, -1.7451200485229492, -1.6440255641937256, -1.542931079864502, -1.4418364763259888, -1.3407419919967651, -1.2396475076675415, -1.1385529041290283, -1.0374584197998047, -0.936363935470581, -0.8352694511413574, -0.734174907207489, -0.6330803632736206, -0.531985878944397, -0.43089139461517334, -0.32979685068130493, -0.22870230674743652, -0.1276078224182129, -0.02651330828666687, 0.07458120584487915, 0.17567571997642517, 0.2767702341079712, 0.3778647184371948, 0.47895926237106323, 0.5800538063049316, 0.6811485290527344, 0.782243013381958, 0.8833375573158264, 0.9844321012496948, 1.0855265855789185, 1.186621069908142, 1.2877156734466553, 1.388810157775879, 1.4899046421051025, 1.5909991264343262, 1.6920936107635498, 1.793188214302063, 1.8942826986312866, 1.9953771829605103, 2.0964717864990234, 2.197566270828247, 2.2986607551574707, 2.3997552394866943, 2.500849723815918, 2.6019442081451416, 2.7030386924743652, 2.804133415222168, 2.9052278995513916, 3.0063223838806152, 3.107416868209839, 3.2085113525390625, 3.309605836868286, 3.4107003211975098, 3.5117950439453125, 3.612889289855957, 3.7139840126037598, 3.8150784969329834, 3.916172981262207]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 8.0, 8.0, 5.0, 8.0, 20.0, 11.0, 17.0, 13.0, 21.0, 23.0, 32.0, 34.0, 36.0, 41.0, 25.0, 40.0, 37.0, 50.0, 41.0, 30.0, 45.0, 27.0, 40.0, 42.0, 44.0, 29.0, 31.0, 23.0, 27.0, 24.0, 27.0, 23.0, 24.0, 11.0, 16.0, 14.0, 11.0, 8.0, 7.0, 8.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.451817274093628, -1.4054875373840332, -1.359157681465149, -1.3128279447555542, -1.26649808883667, -1.2201683521270752, -1.1738386154174805, -1.1275087594985962, -1.081178903579712, -1.0348491668701172, -0.9885193109512329, -0.9421895742416382, -0.8958597183227539, -0.8495299816131592, -0.8032001852989197, -0.7568703889846802, -0.7105406522750854, -0.664210855960846, -0.6178810596466064, -0.5715513229370117, -0.5252214670181274, -0.4788917005062103, -0.4325619339942932, -0.3862321376800537, -0.3399023413658142, -0.2935725450515747, -0.2472427636384964, -0.2009129822254181, -0.1545831859111786, -0.10825338959693909, -0.06192362308502197, -0.01559382677078247, 0.03073596954345703, 0.07706575840711594, 0.12339554727077484, 0.16972532868385315, 0.21605512499809265, 0.26238492131233215, 0.30871468782424927, 0.35504448413848877, 0.40137428045272827, 0.4477040767669678, 0.4940338730812073, 0.5403636693954468, 0.5866934061050415, 0.6330232620239258, 0.6793529987335205, 0.72568279504776, 0.7720125913619995, 0.818342387676239, 0.8646721839904785, 0.9110019207000732, 0.9573317766189575, 1.0036615133285522, 1.0499913692474365, 1.0963211059570312, 1.142650842666626, 1.1889805793762207, 1.235310435295105, 1.2816401720046997, 1.327970027923584, 1.3742997646331787, 1.4206295013427734, 1.4669593572616577, 1.513289213180542]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 12.0, 9.0, 25.0, 36.0, 58.0, 84.0, 178.0, 266.0, 424.0, 680.0, 1236.0, 2322.0, 4716.0, 9583.0, 21164.0, 50126.0, 129925.0, 399204.0, 1253434.0, 1515429.0, 531111.0, 166073.0, 60398.0, 24973.0, 11049.0, 5450.0, 2716.0, 1460.0, 841.0, 465.0, 297.0, 198.0, 116.0, 71.0, 52.0, 37.0, 17.0, 14.0, 12.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2119140625, -0.20380020141601562, -0.19568634033203125, -0.18757247924804688, -0.1794586181640625, -0.17134475708007812, -0.16323089599609375, -0.15511703491210938, -0.147003173828125, -0.13888931274414062, -0.13077545166015625, -0.12266159057617188, -0.1145477294921875, -0.10643386840820312, -0.09832000732421875, -0.09020614624023438, -0.08209228515625, -0.07397842407226562, -0.06586456298828125, -0.057750701904296875, -0.0496368408203125, -0.041522979736328125, -0.03340911865234375, -0.025295257568359375, -0.017181396484375, -0.009067535400390625, -0.00095367431640625, 0.007160186767578125, 0.0152740478515625, 0.023387908935546875, 0.03150177001953125, 0.039615631103515625, 0.0477294921875, 0.055843353271484375, 0.06395721435546875, 0.07207107543945312, 0.0801849365234375, 0.08829879760742188, 0.09641265869140625, 0.10452651977539062, 0.112640380859375, 0.12075424194335938, 0.12886810302734375, 0.13698196411132812, 0.1450958251953125, 0.15320968627929688, 0.16132354736328125, 0.16943740844726562, 0.17755126953125, 0.18566513061523438, 0.19377899169921875, 0.20189285278320312, 0.2100067138671875, 0.21812057495117188, 0.22623443603515625, 0.23434829711914062, 0.242462158203125, 0.2505760192871094, 0.25868988037109375, 0.2668037414550781, 0.2749176025390625, 0.2830314636230469, 0.29114532470703125, 0.2992591857910156, 0.307373046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 10.0, 7.0, 10.0, 10.0, 19.0, 17.0, 21.0, 17.0, 27.0, 30.0, 30.0, 33.0, 37.0, 35.0, 42.0, 43.0, 35.0, 68.0, 45.0, 39.0, 43.0, 42.0, 39.0, 34.0, 31.0, 27.0, 27.0, 33.0, 29.0, 20.0, 20.0, 20.0, 10.0, 9.0, 6.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.1710681915283203, -0.16452407836914062, -0.15797996520996094, -0.15143585205078125, -0.14489173889160156, -0.13834762573242188, -0.1318035125732422, -0.1252593994140625, -0.11871528625488281, -0.11217117309570312, -0.10562705993652344, -0.09908294677734375, -0.09253883361816406, -0.08599472045898438, -0.07945060729980469, -0.072906494140625, -0.06636238098144531, -0.059818267822265625, -0.05327415466308594, -0.04673004150390625, -0.04018592834472656, -0.033641815185546875, -0.027097702026367188, -0.0205535888671875, -0.014009475708007812, -0.007465362548828125, -0.0009212493896484375, 0.00562286376953125, 0.012166976928710938, 0.018711090087890625, 0.025255203247070312, 0.03179931640625, 0.03834342956542969, 0.044887542724609375, 0.05143165588378906, 0.05797576904296875, 0.06451988220214844, 0.07106399536132812, 0.07760810852050781, 0.0841522216796875, 0.09069633483886719, 0.09724044799804688, 0.10378456115722656, 0.11032867431640625, 0.11687278747558594, 0.12341690063476562, 0.1299610137939453, 0.136505126953125, 0.1430492401123047, 0.14959335327148438, 0.15613746643066406, 0.16268157958984375, 0.16922569274902344, 0.17576980590820312, 0.1823139190673828, 0.1888580322265625, 0.1954021453857422, 0.20194625854492188, 0.20849037170410156, 0.21503448486328125, 0.22157859802246094, 0.22812271118164062, 0.2346668243408203, 0.2412109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 10.0, 10.0, 21.0, 31.0, 47.0, 75.0, 117.0, 234.0, 377.0, 733.0, 1586.0, 3614.0, 9974.0, 32123.0, 131044.0, 739088.0, 2640858.0, 499043.0, 97150.0, 24550.0, 7932.0, 2865.0, 1249.0, 669.0, 336.0, 175.0, 128.0, 80.0, 56.0, 34.0, 21.0, 15.0, 9.0, 9.0, 6.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5248146057128906, -0.5091018676757812, -0.4933891296386719, -0.4776763916015625, -0.4619636535644531, -0.44625091552734375, -0.4305381774902344, -0.414825439453125, -0.3991127014160156, -0.38339996337890625, -0.3676872253417969, -0.3519744873046875, -0.3362617492675781, -0.32054901123046875, -0.3048362731933594, -0.28912353515625, -0.2734107971191406, -0.25769805908203125, -0.24198532104492188, -0.2262725830078125, -0.21055984497070312, -0.19484710693359375, -0.17913436889648438, -0.163421630859375, -0.14770889282226562, -0.13199615478515625, -0.11628341674804688, -0.1005706787109375, -0.08485794067382812, -0.06914520263671875, -0.053432464599609375, -0.0377197265625, -0.022006988525390625, -0.00629425048828125, 0.009418487548828125, 0.0251312255859375, 0.040843963623046875, 0.05655670166015625, 0.07226943969726562, 0.087982177734375, 0.10369491577148438, 0.11940765380859375, 0.13512039184570312, 0.1508331298828125, 0.16654586791992188, 0.18225860595703125, 0.19797134399414062, 0.21368408203125, 0.22939682006835938, 0.24510955810546875, 0.2608222961425781, 0.2765350341796875, 0.2922477722167969, 0.30796051025390625, 0.3236732482910156, 0.339385986328125, 0.3550987243652344, 0.37081146240234375, 0.3865242004394531, 0.4022369384765625, 0.4179496765136719, 0.43366241455078125, 0.4493751525878906, 0.465087890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 6.0, 1.0, 7.0, 15.0, 8.0, 13.0, 24.0, 31.0, 39.0, 52.0, 70.0, 107.0, 146.0, 191.0, 277.0, 406.0, 599.0, 619.0, 438.0, 320.0, 208.0, 140.0, 98.0, 65.0, 58.0, 41.0, 19.0, 14.0, 15.0, 14.0, 8.0, 4.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3681640625, -0.3545684814453125, -0.340972900390625, -0.3273773193359375, -0.31378173828125, -0.3001861572265625, -0.286590576171875, -0.2729949951171875, -0.2593994140625, -0.2458038330078125, -0.232208251953125, -0.2186126708984375, -0.20501708984375, -0.1914215087890625, -0.177825927734375, -0.1642303466796875, -0.150634765625, -0.1370391845703125, -0.123443603515625, -0.1098480224609375, -0.09625244140625, -0.0826568603515625, -0.069061279296875, -0.0554656982421875, -0.0418701171875, -0.0282745361328125, -0.014678955078125, -0.0010833740234375, 0.01251220703125, 0.0261077880859375, 0.039703369140625, 0.0532989501953125, 0.06689453125, 0.0804901123046875, 0.094085693359375, 0.1076812744140625, 0.12127685546875, 0.1348724365234375, 0.148468017578125, 0.1620635986328125, 0.1756591796875, 0.1892547607421875, 0.202850341796875, 0.2164459228515625, 0.23004150390625, 0.2436370849609375, 0.257232666015625, 0.2708282470703125, 0.284423828125, 0.2980194091796875, 0.311614990234375, 0.3252105712890625, 0.33880615234375, 0.3524017333984375, 0.365997314453125, 0.3795928955078125, 0.3931884765625, 0.4067840576171875, 0.420379638671875, 0.4339752197265625, 0.44757080078125, 0.4611663818359375, 0.474761962890625, 0.4883575439453125, 0.501953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 12.0, 29.0, 40.0, 76.0, 123.0, 129.0, 143.0, 153.0, 119.0, 77.0, 45.0, 20.0, 14.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.283090114593506, -4.17725944519043, -4.0714287757873535, -3.9655983448028564, -3.8597679138183594, -3.753937244415283, -3.648106575012207, -3.54227614402771, -3.436445474624634, -3.3306148052215576, -3.2247843742370605, -3.1189537048339844, -3.0131232738494873, -2.907292604446411, -2.801462173461914, -2.695631504058838, -2.5898008346557617, -2.4839701652526855, -2.3781397342681885, -2.2723090648651123, -2.1664786338806152, -2.060647964477539, -1.9548174142837524, -1.8489868640899658, -1.7431564331054688, -1.6373258829116821, -1.5314953327178955, -1.4256646633148193, -1.3198341131210327, -1.214003562927246, -1.1081730127334595, -1.0023424625396729, -0.8965117931365967, -0.7906812429428101, -0.6848506331443787, -0.579020082950592, -0.47318950295448303, -0.367358922958374, -0.2615283727645874, -0.155697762966156, -0.049867212772369385, 0.05596335977315903, 0.16179393231868744, 0.26762449741363525, 0.37345507740974426, 0.47928565740585327, 0.5851162075996399, 0.6909468173980713, 0.7967773675918579, 0.9026079177856445, 1.0084384679794312, 1.1142690181732178, 1.220099687576294, 1.3259302377700806, 1.4317607879638672, 1.5375914573669434, 1.6434218883514404, 1.749252438545227, 1.8550829887390137, 1.9609136581420898, 2.066744089126587, 2.172574758529663, 2.27840518951416, 2.3842358589172363, 2.4900665283203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 5.0, 8.0, 7.0, 11.0, 14.0, 13.0, 30.0, 18.0, 28.0, 30.0, 21.0, 35.0, 26.0, 34.0, 34.0, 41.0, 28.0, 45.0, 45.0, 50.0, 38.0, 39.0, 39.0, 29.0, 35.0, 29.0, 30.0, 36.0, 25.0, 22.0, 30.0, 19.0, 16.0, 13.0, 13.0, 8.0, 6.0, 9.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.3442909717559814, -1.3058111667633057, -1.2673313617706299, -1.228851556777954, -1.1903717517852783, -1.1518919467926025, -1.1134121417999268, -1.074932336807251, -1.0364525318145752, -0.9979727268218994, -0.9594929218292236, -0.9210131168365479, -0.8825333118438721, -0.8440535068511963, -0.8055737018585205, -0.7670938968658447, -0.728614091873169, -0.6901342868804932, -0.6516544818878174, -0.6131746768951416, -0.5746948719024658, -0.53621506690979, -0.49773526191711426, -0.4592554569244385, -0.4207756519317627, -0.3822958469390869, -0.34381604194641113, -0.30533623695373535, -0.26685643196105957, -0.2283766269683838, -0.189896821975708, -0.15141701698303223, -0.11293721199035645, -0.07445740699768066, -0.03597760200500488, 0.0025022029876708984, 0.04098200798034668, 0.07946181297302246, 0.11794161796569824, 0.15642142295837402, 0.1949012279510498, 0.23338103294372559, 0.27186083793640137, 0.31034064292907715, 0.34882044792175293, 0.3873002529144287, 0.4257800579071045, 0.4642598628997803, 0.502739667892456, 0.5412194728851318, 0.5796992778778076, 0.6181790828704834, 0.6566588878631592, 0.695138692855835, 0.7336184978485107, 0.7720983028411865, 0.8105781078338623, 0.8490579128265381, 0.8875377178192139, 0.9260175228118896, 0.9644973278045654, 1.0029771327972412, 1.041456937789917, 1.0799367427825928, 1.1184165477752686]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 21.0, 30.0, 35.0, 56.0, 62.0, 107.0, 228.0, 350.0, 630.0, 1149.0, 2064.0, 3920.0, 7853.0, 17351.0, 42224.0, 111220.0, 253911.0, 313132.0, 175752.0, 68604.0, 26506.0, 11563.0, 5512.0, 2782.0, 1501.0, 777.0, 473.0, 266.0, 163.0, 90.0, 66.0, 43.0, 36.0, 19.0, 14.0, 13.0, 6.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.484130859375, -0.4711341857910156, -0.45813751220703125, -0.4451408386230469, -0.4321441650390625, -0.4191474914550781, -0.40615081787109375, -0.3931541442871094, -0.380157470703125, -0.3671607971191406, -0.35416412353515625, -0.3411674499511719, -0.3281707763671875, -0.3151741027832031, -0.30217742919921875, -0.2891807556152344, -0.27618408203125, -0.2631874084472656, -0.25019073486328125, -0.23719406127929688, -0.2241973876953125, -0.21120071411132812, -0.19820404052734375, -0.18520736694335938, -0.172210693359375, -0.15921401977539062, -0.14621734619140625, -0.13322067260742188, -0.1202239990234375, -0.10722732543945312, -0.09423065185546875, -0.08123397827148438, -0.0682373046875, -0.055240631103515625, -0.04224395751953125, -0.029247283935546875, -0.0162506103515625, -0.003253936767578125, 0.00974273681640625, 0.022739410400390625, 0.035736083984375, 0.048732757568359375, 0.06172943115234375, 0.07472610473632812, 0.0877227783203125, 0.10071945190429688, 0.11371612548828125, 0.12671279907226562, 0.13970947265625, 0.15270614624023438, 0.16570281982421875, 0.17869949340820312, 0.1916961669921875, 0.20469284057617188, 0.21768951416015625, 0.23068618774414062, 0.243682861328125, 0.2566795349121094, 0.26967620849609375, 0.2826728820800781, 0.2956695556640625, 0.3086662292480469, 0.32166290283203125, 0.3346595764160156, 0.34765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 11.0, 15.0, 16.0, 16.0, 15.0, 20.0, 23.0, 28.0, 28.0, 38.0, 36.0, 35.0, 40.0, 36.0, 50.0, 39.0, 41.0, 51.0, 45.0, 47.0, 49.0, 39.0, 36.0, 32.0, 30.0, 32.0, 29.0, 20.0, 23.0, 11.0, 11.0, 19.0, 10.0, 8.0, 4.0, 8.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2005615234375, -0.19386672973632812, -0.18717193603515625, -0.18047714233398438, -0.1737823486328125, -0.16708755493164062, -0.16039276123046875, -0.15369796752929688, -0.147003173828125, -0.14030838012695312, -0.13361358642578125, -0.12691879272460938, -0.1202239990234375, -0.11352920532226562, -0.10683441162109375, -0.10013961791992188, -0.09344482421875, -0.08675003051757812, -0.08005523681640625, -0.07336044311523438, -0.0666656494140625, -0.059970855712890625, -0.05327606201171875, -0.046581268310546875, -0.039886474609375, -0.033191680908203125, -0.02649688720703125, -0.019802093505859375, -0.0131072998046875, -0.006412506103515625, 0.00028228759765625, 0.006977081298828125, 0.013671875, 0.020366668701171875, 0.02706146240234375, 0.033756256103515625, 0.0404510498046875, 0.047145843505859375, 0.05384063720703125, 0.060535430908203125, 0.067230224609375, 0.07392501831054688, 0.08061981201171875, 0.08731460571289062, 0.0940093994140625, 0.10070419311523438, 0.10739898681640625, 0.11409378051757812, 0.12078857421875, 0.12748336791992188, 0.13417816162109375, 0.14087295532226562, 0.1475677490234375, 0.15426254272460938, 0.16095733642578125, 0.16765213012695312, 0.174346923828125, 0.18104171752929688, 0.18773651123046875, 0.19443130493164062, 0.2011260986328125, 0.20782089233398438, 0.21451568603515625, 0.22121047973632812, 0.2279052734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 8.0, 8.0, 8.0, 15.0, 24.0, 42.0, 58.0, 78.0, 139.0, 237.0, 425.0, 834.0, 1514.0, 3121.0, 6021.0, 12834.0, 29181.0, 72781.0, 182088.0, 322079.0, 241483.0, 102290.0, 40069.0, 16912.0, 8112.0, 3911.0, 1931.0, 1009.0, 571.0, 306.0, 173.0, 94.0, 64.0, 37.0, 26.0, 18.0, 13.0, 5.0, 11.0, 7.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3798828125, -0.3670845031738281, -0.35428619384765625, -0.3414878845214844, -0.3286895751953125, -0.3158912658691406, -0.30309295654296875, -0.2902946472167969, -0.277496337890625, -0.2646980285644531, -0.25189971923828125, -0.23910140991210938, -0.2263031005859375, -0.21350479125976562, -0.20070648193359375, -0.18790817260742188, -0.17510986328125, -0.16231155395507812, -0.14951324462890625, -0.13671493530273438, -0.1239166259765625, -0.11111831665039062, -0.09832000732421875, -0.08552169799804688, -0.072723388671875, -0.059925079345703125, -0.04712677001953125, -0.034328460693359375, -0.0215301513671875, -0.008731842041015625, 0.00406646728515625, 0.016864776611328125, 0.0296630859375, 0.042461395263671875, 0.05525970458984375, 0.06805801391601562, 0.0808563232421875, 0.09365463256835938, 0.10645294189453125, 0.11925125122070312, 0.132049560546875, 0.14484786987304688, 0.15764617919921875, 0.17044448852539062, 0.1832427978515625, 0.19604110717773438, 0.20883941650390625, 0.22163772583007812, 0.23443603515625, 0.24723434448242188, 0.26003265380859375, 0.2728309631347656, 0.2856292724609375, 0.2984275817871094, 0.31122589111328125, 0.3240242004394531, 0.336822509765625, 0.3496208190917969, 0.36241912841796875, 0.3752174377441406, 0.3880157470703125, 0.4008140563964844, 0.41361236572265625, 0.4264106750488281, 0.439208984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 2.0, 7.0, 11.0, 6.0, 13.0, 13.0, 13.0, 17.0, 17.0, 28.0, 30.0, 27.0, 41.0, 41.0, 45.0, 35.0, 53.0, 48.0, 55.0, 49.0, 44.0, 52.0, 40.0, 44.0, 36.0, 33.0, 29.0, 27.0, 21.0, 31.0, 19.0, 20.0, 11.0, 12.0, 8.0, 9.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.677734375, -0.6579818725585938, -0.6382293701171875, -0.6184768676757812, -0.598724365234375, -0.5789718627929688, -0.5592193603515625, -0.5394668579101562, -0.51971435546875, -0.49996185302734375, -0.4802093505859375, -0.46045684814453125, -0.440704345703125, -0.42095184326171875, -0.4011993408203125, -0.38144683837890625, -0.3616943359375, -0.34194183349609375, -0.3221893310546875, -0.30243682861328125, -0.282684326171875, -0.26293182373046875, -0.2431793212890625, -0.22342681884765625, -0.20367431640625, -0.18392181396484375, -0.1641693115234375, -0.14441680908203125, -0.124664306640625, -0.10491180419921875, -0.0851593017578125, -0.06540679931640625, -0.045654296875, -0.02590179443359375, -0.0061492919921875, 0.01360321044921875, 0.033355712890625, 0.05310821533203125, 0.0728607177734375, 0.09261322021484375, 0.11236572265625, 0.13211822509765625, 0.1518707275390625, 0.17162322998046875, 0.191375732421875, 0.21112823486328125, 0.2308807373046875, 0.25063323974609375, 0.2703857421875, 0.29013824462890625, 0.3098907470703125, 0.32964324951171875, 0.349395751953125, 0.36914825439453125, 0.3889007568359375, 0.40865325927734375, 0.42840576171875, 0.44815826416015625, 0.4679107666015625, 0.48766326904296875, 0.507415771484375, 0.5271682739257812, 0.5469207763671875, 0.5666732788085938, 0.58642578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 5.0, 6.0, 12.0, 25.0, 28.0, 49.0, 59.0, 113.0, 186.0, 294.0, 515.0, 929.0, 1774.0, 3399.0, 6590.0, 13699.0, 29905.0, 70039.0, 164068.0, 290699.0, 250128.0, 121722.0, 50820.0, 22160.0, 10473.0, 5167.0, 2568.0, 1349.0, 730.0, 402.0, 255.0, 151.0, 73.0, 59.0, 37.0, 18.0, 11.0, 9.0, 7.0, 5.0, 7.0, 3.0, 7.0, 2.0], "bins": [-0.1646728515625, -0.1605367660522461, -0.1564006805419922, -0.15226459503173828, -0.14812850952148438, -0.14399242401123047, -0.13985633850097656, -0.13572025299072266, -0.13158416748046875, -0.12744808197021484, -0.12331199645996094, -0.11917591094970703, -0.11503982543945312, -0.11090373992919922, -0.10676765441894531, -0.1026315689086914, -0.0984954833984375, -0.0943593978881836, -0.09022331237792969, -0.08608722686767578, -0.08195114135742188, -0.07781505584716797, -0.07367897033691406, -0.06954288482666016, -0.06540679931640625, -0.061270713806152344, -0.05713462829589844, -0.05299854278564453, -0.048862457275390625, -0.04472637176513672, -0.04059028625488281, -0.036454200744628906, -0.032318115234375, -0.028182029724121094, -0.024045944213867188, -0.01990985870361328, -0.015773773193359375, -0.011637687683105469, -0.0075016021728515625, -0.0033655166625976562, 0.00077056884765625, 0.004906654357910156, 0.009042739868164062, 0.013178825378417969, 0.017314910888671875, 0.02145099639892578, 0.025587081909179688, 0.029723167419433594, 0.0338592529296875, 0.037995338439941406, 0.04213142395019531, 0.04626750946044922, 0.050403594970703125, 0.05453968048095703, 0.05867576599121094, 0.06281185150146484, 0.06694793701171875, 0.07108402252197266, 0.07522010803222656, 0.07935619354248047, 0.08349227905273438, 0.08762836456298828, 0.09176445007324219, 0.0959005355834961, 0.10003662109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 9.0, 11.0, 13.0, 23.0, 27.0, 42.0, 61.0, 107.0, 120.0, 138.0, 137.0, 90.0, 62.0, 34.0, 33.0, 23.0, 15.0, 17.0, 12.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.751848220825195e-05, -5.5339187383651733e-05, -5.3159892559051514e-05, -5.0980597734451294e-05, -4.8801302909851074e-05, -4.6622008085250854e-05, -4.4442713260650635e-05, -4.2263418436050415e-05, -4.0084123611450195e-05, -3.7904828786849976e-05, -3.5725533962249756e-05, -3.3546239137649536e-05, -3.1366944313049316e-05, -2.9187649488449097e-05, -2.7008354663848877e-05, -2.4829059839248657e-05, -2.2649765014648438e-05, -2.0470470190048218e-05, -1.8291175365447998e-05, -1.611188054084778e-05, -1.3932585716247559e-05, -1.1753290891647339e-05, -9.573996067047119e-06, -7.394701242446899e-06, -5.21540641784668e-06, -3.03611159324646e-06, -8.568167686462402e-07, 1.3224780559539795e-06, 3.5017728805541992e-06, 5.681067705154419e-06, 7.860362529754639e-06, 1.0039657354354858e-05, 1.2218952178955078e-05, 1.4398247003555298e-05, 1.6577541828155518e-05, 1.8756836652755737e-05, 2.0936131477355957e-05, 2.3115426301956177e-05, 2.5294721126556396e-05, 2.7474015951156616e-05, 2.9653310775756836e-05, 3.1832605600357056e-05, 3.4011900424957275e-05, 3.6191195249557495e-05, 3.8370490074157715e-05, 4.0549784898757935e-05, 4.2729079723358154e-05, 4.4908374547958374e-05, 4.7087669372558594e-05, 4.9266964197158813e-05, 5.144625902175903e-05, 5.362555384635925e-05, 5.580484867095947e-05, 5.798414349555969e-05, 6.016343832015991e-05, 6.234273314476013e-05, 6.452202796936035e-05, 6.670132279396057e-05, 6.888061761856079e-05, 7.105991244316101e-05, 7.323920726776123e-05, 7.541850209236145e-05, 7.759779691696167e-05, 7.977709174156189e-05, 8.195638656616211e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 5.0, 17.0, 22.0, 29.0, 39.0, 52.0, 69.0, 127.0, 171.0, 263.0, 410.0, 740.0, 1429.0, 2812.0, 5442.0, 11232.0, 24141.0, 54925.0, 118129.0, 214855.0, 258346.0, 183274.0, 93112.0, 41746.0, 19084.0, 8754.0, 4257.0, 2136.0, 1147.0, 654.0, 416.0, 222.0, 155.0, 100.0, 55.0, 49.0, 39.0, 21.0, 20.0, 11.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1158447265625, -0.11202621459960938, -0.10820770263671875, -0.10438919067382812, -0.1005706787109375, -0.09675216674804688, -0.09293365478515625, -0.08911514282226562, -0.085296630859375, -0.08147811889648438, -0.07765960693359375, -0.07384109497070312, -0.0700225830078125, -0.06620407104492188, -0.06238555908203125, -0.058567047119140625, -0.05474853515625, -0.050930023193359375, -0.04711151123046875, -0.043292999267578125, -0.0394744873046875, -0.035655975341796875, -0.03183746337890625, -0.028018951416015625, -0.024200439453125, -0.020381927490234375, -0.01656341552734375, -0.012744903564453125, -0.0089263916015625, -0.005107879638671875, -0.00128936767578125, 0.002529144287109375, 0.00634765625, 0.010166168212890625, 0.01398468017578125, 0.017803192138671875, 0.0216217041015625, 0.025440216064453125, 0.02925872802734375, 0.033077239990234375, 0.036895751953125, 0.040714263916015625, 0.04453277587890625, 0.048351287841796875, 0.0521697998046875, 0.055988311767578125, 0.05980682373046875, 0.06362533569335938, 0.06744384765625, 0.07126235961914062, 0.07508087158203125, 0.07889938354492188, 0.0827178955078125, 0.08653640747070312, 0.09035491943359375, 0.09417343139648438, 0.097991943359375, 0.10181045532226562, 0.10562896728515625, 0.10944747924804688, 0.1132659912109375, 0.11708450317382812, 0.12090301513671875, 0.12472152709960938, 0.1285400390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 8.0, 4.0, 7.0, 15.0, 10.0, 16.0, 27.0, 35.0, 34.0, 52.0, 55.0, 75.0, 66.0, 76.0, 87.0, 62.0, 63.0, 61.0, 52.0, 41.0, 36.0, 26.0, 20.0, 14.0, 16.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.185791015625, -0.1803741455078125, -0.174957275390625, -0.1695404052734375, -0.16412353515625, -0.1587066650390625, -0.153289794921875, -0.1478729248046875, -0.1424560546875, -0.1370391845703125, -0.131622314453125, -0.1262054443359375, -0.12078857421875, -0.1153717041015625, -0.109954833984375, -0.1045379638671875, -0.09912109375, -0.0937042236328125, -0.088287353515625, -0.0828704833984375, -0.07745361328125, -0.0720367431640625, -0.066619873046875, -0.0612030029296875, -0.0557861328125, -0.0503692626953125, -0.044952392578125, -0.0395355224609375, -0.03411865234375, -0.0287017822265625, -0.023284912109375, -0.0178680419921875, -0.012451171875, -0.0070343017578125, -0.001617431640625, 0.0037994384765625, 0.00921630859375, 0.0146331787109375, 0.020050048828125, 0.0254669189453125, 0.0308837890625, 0.0363006591796875, 0.041717529296875, 0.0471343994140625, 0.05255126953125, 0.0579681396484375, 0.063385009765625, 0.0688018798828125, 0.07421875, 0.0796356201171875, 0.085052490234375, 0.0904693603515625, 0.09588623046875, 0.1013031005859375, 0.106719970703125, 0.1121368408203125, 0.1175537109375, 0.1229705810546875, 0.128387451171875, 0.1338043212890625, 0.13922119140625, 0.1446380615234375, 0.150054931640625, 0.1554718017578125, 0.160888671875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 11.0, 15.0, 55.0, 139.0, 252.0, 274.0, 150.0, 66.0, 22.0, 11.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9352967739105225, -2.771942615509033, -2.608588695526123, -2.445234537124634, -2.2818803787231445, -2.1185264587402344, -1.9551723003387451, -1.7918182611465454, -1.6284642219543457, -1.465110182762146, -1.3017561435699463, -1.138401985168457, -0.9750479459762573, -0.8116939067840576, -0.6483398079872131, -0.48498570919036865, -0.32163166999816895, -0.15827760100364685, 0.005076467990875244, 0.16843053698539734, 0.33178460597991943, 0.49513864517211914, 0.6584927439689636, 0.8218468427658081, 0.9852008819580078, 1.1485549211502075, 1.3119089603424072, 1.4752631187438965, 1.6386171579360962, 1.801971197128296, 1.9653253555297852, 2.1286792755126953, 2.2920331954956055, 2.4553873538970947, 2.618741273880005, 2.782095432281494, 2.9454493522644043, 3.1088035106658936, 3.272157669067383, 3.435511589050293, 3.5988657474517822, 3.7622199058532715, 3.9255738258361816, 4.088927745819092, 4.25228214263916, 4.41563606262207, 4.5789899826049805, 4.742344379425049, 4.905698299407959, 5.069052219390869, 5.2324066162109375, 5.395760536193848, 5.559114456176758, 5.722468376159668, 5.885822772979736, 6.0491766929626465, 6.212531089782715, 6.375885009765625, 6.539239406585693, 6.7025933265686035, 6.865947246551514, 7.029301643371582, 7.192655563354492, 7.356009483337402, 7.5193634033203125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 4.0, 6.0, 4.0, 7.0, 11.0, 18.0, 14.0, 15.0, 20.0, 21.0, 24.0, 24.0, 22.0, 40.0, 26.0, 32.0, 26.0, 40.0, 27.0, 24.0, 30.0, 46.0, 42.0, 43.0, 38.0, 36.0, 36.0, 34.0, 30.0, 25.0, 31.0, 29.0, 13.0, 30.0, 19.0, 16.0, 10.0, 12.0, 7.0, 10.0, 15.0, 9.0, 8.0, 11.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4249085187911987, -1.3807636499404907, -1.3366187810897827, -1.2924739122390747, -1.2483291625976562, -1.2041842937469482, -1.1600394248962402, -1.1158945560455322, -1.0717496871948242, -1.0276048183441162, -0.9834599494934082, -0.939315140247345, -0.895170271396637, -0.851025402545929, -0.8068805932998657, -0.7627357244491577, -0.7185908555984497, -0.6744459867477417, -0.6303011178970337, -0.5861563086509705, -0.5420114398002625, -0.49786657094955444, -0.4537217319011688, -0.4095768928527832, -0.3654320240020752, -0.3212871551513672, -0.27714231610298157, -0.23299746215343475, -0.18885260820388794, -0.14470775425434113, -0.10056290030479431, -0.05641806125640869, -0.012273311614990234, 0.03187154233455658, 0.0760163962841034, 0.12016125023365021, 0.16430610418319702, 0.20845095813274384, 0.25259581208229065, 0.29674065113067627, 0.3408855199813843, 0.3850303888320923, 0.4291752278804779, 0.4733200669288635, 0.5174649357795715, 0.5616098046302795, 0.6057546138763428, 0.6498994827270508, 0.6940443515777588, 0.7381892204284668, 0.7823340892791748, 0.826478898525238, 0.870623767375946, 0.914768636226654, 0.9589134454727173, 1.0030583143234253, 1.0472031831741333, 1.0913480520248413, 1.1354929208755493, 1.1796377897262573, 1.2237825393676758, 1.2679274082183838, 1.3120722770690918, 1.3562171459197998, 1.4003620147705078]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 16.0, 21.0, 35.0, 45.0, 83.0, 124.0, 192.0, 244.0, 421.0, 704.0, 1084.0, 1935.0, 3224.0, 5390.0, 9608.0, 17428.0, 33312.0, 66206.0, 136676.0, 302434.0, 662435.0, 1139512.0, 942053.0, 466947.0, 208195.0, 95385.0, 46223.0, 23999.0, 12694.0, 7178.0, 4034.0, 2420.0, 1551.0, 933.0, 544.0, 312.0, 216.0, 129.0, 92.0, 79.0, 44.0, 35.0, 27.0, 22.0, 7.0, 4.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.17626953125, -0.17053985595703125, -0.1648101806640625, -0.15908050537109375, -0.153350830078125, -0.14762115478515625, -0.1418914794921875, -0.13616180419921875, -0.13043212890625, -0.12470245361328125, -0.1189727783203125, -0.11324310302734375, -0.107513427734375, -0.10178375244140625, -0.0960540771484375, -0.09032440185546875, -0.0845947265625, -0.07886505126953125, -0.0731353759765625, -0.06740570068359375, -0.061676025390625, -0.05594635009765625, -0.0502166748046875, -0.04448699951171875, -0.03875732421875, -0.03302764892578125, -0.0272979736328125, -0.02156829833984375, -0.015838623046875, -0.01010894775390625, -0.0043792724609375, 0.00135040283203125, 0.007080078125, 0.01280975341796875, 0.0185394287109375, 0.02426910400390625, 0.029998779296875, 0.03572845458984375, 0.0414581298828125, 0.04718780517578125, 0.05291748046875, 0.05864715576171875, 0.0643768310546875, 0.07010650634765625, 0.075836181640625, 0.08156585693359375, 0.0872955322265625, 0.09302520751953125, 0.0987548828125, 0.10448455810546875, 0.1102142333984375, 0.11594390869140625, 0.121673583984375, 0.12740325927734375, 0.1331329345703125, 0.13886260986328125, 0.14459228515625, 0.15032196044921875, 0.1560516357421875, 0.16178131103515625, 0.167510986328125, 0.17324066162109375, 0.1789703369140625, 0.18470001220703125, 0.1904296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 10.0, 12.0, 7.0, 15.0, 18.0, 15.0, 15.0, 22.0, 22.0, 36.0, 31.0, 33.0, 41.0, 41.0, 50.0, 42.0, 53.0, 53.0, 60.0, 35.0, 55.0, 40.0, 46.0, 44.0, 31.0, 28.0, 29.0, 26.0, 20.0, 20.0, 21.0, 10.0, 4.0, 4.0, 1.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23779296875, -0.2305450439453125, -0.223297119140625, -0.2160491943359375, -0.20880126953125, -0.2015533447265625, -0.194305419921875, -0.1870574951171875, -0.1798095703125, -0.1725616455078125, -0.165313720703125, -0.1580657958984375, -0.15081787109375, -0.1435699462890625, -0.136322021484375, -0.1290740966796875, -0.121826171875, -0.1145782470703125, -0.107330322265625, -0.1000823974609375, -0.09283447265625, -0.0855865478515625, -0.078338623046875, -0.0710906982421875, -0.0638427734375, -0.0565948486328125, -0.049346923828125, -0.0420989990234375, -0.03485107421875, -0.0276031494140625, -0.020355224609375, -0.0131072998046875, -0.005859375, 0.0013885498046875, 0.008636474609375, 0.0158843994140625, 0.02313232421875, 0.0303802490234375, 0.037628173828125, 0.0448760986328125, 0.0521240234375, 0.0593719482421875, 0.066619873046875, 0.0738677978515625, 0.08111572265625, 0.0883636474609375, 0.095611572265625, 0.1028594970703125, 0.110107421875, 0.1173553466796875, 0.124603271484375, 0.1318511962890625, 0.13909912109375, 0.1463470458984375, 0.153594970703125, 0.1608428955078125, 0.1680908203125, 0.1753387451171875, 0.182586669921875, 0.1898345947265625, 0.19708251953125, 0.2043304443359375, 0.211578369140625, 0.2188262939453125, 0.22607421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 7.0, 15.0, 11.0, 34.0, 35.0, 54.0, 123.0, 165.0, 304.0, 605.0, 1310.0, 3393.0, 10106.0, 37172.0, 174952.0, 1193251.0, 2330249.0, 351298.0, 66125.0, 16380.0, 5031.0, 1942.0, 808.0, 395.0, 187.0, 121.0, 83.0, 33.0, 28.0, 19.0, 12.0, 12.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3784599304199219, -0.36214447021484375, -0.3458290100097656, -0.3295135498046875, -0.3131980895996094, -0.29688262939453125, -0.2805671691894531, -0.264251708984375, -0.24793624877929688, -0.23162078857421875, -0.21530532836914062, -0.1989898681640625, -0.18267440795898438, -0.16635894775390625, -0.15004348754882812, -0.13372802734375, -0.11741256713867188, -0.10109710693359375, -0.08478164672851562, -0.0684661865234375, -0.052150726318359375, -0.03583526611328125, -0.019519805908203125, -0.003204345703125, 0.013111114501953125, 0.02942657470703125, 0.045742034912109375, 0.0620574951171875, 0.07837295532226562, 0.09468841552734375, 0.11100387573242188, 0.1273193359375, 0.14363479614257812, 0.15995025634765625, 0.17626571655273438, 0.1925811767578125, 0.20889663696289062, 0.22521209716796875, 0.24152755737304688, 0.257843017578125, 0.2741584777832031, 0.29047393798828125, 0.3067893981933594, 0.3231048583984375, 0.3394203186035156, 0.35573577880859375, 0.3720512390136719, 0.38836669921875, 0.4046821594238281, 0.42099761962890625, 0.4373130798339844, 0.4536285400390625, 0.4699440002441406, 0.48625946044921875, 0.5025749206542969, 0.518890380859375, 0.5352058410644531, 0.5515213012695312, 0.5678367614746094, 0.5841522216796875, 0.6004676818847656, 0.6167831420898438, 0.6330986022949219, 0.6494140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 5.0, 6.0, 10.0, 13.0, 15.0, 16.0, 26.0, 36.0, 55.0, 68.0, 99.0, 143.0, 174.0, 228.0, 363.0, 431.0, 548.0, 424.0, 391.0, 262.0, 189.0, 146.0, 104.0, 75.0, 64.0, 48.0, 30.0, 18.0, 13.0, 15.0, 14.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3437004089355469, -0.33119964599609375, -0.3186988830566406, -0.3061981201171875, -0.2936973571777344, -0.28119659423828125, -0.2686958312988281, -0.256195068359375, -0.24369430541992188, -0.23119354248046875, -0.21869277954101562, -0.2061920166015625, -0.19369125366210938, -0.18119049072265625, -0.16868972778320312, -0.15618896484375, -0.14368820190429688, -0.13118743896484375, -0.11868667602539062, -0.1061859130859375, -0.09368515014648438, -0.08118438720703125, -0.06868362426757812, -0.056182861328125, -0.043682098388671875, -0.03118133544921875, -0.018680572509765625, -0.0061798095703125, 0.006320953369140625, 0.01882171630859375, 0.031322479248046875, 0.0438232421875, 0.056324005126953125, 0.06882476806640625, 0.08132553100585938, 0.0938262939453125, 0.10632705688476562, 0.11882781982421875, 0.13132858276367188, 0.143829345703125, 0.15633010864257812, 0.16883087158203125, 0.18133163452148438, 0.1938323974609375, 0.20633316040039062, 0.21883392333984375, 0.23133468627929688, 0.24383544921875, 0.2563362121582031, 0.26883697509765625, 0.2813377380371094, 0.2938385009765625, 0.3063392639160156, 0.31884002685546875, 0.3313407897949219, 0.343841552734375, 0.3563423156738281, 0.36884307861328125, 0.3813438415527344, 0.3938446044921875, 0.4063453674316406, 0.41884613037109375, 0.4313468933105469, 0.44384765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 9.0, 15.0, 25.0, 53.0, 68.0, 86.0, 115.0, 143.0, 139.0, 109.0, 89.0, 50.0, 32.0, 21.0, 17.0, 6.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.999173164367676, -2.9131922721862793, -2.827211380004883, -2.7412302494049072, -2.6552493572235107, -2.5692684650421143, -2.4832873344421387, -2.397306442260742, -2.3113255500793457, -2.225344657897949, -2.1393637657165527, -2.053382635116577, -1.9674017429351807, -1.8814208507537842, -1.7954398393630981, -1.709458827972412, -1.6234779357910156, -1.5374970436096191, -1.451516032218933, -1.365535020828247, -1.2795541286468506, -1.193573236465454, -1.107592225074768, -1.021611213684082, -0.9356303215026855, -0.8496493697166443, -0.763668417930603, -0.6776874661445618, -0.5917065143585205, -0.5057255625724792, -0.419744610786438, -0.33376365900039673, -0.24778270721435547, -0.1618017554283142, -0.07582080364227295, 0.01016014814376831, 0.09614109992980957, 0.18212205171585083, 0.2681030035018921, 0.35408395528793335, 0.4400649070739746, 0.5260458588600159, 0.6120268106460571, 0.6980077624320984, 0.7839887142181396, 0.8699696660041809, 0.9559506177902222, 1.0419316291809082, 1.1279125213623047, 1.2138934135437012, 1.2998744249343872, 1.3858554363250732, 1.4718363285064697, 1.5578172206878662, 1.6437982320785522, 1.7297792434692383, 1.8157601356506348, 1.9017410278320312, 1.9877220392227173, 2.0737030506134033, 2.1596839427948, 2.2456648349761963, 2.331645965576172, 2.4176268577575684, 2.503607749938965]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 7.0, 6.0, 6.0, 11.0, 9.0, 15.0, 18.0, 9.0, 12.0, 20.0, 20.0, 26.0, 35.0, 21.0, 28.0, 31.0, 47.0, 46.0, 38.0, 41.0, 44.0, 45.0, 46.0, 60.0, 43.0, 49.0, 29.0, 25.0, 39.0, 30.0, 26.0, 26.0, 14.0, 18.0, 18.0, 9.0, 9.0, 5.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7047348022460938, -1.6578364372253418, -1.6109380722045898, -1.564039707183838, -1.5171414613723755, -1.4702430963516235, -1.4233447313308716, -1.3764463663101196, -1.3295480012893677, -1.2826496362686157, -1.2357512712478638, -1.1888530254364014, -1.1419546604156494, -1.0950562953948975, -1.0481579303741455, -1.0012595653533936, -0.9543612599372864, -0.9074628949165344, -0.8605645895004272, -0.8136662244796753, -0.7667678594589233, -0.7198694944381714, -0.6729711890220642, -0.6260728240013123, -0.5791745185852051, -0.5322761535644531, -0.48537781834602356, -0.438479483127594, -0.39158111810684204, -0.3446827828884125, -0.2977844476699829, -0.25088608264923096, -0.203987717628479, -0.15708936750888824, -0.11019102483987808, -0.06329268217086792, -0.01639433205127716, 0.0305040180683136, 0.07740235328674316, 0.12430071830749512, 0.17119905352592468, 0.21809740364551544, 0.2649957537651062, 0.31189408898353577, 0.35879242420196533, 0.4056907892227173, 0.45258912444114685, 0.4994874894618988, 0.5463858246803284, 0.5932841897010803, 0.6401824951171875, 0.6870808601379395, 0.7339792251586914, 0.7808775901794434, 0.8277758955955505, 0.8746742606163025, 0.9215725660324097, 0.9684709310531616, 1.0153692960739136, 1.062267541885376, 1.109165906906128, 1.1560642719268799, 1.2029626369476318, 1.2498610019683838, 1.2967593669891357]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 9.0, 14.0, 33.0, 45.0, 84.0, 139.0, 241.0, 447.0, 893.0, 1679.0, 3324.0, 6948.0, 14865.0, 35873.0, 96663.0, 235101.0, 321310.0, 199470.0, 77992.0, 29021.0, 12513.0, 5767.0, 2949.0, 1504.0, 777.0, 374.0, 227.0, 100.0, 70.0, 45.0, 18.0, 15.0, 16.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444091796875, -0.4289817810058594, -0.41387176513671875, -0.3987617492675781, -0.3836517333984375, -0.3685417175292969, -0.35343170166015625, -0.3383216857910156, -0.323211669921875, -0.3081016540527344, -0.29299163818359375, -0.2778816223144531, -0.2627716064453125, -0.24766159057617188, -0.23255157470703125, -0.21744155883789062, -0.20233154296875, -0.18722152709960938, -0.17211151123046875, -0.15700149536132812, -0.1418914794921875, -0.12678146362304688, -0.11167144775390625, -0.09656143188476562, -0.081451416015625, -0.06634140014648438, -0.05123138427734375, -0.036121368408203125, -0.0210113525390625, -0.005901336669921875, 0.00920867919921875, 0.024318695068359375, 0.0394287109375, 0.054538726806640625, 0.06964874267578125, 0.08475875854492188, 0.0998687744140625, 0.11497879028320312, 0.13008880615234375, 0.14519882202148438, 0.160308837890625, 0.17541885375976562, 0.19052886962890625, 0.20563888549804688, 0.2207489013671875, 0.23585891723632812, 0.25096893310546875, 0.2660789489746094, 0.28118896484375, 0.2962989807128906, 0.31140899658203125, 0.3265190124511719, 0.3416290283203125, 0.3567390441894531, 0.37184906005859375, 0.3869590759277344, 0.402069091796875, 0.4171791076660156, 0.43228912353515625, 0.4473991394042969, 0.4625091552734375, 0.4776191711425781, 0.49272918701171875, 0.5078392028808594, 0.52294921875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 3.0, 3.0, 8.0, 13.0, 12.0, 10.0, 10.0, 17.0, 14.0, 12.0, 24.0, 31.0, 30.0, 29.0, 31.0, 37.0, 33.0, 41.0, 36.0, 45.0, 43.0, 48.0, 41.0, 37.0, 54.0, 33.0, 37.0, 34.0, 28.0, 22.0, 24.0, 27.0, 18.0, 20.0, 16.0, 14.0, 8.0, 10.0, 11.0, 10.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.1758136749267578, -0.16937637329101562, -0.16293907165527344, -0.15650177001953125, -0.15006446838378906, -0.14362716674804688, -0.1371898651123047, -0.1307525634765625, -0.12431526184082031, -0.11787796020507812, -0.11144065856933594, -0.10500335693359375, -0.09856605529785156, -0.09212875366210938, -0.08569145202636719, -0.079254150390625, -0.07281684875488281, -0.06637954711914062, -0.05994224548339844, -0.05350494384765625, -0.04706764221191406, -0.040630340576171875, -0.03419303894042969, -0.0277557373046875, -0.021318435668945312, -0.014881134033203125, -0.008443832397460938, -0.00200653076171875, 0.0044307708740234375, 0.010868072509765625, 0.017305374145507812, 0.02374267578125, 0.030179977416992188, 0.036617279052734375, 0.04305458068847656, 0.04949188232421875, 0.05592918395996094, 0.062366485595703125, 0.06880378723144531, 0.0752410888671875, 0.08167839050292969, 0.08811569213867188, 0.09455299377441406, 0.10099029541015625, 0.10742759704589844, 0.11386489868164062, 0.12030220031738281, 0.126739501953125, 0.1331768035888672, 0.13961410522460938, 0.14605140686035156, 0.15248870849609375, 0.15892601013183594, 0.16536331176757812, 0.1718006134033203, 0.1782379150390625, 0.1846752166748047, 0.19111251831054688, 0.19754981994628906, 0.20398712158203125, 0.21042442321777344, 0.21686172485351562, 0.2232990264892578, 0.229736328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 8.0, 15.0, 8.0, 19.0, 31.0, 35.0, 75.0, 117.0, 227.0, 438.0, 1135.0, 3037.0, 9037.0, 29719.0, 124726.0, 434887.0, 334296.0, 79950.0, 20261.0, 6487.0, 2277.0, 863.0, 385.0, 191.0, 124.0, 71.0, 38.0, 35.0, 19.0, 9.0, 7.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80908203125, -0.784454345703125, -0.75982666015625, -0.735198974609375, -0.7105712890625, -0.685943603515625, -0.66131591796875, -0.636688232421875, -0.612060546875, -0.587432861328125, -0.56280517578125, -0.538177490234375, -0.5135498046875, -0.488922119140625, -0.46429443359375, -0.439666748046875, -0.4150390625, -0.390411376953125, -0.36578369140625, -0.341156005859375, -0.3165283203125, -0.291900634765625, -0.26727294921875, -0.242645263671875, -0.218017578125, -0.193389892578125, -0.16876220703125, -0.144134521484375, -0.1195068359375, -0.094879150390625, -0.07025146484375, -0.045623779296875, -0.02099609375, 0.003631591796875, 0.02825927734375, 0.052886962890625, 0.0775146484375, 0.102142333984375, 0.12677001953125, 0.151397705078125, 0.176025390625, 0.200653076171875, 0.22528076171875, 0.249908447265625, 0.2745361328125, 0.299163818359375, 0.32379150390625, 0.348419189453125, 0.373046875, 0.397674560546875, 0.42230224609375, 0.446929931640625, 0.4715576171875, 0.496185302734375, 0.52081298828125, 0.545440673828125, 0.570068359375, 0.594696044921875, 0.61932373046875, 0.643951416015625, 0.6685791015625, 0.693206787109375, 0.71783447265625, 0.742462158203125, 0.76708984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 10.0, 13.0, 7.0, 21.0, 18.0, 27.0, 24.0, 16.0, 33.0, 31.0, 24.0, 51.0, 48.0, 41.0, 46.0, 36.0, 49.0, 49.0, 43.0, 45.0, 45.0, 38.0, 37.0, 30.0, 36.0, 23.0, 16.0, 23.0, 20.0, 19.0, 16.0, 12.0, 10.0, 9.0, 3.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6669921875, -0.6449661254882812, -0.6229400634765625, -0.6009140014648438, -0.578887939453125, -0.5568618774414062, -0.5348358154296875, -0.5128097534179688, -0.49078369140625, -0.46875762939453125, -0.4467315673828125, -0.42470550537109375, -0.402679443359375, -0.38065338134765625, -0.3586273193359375, -0.33660125732421875, -0.3145751953125, -0.29254913330078125, -0.2705230712890625, -0.24849700927734375, -0.226470947265625, -0.20444488525390625, -0.1824188232421875, -0.16039276123046875, -0.13836669921875, -0.11634063720703125, -0.0943145751953125, -0.07228851318359375, -0.050262451171875, -0.02823638916015625, -0.0062103271484375, 0.01581573486328125, 0.037841796875, 0.05986785888671875, 0.0818939208984375, 0.10391998291015625, 0.125946044921875, 0.14797210693359375, 0.1699981689453125, 0.19202423095703125, 0.21405029296875, 0.23607635498046875, 0.2581024169921875, 0.28012847900390625, 0.302154541015625, 0.32418060302734375, 0.3462066650390625, 0.36823272705078125, 0.3902587890625, 0.41228485107421875, 0.4343109130859375, 0.45633697509765625, 0.478363037109375, 0.5003890991210938, 0.5224151611328125, 0.5444412231445312, 0.56646728515625, 0.5884933471679688, 0.6105194091796875, 0.6325454711914062, 0.654571533203125, 0.6765975952148438, 0.6986236572265625, 0.7206497192382812, 0.74267578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 14.0, 12.0, 25.0, 49.0, 71.0, 111.0, 167.0, 270.0, 492.0, 837.0, 1399.0, 2460.0, 4692.0, 9055.0, 18211.0, 43110.0, 111206.0, 253851.0, 309037.0, 172691.0, 67226.0, 26795.0, 12434.0, 6409.0, 3443.0, 1964.0, 988.0, 578.0, 338.0, 218.0, 122.0, 93.0, 52.0, 31.0, 33.0, 24.0, 8.0, 7.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1573486328125, -0.15261459350585938, -0.14788055419921875, -0.14314651489257812, -0.1384124755859375, -0.13367843627929688, -0.12894439697265625, -0.12421035766601562, -0.119476318359375, -0.11474227905273438, -0.11000823974609375, -0.10527420043945312, -0.1005401611328125, -0.09580612182617188, -0.09107208251953125, -0.08633804321289062, -0.08160400390625, -0.07686996459960938, -0.07213592529296875, -0.06740188598632812, -0.0626678466796875, -0.057933807373046875, -0.05319976806640625, -0.048465728759765625, -0.043731689453125, -0.038997650146484375, -0.03426361083984375, -0.029529571533203125, -0.0247955322265625, -0.020061492919921875, -0.01532745361328125, -0.010593414306640625, -0.005859375, -0.001125335693359375, 0.00360870361328125, 0.008342742919921875, 0.0130767822265625, 0.017810821533203125, 0.02254486083984375, 0.027278900146484375, 0.032012939453125, 0.036746978759765625, 0.04148101806640625, 0.046215057373046875, 0.0509490966796875, 0.055683135986328125, 0.06041717529296875, 0.06515121459960938, 0.06988525390625, 0.07461929321289062, 0.07935333251953125, 0.08408737182617188, 0.0888214111328125, 0.09355545043945312, 0.09828948974609375, 0.10302352905273438, 0.107757568359375, 0.11249160766601562, 0.11722564697265625, 0.12195968627929688, 0.1266937255859375, 0.13142776489257812, 0.13616180419921875, 0.14089584350585938, 0.1456298828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 6.0, 8.0, 9.0, 12.0, 19.0, 28.0, 34.0, 50.0, 67.0, 83.0, 104.0, 118.0, 97.0, 87.0, 70.0, 69.0, 34.0, 27.0, 21.0, 16.0, 5.0, 8.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.312131881713867e-05, -6.10649585723877e-05, -5.900859832763672e-05, -5.695223808288574e-05, -5.4895877838134766e-05, -5.283951759338379e-05, -5.078315734863281e-05, -4.8726797103881836e-05, -4.667043685913086e-05, -4.461407661437988e-05, -4.2557716369628906e-05, -4.050135612487793e-05, -3.844499588012695e-05, -3.6388635635375977e-05, -3.4332275390625e-05, -3.2275915145874023e-05, -3.0219554901123047e-05, -2.816319465637207e-05, -2.6106834411621094e-05, -2.4050474166870117e-05, -2.199411392211914e-05, -1.9937753677368164e-05, -1.7881393432617188e-05, -1.582503318786621e-05, -1.3768672943115234e-05, -1.1712312698364258e-05, -9.655952453613281e-06, -7.599592208862305e-06, -5.543231964111328e-06, -3.4868717193603516e-06, -1.430511474609375e-06, 6.258487701416016e-07, 2.682209014892578e-06, 4.738569259643555e-06, 6.794929504394531e-06, 8.851289749145508e-06, 1.0907649993896484e-05, 1.2964010238647461e-05, 1.5020370483398438e-05, 1.7076730728149414e-05, 1.913309097290039e-05, 2.1189451217651367e-05, 2.3245811462402344e-05, 2.530217170715332e-05, 2.7358531951904297e-05, 2.9414892196655273e-05, 3.147125244140625e-05, 3.3527612686157227e-05, 3.55839729309082e-05, 3.764033317565918e-05, 3.9696693420410156e-05, 4.175305366516113e-05, 4.380941390991211e-05, 4.5865774154663086e-05, 4.792213439941406e-05, 4.997849464416504e-05, 5.2034854888916016e-05, 5.409121513366699e-05, 5.614757537841797e-05, 5.8203935623168945e-05, 6.026029586791992e-05, 6.23166561126709e-05, 6.437301635742188e-05, 6.642937660217285e-05, 6.848573684692383e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 6.0, 8.0, 15.0, 16.0, 27.0, 41.0, 99.0, 132.0, 256.0, 442.0, 989.0, 2198.0, 5811.0, 16260.0, 49573.0, 149797.0, 327879.0, 303718.0, 127480.0, 41128.0, 13827.0, 4995.0, 1913.0, 880.0, 444.0, 247.0, 155.0, 67.0, 57.0, 32.0, 16.0, 12.0, 8.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.187255859375, -0.18156814575195312, -0.17588043212890625, -0.17019271850585938, -0.1645050048828125, -0.15881729125976562, -0.15312957763671875, -0.14744186401367188, -0.141754150390625, -0.13606643676757812, -0.13037872314453125, -0.12469100952148438, -0.1190032958984375, -0.11331558227539062, -0.10762786865234375, -0.10194015502929688, -0.09625244140625, -0.09056472778320312, -0.08487701416015625, -0.07918930053710938, -0.0735015869140625, -0.06781387329101562, -0.06212615966796875, -0.056438446044921875, -0.050750732421875, -0.045063018798828125, -0.03937530517578125, -0.033687591552734375, -0.0279998779296875, -0.022312164306640625, -0.01662445068359375, -0.010936737060546875, -0.0052490234375, 0.000438690185546875, 0.00612640380859375, 0.011814117431640625, 0.0175018310546875, 0.023189544677734375, 0.02887725830078125, 0.034564971923828125, 0.040252685546875, 0.045940399169921875, 0.05162811279296875, 0.057315826416015625, 0.0630035400390625, 0.06869125366210938, 0.07437896728515625, 0.08006668090820312, 0.08575439453125, 0.09144210815429688, 0.09712982177734375, 0.10281753540039062, 0.1085052490234375, 0.11419296264648438, 0.11988067626953125, 0.12556838989257812, 0.131256103515625, 0.13694381713867188, 0.14263153076171875, 0.14831924438476562, 0.1540069580078125, 0.15969467163085938, 0.16538238525390625, 0.17107009887695312, 0.1767578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 12.0, 14.0, 11.0, 16.0, 17.0, 36.0, 33.0, 33.0, 31.0, 46.0, 46.0, 43.0, 44.0, 68.0, 61.0, 65.0, 74.0, 64.0, 39.0, 35.0, 38.0, 32.0, 22.0, 21.0, 18.0, 13.0, 12.0, 13.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12562179565429688, -0.12062835693359375, -0.11563491821289062, -0.1106414794921875, -0.10564804077148438, -0.10065460205078125, -0.09566116333007812, -0.090667724609375, -0.08567428588867188, -0.08068084716796875, -0.07568740844726562, -0.0706939697265625, -0.06570053100585938, -0.06070709228515625, -0.055713653564453125, -0.05072021484375, -0.045726776123046875, -0.04073333740234375, -0.035739898681640625, -0.0307464599609375, -0.025753021240234375, -0.02075958251953125, -0.015766143798828125, -0.010772705078125, -0.005779266357421875, -0.00078582763671875, 0.004207611083984375, 0.0092010498046875, 0.014194488525390625, 0.01918792724609375, 0.024181365966796875, 0.0291748046875, 0.034168243408203125, 0.03916168212890625, 0.044155120849609375, 0.0491485595703125, 0.054141998291015625, 0.05913543701171875, 0.06412887573242188, 0.069122314453125, 0.07411575317382812, 0.07910919189453125, 0.08410263061523438, 0.0890960693359375, 0.09408950805664062, 0.09908294677734375, 0.10407638549804688, 0.10906982421875, 0.11406326293945312, 0.11905670166015625, 0.12405014038085938, 0.1290435791015625, 0.13403701782226562, 0.13903045654296875, 0.14402389526367188, 0.149017333984375, 0.15401077270507812, 0.15900421142578125, 0.16399765014648438, 0.1689910888671875, 0.17398452758789062, 0.17897796630859375, 0.18397140502929688, 0.18896484375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 0.0, 6.0, 9.0, 19.0, 31.0, 55.0, 75.0, 120.0, 153.0, 170.0, 140.0, 81.0, 63.0, 37.0, 17.0, 13.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9310479164123535, -2.8197879791259766, -2.7085282802581787, -2.5972683429718018, -2.486008644104004, -2.374748706817627, -2.26348876953125, -2.152229070663452, -2.0409693717956543, -1.929709553718567, -1.8184497356414795, -1.7071897983551025, -1.5959300994873047, -1.4846701622009277, -1.3734103441238403, -1.262150526046753, -1.150890588760376, -1.0396307706832886, -0.9283709526062012, -0.817111074924469, -0.7058512568473816, -0.5945914387702942, -0.483331561088562, -0.3720717430114746, -0.2608119249343872, -0.1495520919561386, -0.038292258977890015, 0.07296758890151978, 0.18422740697860718, 0.2954872250556946, 0.40674710273742676, 0.5180069208145142, 0.6292667388916016, 0.740526556968689, 0.8517863750457764, 0.9630462527275085, 1.0743060111999512, 1.1855659484863281, 1.2968257665634155, 1.408085584640503, 1.5193454027175903, 1.6306052207946777, 1.7418650388717651, 1.8531248569488525, 1.9643847942352295, 2.0756444931030273, 2.1869044303894043, 2.2981643676757812, 2.409424066543579, 2.520684003829956, 2.631943702697754, 2.743203639984131, 2.8544633388519287, 2.9657232761383057, 3.0769829750061035, 3.1882429122924805, 3.2995028495788574, 3.4107627868652344, 3.5220224857330322, 3.633282423019409, 3.744542121887207, 3.855802059173584, 3.967061996459961, 4.07832145690918, 4.189581394195557]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 11.0, 10.0, 17.0, 17.0, 13.0, 19.0, 21.0, 27.0, 24.0, 27.0, 32.0, 28.0, 32.0, 34.0, 34.0, 41.0, 44.0, 39.0, 44.0, 38.0, 35.0, 41.0, 46.0, 44.0, 24.0, 31.0, 37.0, 35.0, 16.0, 26.0, 15.0, 14.0, 16.0, 10.0, 13.0, 8.0, 10.0, 2.0, 9.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0], "bins": [-1.9154976606369019, -1.8640453815460205, -1.8125929832458496, -1.7611405849456787, -1.7096883058547974, -1.658236026763916, -1.6067836284637451, -1.5553312301635742, -1.5038789510726929, -1.4524266719818115, -1.4009742736816406, -1.3495218753814697, -1.2980695962905884, -1.246617317199707, -1.1951649188995361, -1.1437125205993652, -1.0922602415084839, -1.0408079624176025, -0.9893555641174316, -0.9379032254219055, -0.8864508867263794, -0.8349985480308533, -0.7835462093353271, -0.732093870639801, -0.6806415319442749, -0.6291891932487488, -0.5777368545532227, -0.5262845158576965, -0.4748321771621704, -0.4233798384666443, -0.37192749977111816, -0.32047516107559204, -0.26902270317077637, -0.21757036447525024, -0.16611802577972412, -0.114665687084198, -0.06321334838867188, -0.011761009693145752, 0.03969132900238037, 0.0911436676979065, 0.14259600639343262, 0.19404834508895874, 0.24550068378448486, 0.296953022480011, 0.3484053611755371, 0.39985769987106323, 0.45131003856658936, 0.5027623772621155, 0.5542147159576416, 0.6056670546531677, 0.6571193933486938, 0.70857173204422, 0.7600240707397461, 0.8114764094352722, 0.8629287481307983, 0.9143810868263245, 0.9658334255218506, 1.0172858238220215, 1.0687381029129028, 1.1201903820037842, 1.171642780303955, 1.223095178604126, 1.2745474576950073, 1.3259997367858887, 1.3774521350860596]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 10.0, 19.0, 16.0, 34.0, 42.0, 71.0, 126.0, 158.0, 231.0, 432.0, 711.0, 1213.0, 2031.0, 3451.0, 6076.0, 11007.0, 21756.0, 43937.0, 96380.0, 221005.0, 501852.0, 989783.0, 1135452.0, 645504.0, 285541.0, 119807.0, 53043.0, 25284.0, 13088.0, 6781.0, 3847.0, 2141.0, 1265.0, 825.0, 500.0, 286.0, 200.0, 136.0, 80.0, 56.0, 33.0, 21.0, 23.0, 9.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1776123046875, -0.17130088806152344, -0.16498947143554688, -0.1586780548095703, -0.15236663818359375, -0.1460552215576172, -0.13974380493164062, -0.13343238830566406, -0.1271209716796875, -0.12080955505371094, -0.11449813842773438, -0.10818672180175781, -0.10187530517578125, -0.09556388854980469, -0.08925247192382812, -0.08294105529785156, -0.076629638671875, -0.07031822204589844, -0.06400680541992188, -0.05769538879394531, -0.05138397216796875, -0.04507255554199219, -0.038761138916015625, -0.03244972229003906, -0.0261383056640625, -0.019826889038085938, -0.013515472412109375, -0.0072040557861328125, -0.00089263916015625, 0.0054187774658203125, 0.011730194091796875, 0.018041610717773438, 0.02435302734375, 0.030664443969726562, 0.036975860595703125, 0.04328727722167969, 0.04959869384765625, 0.05591011047363281, 0.062221527099609375, 0.06853294372558594, 0.0748443603515625, 0.08115577697753906, 0.08746719360351562, 0.09377861022949219, 0.10009002685546875, 0.10640144348144531, 0.11271286010742188, 0.11902427673339844, 0.125335693359375, 0.13164710998535156, 0.13795852661132812, 0.1442699432373047, 0.15058135986328125, 0.1568927764892578, 0.16320419311523438, 0.16951560974121094, 0.1758270263671875, 0.18213844299316406, 0.18844985961914062, 0.1947612762451172, 0.20107269287109375, 0.2073841094970703, 0.21369552612304688, 0.22000694274902344, 0.226318359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 14.0, 13.0, 5.0, 11.0, 24.0, 20.0, 21.0, 18.0, 24.0, 20.0, 32.0, 35.0, 40.0, 38.0, 50.0, 42.0, 48.0, 47.0, 43.0, 36.0, 38.0, 38.0, 37.0, 39.0, 23.0, 30.0, 26.0, 23.0, 22.0, 18.0, 18.0, 14.0, 7.0, 12.0, 11.0, 6.0, 6.0, 10.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1881103515625, -0.18162155151367188, -0.17513275146484375, -0.16864395141601562, -0.1621551513671875, -0.15566635131835938, -0.14917755126953125, -0.14268875122070312, -0.136199951171875, -0.12971115112304688, -0.12322235107421875, -0.11673355102539062, -0.1102447509765625, -0.10375595092773438, -0.09726715087890625, -0.09077835083007812, -0.08428955078125, -0.07780075073242188, -0.07131195068359375, -0.06482315063476562, -0.0583343505859375, -0.051845550537109375, -0.04535675048828125, -0.038867950439453125, -0.032379150390625, -0.025890350341796875, -0.01940155029296875, -0.012912750244140625, -0.0064239501953125, 6.4849853515625e-05, 0.00655364990234375, 0.013042449951171875, 0.01953125, 0.026020050048828125, 0.03250885009765625, 0.038997650146484375, 0.0454864501953125, 0.051975250244140625, 0.05846405029296875, 0.06495285034179688, 0.071441650390625, 0.07793045043945312, 0.08441925048828125, 0.09090805053710938, 0.0973968505859375, 0.10388565063476562, 0.11037445068359375, 0.11686325073242188, 0.12335205078125, 0.12984085083007812, 0.13632965087890625, 0.14281845092773438, 0.1493072509765625, 0.15579605102539062, 0.16228485107421875, 0.16877365112304688, 0.175262451171875, 0.18175125122070312, 0.18824005126953125, 0.19472885131835938, 0.2012176513671875, 0.20770645141601562, 0.21419525146484375, 0.22068405151367188, 0.2271728515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 2.0, 10.0, 10.0, 17.0, 33.0, 48.0, 69.0, 131.0, 249.0, 436.0, 968.0, 2332.0, 6455.0, 20357.0, 80436.0, 421312.0, 2449237.0, 1000042.0, 159054.0, 36237.0, 10414.0, 3677.0, 1414.0, 616.0, 293.0, 197.0, 87.0, 60.0, 34.0, 21.0, 13.0, 6.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3900489807128906, -0.37360382080078125, -0.3571586608886719, -0.3407135009765625, -0.3242683410644531, -0.30782318115234375, -0.2913780212402344, -0.274932861328125, -0.2584877014160156, -0.24204254150390625, -0.22559738159179688, -0.2091522216796875, -0.19270706176757812, -0.17626190185546875, -0.15981674194335938, -0.14337158203125, -0.12692642211914062, -0.11048126220703125, -0.09403610229492188, -0.0775909423828125, -0.061145782470703125, -0.04470062255859375, -0.028255462646484375, -0.011810302734375, 0.004634857177734375, 0.02108001708984375, 0.037525177001953125, 0.0539703369140625, 0.07041549682617188, 0.08686065673828125, 0.10330581665039062, 0.1197509765625, 0.13619613647460938, 0.15264129638671875, 0.16908645629882812, 0.1855316162109375, 0.20197677612304688, 0.21842193603515625, 0.23486709594726562, 0.251312255859375, 0.2677574157714844, 0.28420257568359375, 0.3006477355957031, 0.3170928955078125, 0.3335380554199219, 0.34998321533203125, 0.3664283752441406, 0.38287353515625, 0.3993186950683594, 0.41576385498046875, 0.4322090148925781, 0.4486541748046875, 0.4650993347167969, 0.48154449462890625, 0.4979896545410156, 0.514434814453125, 0.5308799743652344, 0.5473251342773438, 0.5637702941894531, 0.5802154541015625, 0.5966606140136719, 0.6131057739257812, 0.6295509338378906, 0.64599609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 7.0, 12.0, 15.0, 23.0, 34.0, 43.0, 74.0, 109.0, 133.0, 277.0, 408.0, 610.0, 696.0, 519.0, 388.0, 223.0, 168.0, 113.0, 74.0, 51.0, 28.0, 22.0, 17.0, 16.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3515625, -0.33330535888671875, -0.3150482177734375, -0.29679107666015625, -0.278533935546875, -0.26027679443359375, -0.2420196533203125, -0.22376251220703125, -0.20550537109375, -0.18724822998046875, -0.1689910888671875, -0.15073394775390625, -0.132476806640625, -0.11421966552734375, -0.0959625244140625, -0.07770538330078125, -0.0594482421875, -0.04119110107421875, -0.0229339599609375, -0.00467681884765625, 0.013580322265625, 0.03183746337890625, 0.0500946044921875, 0.06835174560546875, 0.08660888671875, 0.10486602783203125, 0.1231231689453125, 0.14138031005859375, 0.159637451171875, 0.17789459228515625, 0.1961517333984375, 0.21440887451171875, 0.232666015625, 0.25092315673828125, 0.2691802978515625, 0.28743743896484375, 0.305694580078125, 0.32395172119140625, 0.3422088623046875, 0.36046600341796875, 0.37872314453125, 0.39698028564453125, 0.4152374267578125, 0.43349456787109375, 0.451751708984375, 0.47000885009765625, 0.4882659912109375, 0.5065231323242188, 0.5247802734375, 0.5430374145507812, 0.5612945556640625, 0.5795516967773438, 0.597808837890625, 0.6160659790039062, 0.6343231201171875, 0.6525802612304688, 0.67083740234375, 0.6890945434570312, 0.7073516845703125, 0.7256088256835938, 0.743865966796875, 0.7621231079101562, 0.7803802490234375, 0.7986373901367188, 0.81689453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 7.0, 33.0, 83.0, 179.0, 297.0, 211.0, 121.0, 43.0, 15.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.668066024780273, -6.467572212219238, -6.267077922821045, -6.06658411026001, -5.866089820861816, -5.665596008300781, -5.465102195739746, -5.264607906341553, -5.064113616943359, -4.863619804382324, -4.663125514984131, -4.462631702423096, -4.262137413024902, -4.061643600463867, -3.861149549484253, -3.6606554985046387, -3.4601616859436035, -3.2596676349639893, -3.059173583984375, -2.85867977142334, -2.6581854820251465, -2.4576916694641113, -2.257197618484497, -2.056703567504883, -1.8562095165252686, -1.6557154655456543, -1.45522141456604, -1.2547274827957153, -1.054233431816101, -0.8537393808364868, -0.6532454490661621, -0.45275139808654785, -0.2522573471069336, -0.051763325929641724, 0.14873069524765015, 0.34922468662261963, 0.5497187376022339, 0.7502127885818481, 0.9507067203521729, 1.151200771331787, 1.3516948223114014, 1.5521888732910156, 1.7526829242706299, 1.9531768560409546, 2.1536707878112793, 2.3541650772094727, 2.554658889770508, 2.755152940750122, 2.9556469917297363, 3.1561410427093506, 3.356635093688965, 3.55712890625, 3.7576231956481934, 3.9581170082092285, 4.158611297607422, 4.359105110168457, 4.559598922729492, 4.760092735290527, 4.960587024688721, 5.161080837249756, 5.361575126647949, 5.562068939208984, 5.7625627517700195, 5.963057041168213, 6.163551330566406]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 4.0, 3.0, 8.0, 7.0, 6.0, 10.0, 10.0, 13.0, 16.0, 18.0, 18.0, 28.0, 22.0, 34.0, 33.0, 22.0, 28.0, 35.0, 43.0, 41.0, 40.0, 33.0, 45.0, 40.0, 41.0, 43.0, 36.0, 39.0, 32.0, 24.0, 24.0, 21.0, 29.0, 26.0, 19.0, 17.0, 11.0, 17.0, 11.0, 13.0, 9.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0], "bins": [-1.6624239683151245, -1.6147022247314453, -1.5669806003570557, -1.5192588567733765, -1.4715372323989868, -1.4238154888153076, -1.376093864440918, -1.3283721208572388, -1.2806503772735596, -1.2329286336898804, -1.1852070093154907, -1.1374852657318115, -1.0897636413574219, -1.0420418977737427, -0.9943202137947083, -0.9465985298156738, -0.8988768458366394, -0.851155161857605, -0.8034334778785706, -0.7557117938995361, -0.7079900503158569, -0.6602683663368225, -0.6125466823577881, -0.5648249387741089, -0.5171033143997192, -0.4693816304206848, -0.421659916639328, -0.3739382326602936, -0.32621651887893677, -0.27849483489990234, -0.23077315092086792, -0.1830514371395111, -0.1353297233581543, -0.08760802447795868, -0.03988633304834366, 0.007835358381271362, 0.05555705726146698, 0.1032787561416626, 0.15100044012069702, 0.19872215390205383, 0.24644383788108826, 0.2941655218601227, 0.3418872356414795, 0.3896089196205139, 0.43733060359954834, 0.48505231738090515, 0.5327739715576172, 0.5804957151412964, 0.6282173991203308, 0.6759390830993652, 0.7236607670783997, 0.7713824510574341, 0.8191041946411133, 0.8668258786201477, 0.9145475625991821, 0.9622693061828613, 1.009990930557251, 1.0577126741409302, 1.1054342985153198, 1.153156042098999, 1.2008776664733887, 1.2485994100570679, 1.296321153640747, 1.3440427780151367, 1.391764521598816]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 5.0, 10.0, 26.0, 16.0, 26.0, 40.0, 73.0, 80.0, 122.0, 234.0, 377.0, 584.0, 1002.0, 1875.0, 3620.0, 7460.0, 16431.0, 39754.0, 95109.0, 194353.0, 268755.0, 217967.0, 113809.0, 48890.0, 19918.0, 8714.0, 4076.0, 2186.0, 1171.0, 731.0, 415.0, 250.0, 153.0, 111.0, 73.0, 37.0, 23.0, 21.0, 19.0, 14.0, 11.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.397216796875, -0.38465118408203125, -0.3720855712890625, -0.35951995849609375, -0.346954345703125, -0.33438873291015625, -0.3218231201171875, -0.30925750732421875, -0.29669189453125, -0.28412628173828125, -0.2715606689453125, -0.25899505615234375, -0.246429443359375, -0.23386383056640625, -0.2212982177734375, -0.20873260498046875, -0.1961669921875, -0.18360137939453125, -0.1710357666015625, -0.15847015380859375, -0.145904541015625, -0.13333892822265625, -0.1207733154296875, -0.10820770263671875, -0.09564208984375, -0.08307647705078125, -0.0705108642578125, -0.05794525146484375, -0.045379638671875, -0.03281402587890625, -0.0202484130859375, -0.00768280029296875, 0.0048828125, 0.01744842529296875, 0.0300140380859375, 0.04257965087890625, 0.055145263671875, 0.06771087646484375, 0.0802764892578125, 0.09284210205078125, 0.10540771484375, 0.11797332763671875, 0.1305389404296875, 0.14310455322265625, 0.155670166015625, 0.16823577880859375, 0.1808013916015625, 0.19336700439453125, 0.2059326171875, 0.21849822998046875, 0.2310638427734375, 0.24362945556640625, 0.256195068359375, 0.26876068115234375, 0.2813262939453125, 0.29389190673828125, 0.30645751953125, 0.31902313232421875, 0.3315887451171875, 0.34415435791015625, 0.356719970703125, 0.36928558349609375, 0.3818511962890625, 0.39441680908203125, 0.406982421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 7.0, 13.0, 8.0, 17.0, 14.0, 19.0, 22.0, 23.0, 32.0, 25.0, 38.0, 37.0, 53.0, 30.0, 34.0, 33.0, 39.0, 39.0, 43.0, 41.0, 47.0, 47.0, 42.0, 33.0, 38.0, 34.0, 24.0, 27.0, 22.0, 20.0, 16.0, 11.0, 14.0, 9.0, 9.0, 7.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2294921875, -0.22152328491210938, -0.21355438232421875, -0.20558547973632812, -0.1976165771484375, -0.18964767456054688, -0.18167877197265625, -0.17370986938476562, -0.165740966796875, -0.15777206420898438, -0.14980316162109375, -0.14183425903320312, -0.1338653564453125, -0.12589645385742188, -0.11792755126953125, -0.10995864868164062, -0.10198974609375, -0.09402084350585938, -0.08605194091796875, -0.07808303833007812, -0.0701141357421875, -0.062145233154296875, -0.05417633056640625, -0.046207427978515625, -0.038238525390625, -0.030269622802734375, -0.02230072021484375, -0.014331817626953125, -0.0063629150390625, 0.001605987548828125, 0.00957489013671875, 0.017543792724609375, 0.0255126953125, 0.033481597900390625, 0.04145050048828125, 0.049419403076171875, 0.0573883056640625, 0.06535720825195312, 0.07332611083984375, 0.08129501342773438, 0.089263916015625, 0.09723281860351562, 0.10520172119140625, 0.11317062377929688, 0.1211395263671875, 0.12910842895507812, 0.13707733154296875, 0.14504623413085938, 0.15301513671875, 0.16098403930664062, 0.16895294189453125, 0.17692184448242188, 0.1848907470703125, 0.19285964965820312, 0.20082855224609375, 0.20879745483398438, 0.216766357421875, 0.22473526000976562, 0.23270416259765625, 0.24067306518554688, 0.2486419677734375, 0.2566108703613281, 0.26457977294921875, 0.2725486755371094, 0.280517578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 13.0, 22.0, 43.0, 52.0, 104.0, 164.0, 327.0, 666.0, 1192.0, 2603.0, 5693.0, 13766.0, 38079.0, 111645.0, 280261.0, 337954.0, 164645.0, 56356.0, 20058.0, 8064.0, 3580.0, 1578.0, 764.0, 377.0, 226.0, 137.0, 74.0, 26.0, 18.0, 16.0, 15.0, 10.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.5810546875, -0.5654296875, -0.5498046875, -0.5341796875, -0.5185546875, -0.5029296875, -0.4873046875, -0.4716796875, -0.4560546875, -0.4404296875, -0.4248046875, -0.4091796875, -0.3935546875, -0.3779296875, -0.3623046875, -0.3466796875, -0.3310546875, -0.3154296875, -0.2998046875, -0.2841796875, -0.2685546875, -0.2529296875, -0.2373046875, -0.2216796875, -0.2060546875, -0.1904296875, -0.1748046875, -0.1591796875, -0.1435546875, -0.1279296875, -0.1123046875, -0.0966796875, -0.0810546875, -0.0654296875, -0.0498046875, -0.0341796875, -0.0185546875, -0.0029296875, 0.0126953125, 0.0283203125, 0.0439453125, 0.0595703125, 0.0751953125, 0.0908203125, 0.1064453125, 0.1220703125, 0.1376953125, 0.1533203125, 0.1689453125, 0.1845703125, 0.2001953125, 0.2158203125, 0.2314453125, 0.2470703125, 0.2626953125, 0.2783203125, 0.2939453125, 0.3095703125, 0.3251953125, 0.3408203125, 0.3564453125, 0.3720703125, 0.3876953125, 0.4033203125, 0.4189453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 10.0, 11.0, 14.0, 13.0, 9.0, 17.0, 17.0, 22.0, 22.0, 23.0, 31.0, 48.0, 47.0, 56.0, 49.0, 46.0, 45.0, 41.0, 46.0, 61.0, 39.0, 43.0, 36.0, 34.0, 35.0, 41.0, 19.0, 21.0, 17.0, 16.0, 15.0, 8.0, 8.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69091796875, -0.6678314208984375, -0.644744873046875, -0.6216583251953125, -0.59857177734375, -0.5754852294921875, -0.552398681640625, -0.5293121337890625, -0.5062255859375, -0.4831390380859375, -0.460052490234375, -0.4369659423828125, -0.41387939453125, -0.3907928466796875, -0.367706298828125, -0.3446197509765625, -0.321533203125, -0.2984466552734375, -0.275360107421875, -0.2522735595703125, -0.22918701171875, -0.2061004638671875, -0.183013916015625, -0.1599273681640625, -0.1368408203125, -0.1137542724609375, -0.090667724609375, -0.0675811767578125, -0.04449462890625, -0.0214080810546875, 0.001678466796875, 0.0247650146484375, 0.0478515625, 0.0709381103515625, 0.094024658203125, 0.1171112060546875, 0.14019775390625, 0.1632843017578125, 0.186370849609375, 0.2094573974609375, 0.2325439453125, 0.2556304931640625, 0.278717041015625, 0.3018035888671875, 0.32489013671875, 0.3479766845703125, 0.371063232421875, 0.3941497802734375, 0.417236328125, 0.4403228759765625, 0.463409423828125, 0.4864959716796875, 0.50958251953125, 0.5326690673828125, 0.555755615234375, 0.5788421630859375, 0.6019287109375, 0.6250152587890625, 0.648101806640625, 0.6711883544921875, 0.69427490234375, 0.7173614501953125, 0.740447998046875, 0.7635345458984375, 0.78662109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 16.0, 28.0, 59.0, 107.0, 161.0, 363.0, 787.0, 1724.0, 4557.0, 11837.0, 32471.0, 88906.0, 213075.0, 320852.0, 222534.0, 95113.0, 34913.0, 12619.0, 4830.0, 1985.0, 862.0, 363.0, 155.0, 90.0, 53.0, 39.0, 14.0, 3.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10772705078125, -0.1036672592163086, -0.09960746765136719, -0.09554767608642578, -0.09148788452148438, -0.08742809295654297, -0.08336830139160156, -0.07930850982666016, -0.07524871826171875, -0.07118892669677734, -0.06712913513183594, -0.06306934356689453, -0.059009552001953125, -0.05494976043701172, -0.05088996887207031, -0.046830177307128906, -0.0427703857421875, -0.038710594177246094, -0.03465080261230469, -0.03059101104736328, -0.026531219482421875, -0.02247142791748047, -0.018411636352539062, -0.014351844787597656, -0.01029205322265625, -0.006232261657714844, -0.0021724700927734375, 0.0018873214721679688, 0.005947113037109375, 0.010006904602050781, 0.014066696166992188, 0.018126487731933594, 0.022186279296875, 0.026246070861816406, 0.030305862426757812, 0.03436565399169922, 0.038425445556640625, 0.04248523712158203, 0.04654502868652344, 0.050604820251464844, 0.05466461181640625, 0.058724403381347656, 0.06278419494628906, 0.06684398651123047, 0.07090377807617188, 0.07496356964111328, 0.07902336120605469, 0.0830831527709961, 0.0871429443359375, 0.0912027359008789, 0.09526252746582031, 0.09932231903076172, 0.10338211059570312, 0.10744190216064453, 0.11150169372558594, 0.11556148529052734, 0.11962127685546875, 0.12368106842041016, 0.12774085998535156, 0.13180065155029297, 0.13586044311523438, 0.13992023468017578, 0.1439800262451172, 0.1480398178100586, 0.152099609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 7.0, 4.0, 5.0, 14.0, 18.0, 26.0, 28.0, 41.0, 37.0, 49.0, 66.0, 69.0, 89.0, 75.0, 72.0, 71.0, 55.0, 47.0, 50.0, 35.0, 39.0, 24.0, 16.0, 12.0, 7.0, 4.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.2928924560546875e-05, -5.1480717957019806e-05, -5.003251135349274e-05, -4.858430474996567e-05, -4.71360981464386e-05, -4.568789154291153e-05, -4.423968493938446e-05, -4.279147833585739e-05, -4.134327173233032e-05, -3.989506512880325e-05, -3.8446858525276184e-05, -3.6998651921749115e-05, -3.5550445318222046e-05, -3.410223871469498e-05, -3.265403211116791e-05, -3.120582550764084e-05, -2.975761890411377e-05, -2.83094123005867e-05, -2.686120569705963e-05, -2.5412999093532562e-05, -2.3964792490005493e-05, -2.2516585886478424e-05, -2.1068379282951355e-05, -1.9620172679424286e-05, -1.8171966075897217e-05, -1.6723759472370148e-05, -1.527555286884308e-05, -1.382734626531601e-05, -1.237913966178894e-05, -1.0930933058261871e-05, -9.482726454734802e-06, -8.034519851207733e-06, -6.586313247680664e-06, -5.138106644153595e-06, -3.689900040626526e-06, -2.2416934370994568e-06, -7.934868335723877e-07, 6.547197699546814e-07, 2.1029263734817505e-06, 3.5511329770088196e-06, 4.999339580535889e-06, 6.447546184062958e-06, 7.895752787590027e-06, 9.343959391117096e-06, 1.0792165994644165e-05, 1.2240372598171234e-05, 1.3688579201698303e-05, 1.5136785805225372e-05, 1.658499240875244e-05, 1.803319901227951e-05, 1.948140561580658e-05, 2.092961221933365e-05, 2.2377818822860718e-05, 2.3826025426387787e-05, 2.5274232029914856e-05, 2.6722438633441925e-05, 2.8170645236968994e-05, 2.9618851840496063e-05, 3.106705844402313e-05, 3.25152650475502e-05, 3.396347165107727e-05, 3.541167825460434e-05, 3.685988485813141e-05, 3.830809146165848e-05, 3.975629806518555e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 3.0, 14.0, 11.0, 13.0, 43.0, 58.0, 75.0, 113.0, 181.0, 323.0, 604.0, 1028.0, 2024.0, 4187.0, 9307.0, 21142.0, 49221.0, 109415.0, 204692.0, 263349.0, 197124.0, 103052.0, 45832.0, 19797.0, 8690.0, 3989.0, 1918.0, 996.0, 531.0, 306.0, 206.0, 88.0, 71.0, 52.0, 32.0, 18.0, 9.0, 12.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.12481689453125, -0.12129688262939453, -0.11777687072753906, -0.1142568588256836, -0.11073684692382812, -0.10721683502197266, -0.10369682312011719, -0.10017681121826172, -0.09665679931640625, -0.09313678741455078, -0.08961677551269531, -0.08609676361083984, -0.08257675170898438, -0.0790567398071289, -0.07553672790527344, -0.07201671600341797, -0.0684967041015625, -0.06497669219970703, -0.06145668029785156, -0.057936668395996094, -0.054416656494140625, -0.050896644592285156, -0.04737663269042969, -0.04385662078857422, -0.04033660888671875, -0.03681659698486328, -0.03329658508300781, -0.029776573181152344, -0.026256561279296875, -0.022736549377441406, -0.019216537475585938, -0.01569652557373047, -0.012176513671875, -0.008656501770019531, -0.0051364898681640625, -0.0016164779663085938, 0.001903533935546875, 0.005423545837402344, 0.008943557739257812, 0.012463569641113281, 0.01598358154296875, 0.01950359344482422, 0.023023605346679688, 0.026543617248535156, 0.030063629150390625, 0.033583641052246094, 0.03710365295410156, 0.04062366485595703, 0.0441436767578125, 0.04766368865966797, 0.05118370056152344, 0.054703712463378906, 0.058223724365234375, 0.061743736267089844, 0.06526374816894531, 0.06878376007080078, 0.07230377197265625, 0.07582378387451172, 0.07934379577636719, 0.08286380767822266, 0.08638381958007812, 0.0899038314819336, 0.09342384338378906, 0.09694385528564453, 0.1004638671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 1.0, 10.0, 7.0, 13.0, 11.0, 12.0, 14.0, 17.0, 26.0, 32.0, 28.0, 46.0, 43.0, 46.0, 54.0, 65.0, 63.0, 47.0, 57.0, 51.0, 53.0, 40.0, 39.0, 41.0, 44.0, 30.0, 20.0, 20.0, 16.0, 15.0, 12.0, 8.0, 7.0, 9.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14590072631835938, -0.14153289794921875, -0.13716506958007812, -0.1327972412109375, -0.12842941284179688, -0.12406158447265625, -0.11969375610351562, -0.115325927734375, -0.11095809936523438, -0.10659027099609375, -0.10222244262695312, -0.0978546142578125, -0.09348678588867188, -0.08911895751953125, -0.08475112915039062, -0.08038330078125, -0.07601547241210938, -0.07164764404296875, -0.06727981567382812, -0.0629119873046875, -0.058544158935546875, -0.05417633056640625, -0.049808502197265625, -0.045440673828125, -0.041072845458984375, -0.03670501708984375, -0.032337188720703125, -0.0279693603515625, -0.023601531982421875, -0.01923370361328125, -0.014865875244140625, -0.010498046875, -0.006130218505859375, -0.00176239013671875, 0.002605438232421875, 0.0069732666015625, 0.011341094970703125, 0.01570892333984375, 0.020076751708984375, 0.024444580078125, 0.028812408447265625, 0.03318023681640625, 0.037548065185546875, 0.0419158935546875, 0.046283721923828125, 0.05065155029296875, 0.055019378662109375, 0.05938720703125, 0.06375503540039062, 0.06812286376953125, 0.07249069213867188, 0.0768585205078125, 0.08122634887695312, 0.08559417724609375, 0.08996200561523438, 0.094329833984375, 0.09869766235351562, 0.10306549072265625, 0.10743331909179688, 0.1118011474609375, 0.11616897583007812, 0.12053680419921875, 0.12490463256835938, 0.1292724609375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 8.0, 5.0, 5.0, 27.0, 35.0, 38.0, 74.0, 94.0, 146.0, 145.0, 156.0, 97.0, 65.0, 46.0, 28.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0944294929504395, -1.9904919862747192, -1.8865545988082886, -1.7826170921325684, -1.6786795854568481, -1.574742078781128, -1.4708046913146973, -1.366867184638977, -1.2629296779632568, -1.1589921712875366, -1.055054783821106, -0.9511172771453857, -0.8471797704696655, -0.7432423233985901, -0.6393048763275146, -0.5353673696517944, -0.43142998218536377, -0.32749250531196594, -0.2235550433397293, -0.11961758136749268, -0.01568010449409485, 0.08825737237930298, 0.19219481945037842, 0.29613232612609863, 0.4000697731971741, 0.5040072202682495, 0.6079447269439697, 0.7118821740150452, 0.8158196210861206, 0.9197571277618408, 1.0236945152282715, 1.1276321411132812, 1.231569528579712, 1.3355070352554321, 1.4394444227218628, 1.543381929397583, 1.6473194360733032, 1.7512569427490234, 1.855194330215454, 1.9591318368911743, 2.0630693435668945, 2.167006731033325, 2.270944356918335, 2.3748817443847656, 2.4788191318511963, 2.582756757736206, 2.6866941452026367, 2.7906317710876465, 2.894568920135498, 2.9985063076019287, 3.1024439334869385, 3.206381320953369, 3.3103187084198, 3.4142563343048096, 3.5181937217712402, 3.62213134765625, 3.7260687351226807, 3.8300061225891113, 3.933943748474121, 4.037880897521973, 4.141818523406982, 4.245756149291992, 4.349693298339844, 4.4536309242248535, 4.557568550109863]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 11.0, 13.0, 7.0, 4.0, 14.0, 11.0, 13.0, 17.0, 10.0, 19.0, 23.0, 24.0, 23.0, 22.0, 22.0, 30.0, 35.0, 29.0, 37.0, 46.0, 24.0, 44.0, 40.0, 46.0, 31.0, 37.0, 33.0, 40.0, 40.0, 27.0, 31.0, 28.0, 25.0, 21.0, 19.0, 12.0, 13.0, 15.0, 14.0, 10.0, 12.0, 7.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7009193897247314, -1.646073341369629, -1.5912272930145264, -1.5363812446594238, -1.4815351963043213, -1.4266891479492188, -1.3718432188034058, -1.3169971704483032, -1.2621511220932007, -1.2073050737380981, -1.1524590253829956, -1.097612977027893, -1.04276704788208, -0.9879209399223328, -0.933074951171875, -0.8782289028167725, -0.8233828544616699, -0.7685368061065674, -0.7136907577514648, -0.6588447690010071, -0.6039987206459045, -0.549152672290802, -0.49430665373802185, -0.4394606351852417, -0.38461458683013916, -0.3297685384750366, -0.27492251992225647, -0.22007648646831512, -0.16523045301437378, -0.11038440465927124, -0.05553838610649109, -0.0006923675537109375, 0.05415356159210205, 0.1089995950460434, 0.16384562849998474, 0.2186916619539261, 0.27353769540786743, 0.32838374376296997, 0.3832297623157501, 0.4380757808685303, 0.4929218292236328, 0.5477678775787354, 0.6026139259338379, 0.6574599146842957, 0.7123059630393982, 0.7671520113945007, 0.8219980001449585, 0.876844048500061, 0.9316900968551636, 0.9865361452102661, 1.0413821935653687, 1.0962282419204712, 1.1510741710662842, 1.2059202194213867, 1.2607662677764893, 1.3156123161315918, 1.3704583644866943, 1.4253044128417969, 1.4801504611968994, 1.534996509552002, 1.5898425579071045, 1.644688606262207, 1.69953453540802, 1.7543805837631226, 1.809226632118225]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 26.0, 23.0, 52.0, 79.0, 160.0, 275.0, 435.0, 782.0, 1383.0, 2545.0, 4511.0, 8838.0, 18549.0, 43714.0, 116084.0, 356995.0, 1063370.0, 1566267.0, 674976.0, 208242.0, 71182.0, 28629.0, 12887.0, 6535.0, 3357.0, 1892.0, 1041.0, 596.0, 338.0, 197.0, 131.0, 74.0, 42.0, 22.0, 20.0, 5.0, 7.0, 8.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22412109375, -0.21488571166992188, -0.20565032958984375, -0.19641494750976562, -0.1871795654296875, -0.17794418334960938, -0.16870880126953125, -0.15947341918945312, -0.150238037109375, -0.14100265502929688, -0.13176727294921875, -0.12253189086914062, -0.1132965087890625, -0.10406112670898438, -0.09482574462890625, -0.08559036254882812, -0.07635498046875, -0.06711959838867188, -0.05788421630859375, -0.048648834228515625, -0.0394134521484375, -0.030178070068359375, -0.02094268798828125, -0.011707305908203125, -0.002471923828125, 0.006763458251953125, 0.01599884033203125, 0.025234222412109375, 0.0344696044921875, 0.043704986572265625, 0.05294036865234375, 0.062175750732421875, 0.0714111328125, 0.08064651489257812, 0.08988189697265625, 0.09911727905273438, 0.1083526611328125, 0.11758804321289062, 0.12682342529296875, 0.13605880737304688, 0.145294189453125, 0.15452957153320312, 0.16376495361328125, 0.17300033569335938, 0.1822357177734375, 0.19147109985351562, 0.20070648193359375, 0.20994186401367188, 0.21917724609375, 0.22841262817382812, 0.23764801025390625, 0.24688339233398438, 0.2561187744140625, 0.2653541564941406, 0.27458953857421875, 0.2838249206542969, 0.293060302734375, 0.3022956848144531, 0.31153106689453125, 0.3207664489746094, 0.3300018310546875, 0.3392372131347656, 0.34847259521484375, 0.3577079772949219, 0.366943359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 6.0, 4.0, 13.0, 17.0, 11.0, 11.0, 17.0, 18.0, 25.0, 35.0, 28.0, 28.0, 34.0, 27.0, 38.0, 45.0, 37.0, 34.0, 41.0, 44.0, 43.0, 33.0, 25.0, 42.0, 34.0, 29.0, 26.0, 25.0, 26.0, 20.0, 27.0, 18.0, 18.0, 20.0, 12.0, 9.0, 9.0, 8.0, 6.0, 9.0, 4.0, 8.0, 5.0, 3.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1768798828125, -0.17090415954589844, -0.16492843627929688, -0.1589527130126953, -0.15297698974609375, -0.1470012664794922, -0.14102554321289062, -0.13504981994628906, -0.1290740966796875, -0.12309837341308594, -0.11712265014648438, -0.11114692687988281, -0.10517120361328125, -0.09919548034667969, -0.09321975708007812, -0.08724403381347656, -0.081268310546875, -0.07529258728027344, -0.06931686401367188, -0.06334114074707031, -0.05736541748046875, -0.05138969421386719, -0.045413970947265625, -0.03943824768066406, -0.0334625244140625, -0.027486801147460938, -0.021511077880859375, -0.015535354614257812, -0.00955963134765625, -0.0035839080810546875, 0.002391815185546875, 0.008367538452148438, 0.01434326171875, 0.020318984985351562, 0.026294708251953125, 0.03227043151855469, 0.03824615478515625, 0.04422187805175781, 0.050197601318359375, 0.05617332458496094, 0.0621490478515625, 0.06812477111816406, 0.07410049438476562, 0.08007621765136719, 0.08605194091796875, 0.09202766418457031, 0.09800338745117188, 0.10397911071777344, 0.109954833984375, 0.11593055725097656, 0.12190628051757812, 0.1278820037841797, 0.13385772705078125, 0.1398334503173828, 0.14580917358398438, 0.15178489685058594, 0.1577606201171875, 0.16373634338378906, 0.16971206665039062, 0.1756877899169922, 0.18166351318359375, 0.1876392364501953, 0.19361495971679688, 0.19959068298339844, 0.20556640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 8.0, 26.0, 20.0, 42.0, 53.0, 106.0, 186.0, 353.0, 558.0, 1013.0, 1871.0, 3682.0, 7552.0, 16981.0, 42101.0, 123714.0, 458745.0, 2061875.0, 1108216.0, 242554.0, 74064.0, 27408.0, 11802.0, 5392.0, 2694.0, 1412.0, 767.0, 432.0, 270.0, 145.0, 94.0, 61.0, 29.0, 13.0, 13.0, 10.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.46337890625, -0.45111083984375, -0.4388427734375, -0.42657470703125, -0.414306640625, -0.40203857421875, -0.3897705078125, -0.37750244140625, -0.365234375, -0.35296630859375, -0.3406982421875, -0.32843017578125, -0.316162109375, -0.30389404296875, -0.2916259765625, -0.27935791015625, -0.26708984375, -0.25482177734375, -0.2425537109375, -0.23028564453125, -0.218017578125, -0.20574951171875, -0.1934814453125, -0.18121337890625, -0.1689453125, -0.15667724609375, -0.1444091796875, -0.13214111328125, -0.119873046875, -0.10760498046875, -0.0953369140625, -0.08306884765625, -0.07080078125, -0.05853271484375, -0.0462646484375, -0.03399658203125, -0.021728515625, -0.00946044921875, 0.0028076171875, 0.01507568359375, 0.02734375, 0.03961181640625, 0.0518798828125, 0.06414794921875, 0.076416015625, 0.08868408203125, 0.1009521484375, 0.11322021484375, 0.12548828125, 0.13775634765625, 0.1500244140625, 0.16229248046875, 0.174560546875, 0.18682861328125, 0.1990966796875, 0.21136474609375, 0.2236328125, 0.23590087890625, 0.2481689453125, 0.26043701171875, 0.272705078125, 0.28497314453125, 0.2972412109375, 0.30950927734375, 0.32177734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 6.0, 6.0, 6.0, 13.0, 15.0, 22.0, 24.0, 36.0, 53.0, 67.0, 80.0, 94.0, 175.0, 198.0, 313.0, 430.0, 571.0, 504.0, 391.0, 288.0, 216.0, 146.0, 102.0, 74.0, 55.0, 41.0, 37.0, 27.0, 20.0, 14.0, 8.0, 4.0, 5.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.497802734375, -0.4835548400878906, -0.46930694580078125, -0.4550590515136719, -0.4408111572265625, -0.4265632629394531, -0.41231536865234375, -0.3980674743652344, -0.383819580078125, -0.3695716857910156, -0.35532379150390625, -0.3410758972167969, -0.3268280029296875, -0.3125801086425781, -0.29833221435546875, -0.2840843200683594, -0.26983642578125, -0.2555885314941406, -0.24134063720703125, -0.22709274291992188, -0.2128448486328125, -0.19859695434570312, -0.18434906005859375, -0.17010116577148438, -0.155853271484375, -0.14160537719726562, -0.12735748291015625, -0.11310958862304688, -0.0988616943359375, -0.08461380004882812, -0.07036590576171875, -0.056118011474609375, -0.0418701171875, -0.027622222900390625, -0.01337432861328125, 0.000873565673828125, 0.0151214599609375, 0.029369354248046875, 0.04361724853515625, 0.057865142822265625, 0.072113037109375, 0.08636093139648438, 0.10060882568359375, 0.11485671997070312, 0.1291046142578125, 0.14335250854492188, 0.15760040283203125, 0.17184829711914062, 0.18609619140625, 0.20034408569335938, 0.21459197998046875, 0.22883987426757812, 0.2430877685546875, 0.2573356628417969, 0.27158355712890625, 0.2858314514160156, 0.300079345703125, 0.3143272399902344, 0.32857513427734375, 0.3428230285644531, 0.3570709228515625, 0.3713188171386719, 0.38556671142578125, 0.3998146057128906, 0.4140625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 1.0, 8.0, 25.0, 57.0, 155.0, 292.0, 284.0, 115.0, 42.0, 12.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.028602600097656, -9.77835750579834, -9.528112411499023, -9.277868270874023, -9.027623176574707, -8.77737808227539, -8.527132987976074, -8.276887893676758, -8.026643753051758, -7.776398658752441, -7.526154041290283, -7.275908946990967, -7.025664329528809, -6.775419235229492, -6.525174140930176, -6.274929046630859, -6.024683952331543, -5.774438858032227, -5.524194240570068, -5.273949146270752, -5.023704528808594, -4.773459434509277, -4.523214340209961, -4.2729692459106445, -4.022724628448486, -3.772479772567749, -3.5222349166870117, -3.2719898223876953, -3.021744966506958, -2.7715001106262207, -2.5212550163269043, -2.271010160446167, -2.020766258239746, -1.7705214023590088, -1.520276427268982, -1.270031452178955, -1.0197865962982178, -0.7695417404174805, -0.5192967653274536, -0.26905179023742676, -0.018806934356689453, 0.23143798112869263, 0.4816828966140747, 0.7319278120994568, 0.9821727275848389, 1.2324175834655762, 1.482662558555603, 1.7329075336456299, 1.9831523895263672, 2.2333972454071045, 2.483642101287842, 2.733887195587158, 2.9841320514678955, 3.234376907348633, 3.484622001647949, 3.7348668575286865, 3.985111713409424, 4.23535680770874, 4.485601425170898, 4.735846519470215, 4.986091613769531, 5.2363362312316895, 5.486581325531006, 5.736825942993164, 5.9870710372924805]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 10.0, 7.0, 7.0, 8.0, 18.0, 20.0, 25.0, 20.0, 35.0, 33.0, 46.0, 44.0, 36.0, 39.0, 50.0, 45.0, 59.0, 53.0, 36.0, 34.0, 52.0, 45.0, 50.0, 38.0, 24.0, 23.0, 33.0, 24.0, 15.0, 15.0, 15.0, 7.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7441456317901611, -1.6884320974349976, -1.632718563079834, -1.5770050287246704, -1.5212914943695068, -1.4655779600143433, -1.4098644256591797, -1.3541508913040161, -1.2984373569488525, -1.242723822593689, -1.1870102882385254, -1.1312967538833618, -1.0755832195281982, -1.0198696851730347, -0.9641561508178711, -0.9084426164627075, -0.8527290225028992, -0.7970154881477356, -0.741301953792572, -0.6855884194374084, -0.6298748850822449, -0.5741612911224365, -0.518447756767273, -0.46273425221443176, -0.4070207178592682, -0.3513071835041046, -0.29559364914894104, -0.23988009989261627, -0.1841665655374527, -0.12845301628112793, -0.07273948192596436, -0.01702594757080078, 0.03868758678436279, 0.09440112113952637, 0.15011465549468994, 0.2058282047510147, 0.2615417242050171, 0.31725528836250305, 0.3729688227176666, 0.4286823570728302, 0.4843958914279938, 0.5401094555854797, 0.5958229899406433, 0.6515365242958069, 0.7072500586509705, 0.762963593006134, 0.8186771273612976, 0.8743906617164612, 0.9301041960716248, 0.9858177304267883, 1.0415313243865967, 1.0972448587417603, 1.1529583930969238, 1.2086719274520874, 1.264385461807251, 1.3200989961624146, 1.3758125305175781, 1.4315260648727417, 1.4872395992279053, 1.5429531335830688, 1.5986666679382324, 1.654380202293396, 1.7100937366485596, 1.7658072710037231, 1.8215208053588867]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 18.0, 19.0, 22.0, 33.0, 49.0, 75.0, 121.0, 187.0, 293.0, 478.0, 775.0, 1185.0, 2024.0, 3526.0, 5638.0, 9983.0, 17431.0, 30186.0, 50777.0, 81988.0, 121059.0, 155436.0, 163133.0, 141129.0, 101836.0, 66133.0, 39902.0, 23056.0, 13298.0, 7614.0, 4423.0, 2599.0, 1602.0, 875.0, 553.0, 374.0, 246.0, 162.0, 89.0, 63.0, 53.0, 30.0, 19.0, 17.0, 12.0, 6.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1995849609375, -0.19298934936523438, -0.18639373779296875, -0.17979812622070312, -0.1732025146484375, -0.16660690307617188, -0.16001129150390625, -0.15341567993164062, -0.146820068359375, -0.14022445678710938, -0.13362884521484375, -0.12703323364257812, -0.1204376220703125, -0.11384201049804688, -0.10724639892578125, -0.10065078735351562, -0.09405517578125, -0.08745956420898438, -0.08086395263671875, -0.07426834106445312, -0.0676727294921875, -0.061077117919921875, -0.05448150634765625, -0.047885894775390625, -0.041290283203125, -0.034694671630859375, -0.02809906005859375, -0.021503448486328125, -0.0149078369140625, -0.008312225341796875, -0.00171661376953125, 0.004878997802734375, 0.011474609375, 0.018070220947265625, 0.02466583251953125, 0.031261444091796875, 0.0378570556640625, 0.044452667236328125, 0.05104827880859375, 0.057643890380859375, 0.064239501953125, 0.07083511352539062, 0.07743072509765625, 0.08402633666992188, 0.0906219482421875, 0.09721755981445312, 0.10381317138671875, 0.11040878295898438, 0.11700439453125, 0.12360000610351562, 0.13019561767578125, 0.13679122924804688, 0.1433868408203125, 0.14998245239257812, 0.15657806396484375, 0.16317367553710938, 0.169769287109375, 0.17636489868164062, 0.18296051025390625, 0.18955612182617188, 0.1961517333984375, 0.20274734497070312, 0.20934295654296875, 0.21593856811523438, 0.2225341796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 2.0, 6.0, 6.0, 9.0, 7.0, 16.0, 16.0, 16.0, 24.0, 19.0, 25.0, 24.0, 24.0, 34.0, 38.0, 29.0, 26.0, 34.0, 41.0, 46.0, 40.0, 31.0, 37.0, 38.0, 39.0, 38.0, 40.0, 41.0, 20.0, 23.0, 29.0, 20.0, 25.0, 18.0, 20.0, 9.0, 8.0, 13.0, 15.0, 12.0, 10.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.21240234375, -0.20580101013183594, -0.19919967651367188, -0.1925983428955078, -0.18599700927734375, -0.1793956756591797, -0.17279434204101562, -0.16619300842285156, -0.1595916748046875, -0.15299034118652344, -0.14638900756835938, -0.1397876739501953, -0.13318634033203125, -0.1265850067138672, -0.11998367309570312, -0.11338233947753906, -0.106781005859375, -0.10017967224121094, -0.09357833862304688, -0.08697700500488281, -0.08037567138671875, -0.07377433776855469, -0.06717300415039062, -0.06057167053222656, -0.0539703369140625, -0.04736900329589844, -0.040767669677734375, -0.03416633605957031, -0.02756500244140625, -0.020963668823242188, -0.014362335205078125, -0.0077610015869140625, -0.00115966796875, 0.0054416656494140625, 0.012042999267578125, 0.018644332885742188, 0.02524566650390625, 0.03184700012207031, 0.038448333740234375, 0.04504966735839844, 0.0516510009765625, 0.05825233459472656, 0.06485366821289062, 0.07145500183105469, 0.07805633544921875, 0.08465766906738281, 0.09125900268554688, 0.09786033630371094, 0.104461669921875, 0.11106300354003906, 0.11766433715820312, 0.12426567077636719, 0.13086700439453125, 0.1374683380126953, 0.14406967163085938, 0.15067100524902344, 0.1572723388671875, 0.16387367248535156, 0.17047500610351562, 0.1770763397216797, 0.18367767333984375, 0.1902790069580078, 0.19688034057617188, 0.20348167419433594, 0.2100830078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 10.0, 13.0, 10.0, 13.0, 32.0, 43.0, 52.0, 78.0, 99.0, 153.0, 241.0, 379.0, 629.0, 1003.0, 1647.0, 2832.0, 4971.0, 9120.0, 17262.0, 32962.0, 61620.0, 111686.0, 181553.0, 246692.0, 163073.0, 97808.0, 53100.0, 28125.0, 14563.0, 8031.0, 4397.0, 2473.0, 1490.0, 832.0, 543.0, 327.0, 214.0, 133.0, 87.0, 78.0, 54.0, 38.0, 33.0, 11.0, 16.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.260498046875, -0.2524528503417969, -0.24440765380859375, -0.23636245727539062, -0.2283172607421875, -0.22027206420898438, -0.21222686767578125, -0.20418167114257812, -0.196136474609375, -0.18809127807617188, -0.18004608154296875, -0.17200088500976562, -0.1639556884765625, -0.15591049194335938, -0.14786529541015625, -0.13982009887695312, -0.13177490234375, -0.12372970581054688, -0.11568450927734375, -0.10763931274414062, -0.0995941162109375, -0.09154891967773438, -0.08350372314453125, -0.07545852661132812, -0.067413330078125, -0.059368133544921875, -0.05132293701171875, -0.043277740478515625, -0.0352325439453125, -0.027187347412109375, -0.01914215087890625, -0.011096954345703125, -0.0030517578125, 0.004993438720703125, 0.01303863525390625, 0.021083831787109375, 0.0291290283203125, 0.037174224853515625, 0.04521942138671875, 0.053264617919921875, 0.061309814453125, 0.06935501098632812, 0.07740020751953125, 0.08544540405273438, 0.0934906005859375, 0.10153579711914062, 0.10958099365234375, 0.11762619018554688, 0.12567138671875, 0.13371658325195312, 0.14176177978515625, 0.14980697631835938, 0.1578521728515625, 0.16589736938476562, 0.17394256591796875, 0.18198776245117188, 0.190032958984375, 0.19807815551757812, 0.20612335205078125, 0.21416854858398438, 0.2222137451171875, 0.23025894165039062, 0.23830413818359375, 0.24634933471679688, 0.25439453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 9.0, 6.0, 12.0, 13.0, 25.0, 33.0, 21.0, 31.0, 38.0, 57.0, 37.0, 66.0, 51.0, 75.0, 68.0, 59.0, 52.0, 54.0, 54.0, 37.0, 28.0, 37.0, 25.0, 27.0, 18.0, 16.0, 14.0, 14.0, 7.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8251953125, -0.7985000610351562, -0.7718048095703125, -0.7451095581054688, -0.718414306640625, -0.6917190551757812, -0.6650238037109375, -0.6383285522460938, -0.61163330078125, -0.5849380493164062, -0.5582427978515625, -0.5315475463867188, -0.504852294921875, -0.47815704345703125, -0.4514617919921875, -0.42476654052734375, -0.3980712890625, -0.37137603759765625, -0.3446807861328125, -0.31798553466796875, -0.291290283203125, -0.26459503173828125, -0.2378997802734375, -0.21120452880859375, -0.18450927734375, -0.15781402587890625, -0.1311187744140625, -0.10442352294921875, -0.077728271484375, -0.05103302001953125, -0.0243377685546875, 0.00235748291015625, 0.029052734375, 0.05574798583984375, 0.0824432373046875, 0.10913848876953125, 0.135833740234375, 0.16252899169921875, 0.1892242431640625, 0.21591949462890625, 0.24261474609375, 0.26930999755859375, 0.2960052490234375, 0.32270050048828125, 0.349395751953125, 0.37609100341796875, 0.4027862548828125, 0.42948150634765625, 0.4561767578125, 0.48287200927734375, 0.5095672607421875, 0.5362625122070312, 0.562957763671875, 0.5896530151367188, 0.6163482666015625, 0.6430435180664062, 0.66973876953125, 0.6964340209960938, 0.7231292724609375, 0.7498245239257812, 0.776519775390625, 0.8032150268554688, 0.8299102783203125, 0.8566055297851562, 0.88330078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 14.0, 26.0, 27.0, 43.0, 48.0, 73.0, 101.0, 153.0, 228.0, 310.0, 463.0, 684.0, 1026.0, 1556.0, 2425.0, 4007.0, 6370.0, 10949.0, 18780.0, 31772.0, 54155.0, 88833.0, 137680.0, 208709.0, 174886.0, 119361.0, 74959.0, 44869.0, 26616.0, 15351.0, 9147.0, 5384.0, 3283.0, 2087.0, 1385.0, 891.0, 576.0, 364.0, 282.0, 204.0, 135.0, 87.0, 61.0, 49.0, 50.0, 22.0, 23.0, 16.0, 6.0, 8.0, 1.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.05047607421875, -0.04893827438354492, -0.047400474548339844, -0.045862674713134766, -0.04432487487792969, -0.04278707504272461, -0.04124927520751953, -0.03971147537231445, -0.038173675537109375, -0.0366358757019043, -0.03509807586669922, -0.03356027603149414, -0.03202247619628906, -0.030484676361083984, -0.028946876525878906, -0.027409076690673828, -0.02587127685546875, -0.024333477020263672, -0.022795677185058594, -0.021257877349853516, -0.019720077514648438, -0.01818227767944336, -0.01664447784423828, -0.015106678009033203, -0.013568878173828125, -0.012031078338623047, -0.010493278503417969, -0.00895547866821289, -0.0074176788330078125, -0.005879878997802734, -0.004342079162597656, -0.002804279327392578, -0.0012664794921875, 0.0002713203430175781, 0.0018091201782226562, 0.0033469200134277344, 0.0048847198486328125, 0.006422519683837891, 0.007960319519042969, 0.009498119354248047, 0.011035919189453125, 0.012573719024658203, 0.014111518859863281, 0.01564931869506836, 0.017187118530273438, 0.018724918365478516, 0.020262718200683594, 0.021800518035888672, 0.02333831787109375, 0.024876117706298828, 0.026413917541503906, 0.027951717376708984, 0.029489517211914062, 0.03102731704711914, 0.03256511688232422, 0.0341029167175293, 0.035640716552734375, 0.03717851638793945, 0.03871631622314453, 0.04025411605834961, 0.04179191589355469, 0.043329715728759766, 0.044867515563964844, 0.04640531539916992, 0.047943115234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 12.0, 7.0, 12.0, 14.0, 15.0, 11.0, 23.0, 29.0, 20.0, 24.0, 42.0, 40.0, 37.0, 47.0, 40.0, 46.0, 60.0, 65.0, 42.0, 41.0, 39.0, 36.0, 34.0, 31.0, 32.0, 17.0, 20.0, 24.0, 17.0, 16.0, 15.0, 9.0, 10.0, 9.0, 4.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.580881118774414e-05, -2.5054439902305603e-05, -2.4300068616867065e-05, -2.3545697331428528e-05, -2.279132604598999e-05, -2.2036954760551453e-05, -2.1282583475112915e-05, -2.0528212189674377e-05, -1.977384090423584e-05, -1.9019469618797302e-05, -1.8265098333358765e-05, -1.7510727047920227e-05, -1.675635576248169e-05, -1.6001984477043152e-05, -1.5247613191604614e-05, -1.4493241906166077e-05, -1.3738870620727539e-05, -1.2984499335289001e-05, -1.2230128049850464e-05, -1.1475756764411926e-05, -1.0721385478973389e-05, -9.967014193534851e-06, -9.212642908096313e-06, -8.458271622657776e-06, -7.703900337219238e-06, -6.949529051780701e-06, -6.195157766342163e-06, -5.4407864809036255e-06, -4.686415195465088e-06, -3.93204391002655e-06, -3.1776726245880127e-06, -2.423301339149475e-06, -1.6689300537109375e-06, -9.145587682723999e-07, -1.601874828338623e-07, 5.941838026046753e-07, 1.3485550880432129e-06, 2.1029263734817505e-06, 2.857297658920288e-06, 3.6116689443588257e-06, 4.366040229797363e-06, 5.120411515235901e-06, 5.8747828006744385e-06, 6.629154086112976e-06, 7.383525371551514e-06, 8.137896656990051e-06, 8.892267942428589e-06, 9.646639227867126e-06, 1.0401010513305664e-05, 1.1155381798744202e-05, 1.190975308418274e-05, 1.2664124369621277e-05, 1.3418495655059814e-05, 1.4172866940498352e-05, 1.492723822593689e-05, 1.5681609511375427e-05, 1.6435980796813965e-05, 1.7190352082252502e-05, 1.794472336769104e-05, 1.8699094653129578e-05, 1.9453465938568115e-05, 2.0207837224006653e-05, 2.096220850944519e-05, 2.1716579794883728e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 9.0, 5.0, 12.0, 10.0, 20.0, 26.0, 34.0, 68.0, 139.0, 188.0, 306.0, 530.0, 965.0, 1757.0, 3351.0, 6230.0, 12728.0, 25073.0, 51516.0, 101355.0, 183061.0, 274419.0, 183409.0, 101122.0, 50680.0, 25435.0, 12405.0, 6360.0, 3209.0, 1708.0, 1014.0, 590.0, 313.0, 174.0, 122.0, 71.0, 59.0, 25.0, 19.0, 17.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.07958984375, -0.07740926742553711, -0.07522869110107422, -0.07304811477661133, -0.07086753845214844, -0.06868696212768555, -0.06650638580322266, -0.06432580947875977, -0.062145233154296875, -0.059964656829833984, -0.057784080505371094, -0.0556035041809082, -0.05342292785644531, -0.05124235153198242, -0.04906177520751953, -0.04688119888305664, -0.04470062255859375, -0.04252004623413086, -0.04033946990966797, -0.03815889358520508, -0.03597831726074219, -0.0337977409362793, -0.031617164611816406, -0.029436588287353516, -0.027256011962890625, -0.025075435638427734, -0.022894859313964844, -0.020714282989501953, -0.018533706665039062, -0.016353130340576172, -0.014172554016113281, -0.01199197769165039, -0.0098114013671875, -0.007630825042724609, -0.005450248718261719, -0.003269672393798828, -0.0010890960693359375, 0.0010914802551269531, 0.0032720565795898438, 0.005452632904052734, 0.007633209228515625, 0.009813785552978516, 0.011994361877441406, 0.014174938201904297, 0.016355514526367188, 0.018536090850830078, 0.02071666717529297, 0.02289724349975586, 0.02507781982421875, 0.02725839614868164, 0.02943897247314453, 0.03161954879760742, 0.03380012512207031, 0.0359807014465332, 0.038161277770996094, 0.040341854095458984, 0.042522430419921875, 0.044703006744384766, 0.046883583068847656, 0.04906415939331055, 0.05124473571777344, 0.05342531204223633, 0.05560588836669922, 0.05778646469116211, 0.059967041015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 5.0, 11.0, 7.0, 9.0, 19.0, 22.0, 13.0, 23.0, 27.0, 36.0, 31.0, 49.0, 52.0, 59.0, 64.0, 64.0, 70.0, 70.0, 56.0, 42.0, 49.0, 43.0, 41.0, 31.0, 30.0, 13.0, 10.0, 12.0, 7.0, 4.0, 9.0, 7.0, 6.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10845947265625, -0.10482215881347656, -0.10118484497070312, -0.09754753112792969, -0.09391021728515625, -0.09027290344238281, -0.08663558959960938, -0.08299827575683594, -0.0793609619140625, -0.07572364807128906, -0.07208633422851562, -0.06844902038574219, -0.06481170654296875, -0.06117439270019531, -0.057537078857421875, -0.05389976501464844, -0.050262451171875, -0.04662513732910156, -0.042987823486328125, -0.03935050964355469, -0.03571319580078125, -0.03207588195800781, -0.028438568115234375, -0.024801254272460938, -0.0211639404296875, -0.017526626586914062, -0.013889312744140625, -0.010251998901367188, -0.00661468505859375, -0.0029773712158203125, 0.000659942626953125, 0.0042972564697265625, 0.0079345703125, 0.011571884155273438, 0.015209197998046875, 0.018846511840820312, 0.02248382568359375, 0.026121139526367188, 0.029758453369140625, 0.03339576721191406, 0.0370330810546875, 0.04067039489746094, 0.044307708740234375, 0.04794502258300781, 0.05158233642578125, 0.05521965026855469, 0.058856964111328125, 0.06249427795410156, 0.066131591796875, 0.06976890563964844, 0.07340621948242188, 0.07704353332519531, 0.08068084716796875, 0.08431816101074219, 0.08795547485351562, 0.09159278869628906, 0.0952301025390625, 0.09886741638183594, 0.10250473022460938, 0.10614204406738281, 0.10977935791015625, 0.11341667175292969, 0.11705398559570312, 0.12069129943847656, 0.12432861328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 18.0, 22.0, 43.0, 60.0, 96.0, 115.0, 117.0, 151.0, 117.0, 84.0, 59.0, 43.0, 19.0, 11.0, 9.0, 10.0, 5.0, 4.0, 4.0, 0.0, 2.0], "bins": [-4.130890369415283, -4.047792434692383, -3.9646944999694824, -3.881596565246582, -3.7984986305236816, -3.715400457382202, -3.6323025226593018, -3.5492045879364014, -3.466106653213501, -3.3830087184906006, -3.2999107837677, -3.2168128490448, -3.1337146759033203, -3.05061674118042, -2.9675188064575195, -2.884420871734619, -2.8013229370117188, -2.7182250022888184, -2.635127067565918, -2.5520291328430176, -2.468931198120117, -2.3858330249786377, -2.3027350902557373, -2.219637155532837, -2.1365392208099365, -2.053441286087036, -1.9703433513641357, -1.8872452974319458, -1.8041473627090454, -1.721049427986145, -1.637951374053955, -1.5548534393310547, -1.4717552661895752, -1.3886573314666748, -1.3055593967437744, -1.2224613428115845, -1.139363408088684, -1.0562654733657837, -0.9731674790382385, -0.8900694847106934, -0.806971549987793, -0.7238736152648926, -0.6407756209373474, -0.5576776266098022, -0.47457969188690186, -0.3914817273616791, -0.3083837628364563, -0.22528576850891113, -0.14218783378601074, -0.059089869260787964, 0.024008095264434814, 0.10710605978965759, 0.19020402431488037, 0.27330198884010315, 0.3563999533653259, 0.4394979476928711, 0.5225958824157715, 0.6056938171386719, 0.688791811466217, 0.7718898057937622, 0.8549877405166626, 0.938085675239563, 1.021183729171753, 1.1042816638946533, 1.1873795986175537]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 4.0, 8.0, 10.0, 8.0, 4.0, 13.0, 14.0, 11.0, 17.0, 18.0, 25.0, 26.0, 24.0, 32.0, 39.0, 40.0, 40.0, 29.0, 41.0, 38.0, 32.0, 49.0, 50.0, 49.0, 48.0, 26.0, 25.0, 35.0, 27.0, 24.0, 29.0, 24.0, 23.0, 22.0, 17.0, 13.0, 8.0, 12.0, 8.0, 8.0, 8.0, 6.0, 6.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6128857135772705, -1.564487338066101, -1.516088843345642, -1.4676904678344727, -1.4192919731140137, -1.3708935976028442, -1.3224952220916748, -1.2740967273712158, -1.2256983518600464, -1.177299976348877, -1.128901481628418, -1.0805031061172485, -1.032104730606079, -0.9837062358856201, -0.9353078603744507, -0.8869094252586365, -0.8385109901428223, -0.7901125550270081, -0.7417141199111938, -0.6933157444000244, -0.6449173092842102, -0.596518874168396, -0.5481204986572266, -0.49972206354141235, -0.45132362842559814, -0.40292519330978394, -0.3545267879962921, -0.3061283826828003, -0.2577299475669861, -0.20933152735233307, -0.16093310713768005, -0.11253470182418823, -0.06413626670837402, -0.01573784649372101, 0.03266057372093201, 0.08105899393558502, 0.12945741415023804, 0.17785583436489105, 0.22625425457954407, 0.2746526598930359, 0.3230510950088501, 0.3714495301246643, 0.41984793543815613, 0.46824634075164795, 0.5166447758674622, 0.5650432109832764, 0.6134415864944458, 0.66184002161026, 0.7102384567260742, 0.7586368918418884, 0.8070353269577026, 0.8554337024688721, 0.9038321375846863, 0.9522305727005005, 1.00062894821167, 1.049027442932129, 1.0974258184432983, 1.1458241939544678, 1.1942226886749268, 1.2426210641860962, 1.2910194396972656, 1.3394179344177246, 1.387816309928894, 1.4362146854400635, 1.4846131801605225]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 11.0, 12.0, 11.0, 26.0, 37.0, 58.0, 77.0, 119.0, 212.0, 376.0, 722.0, 1543.0, 3463.0, 8239.0, 21265.0, 63758.0, 237497.0, 760903.0, 1392295.0, 1112261.0, 422194.0, 112685.0, 34297.0, 12438.0, 5148.0, 2295.0, 1071.0, 538.0, 301.0, 166.0, 84.0, 65.0, 36.0, 29.0, 19.0, 10.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2169189453125, -0.2077770233154297, -0.19863510131835938, -0.18949317932128906, -0.18035125732421875, -0.17120933532714844, -0.16206741333007812, -0.1529254913330078, -0.1437835693359375, -0.1346416473388672, -0.12549972534179688, -0.11635780334472656, -0.10721588134765625, -0.09807395935058594, -0.08893203735351562, -0.07979011535644531, -0.070648193359375, -0.06150627136230469, -0.052364349365234375, -0.04322242736816406, -0.03408050537109375, -0.024938583374023438, -0.015796661376953125, -0.0066547393798828125, 0.0024871826171875, 0.011629104614257812, 0.020771026611328125, 0.029912948608398438, 0.03905487060546875, 0.04819679260253906, 0.057338714599609375, 0.06648063659667969, 0.07562255859375, 0.08476448059082031, 0.09390640258789062, 0.10304832458496094, 0.11219024658203125, 0.12133216857910156, 0.13047409057617188, 0.1396160125732422, 0.1487579345703125, 0.1578998565673828, 0.16704177856445312, 0.17618370056152344, 0.18532562255859375, 0.19446754455566406, 0.20360946655273438, 0.2127513885498047, 0.221893310546875, 0.2310352325439453, 0.24017715454101562, 0.24931907653808594, 0.25846099853515625, 0.26760292053222656, 0.2767448425292969, 0.2858867645263672, 0.2950286865234375, 0.3041706085205078, 0.3133125305175781, 0.32245445251464844, 0.33159637451171875, 0.34073829650878906, 0.3498802185058594, 0.3590221405029297, 0.3681640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 5.0, 6.0, 9.0, 4.0, 14.0, 13.0, 14.0, 18.0, 22.0, 26.0, 18.0, 28.0, 28.0, 38.0, 31.0, 38.0, 40.0, 35.0, 29.0, 40.0, 49.0, 40.0, 35.0, 38.0, 35.0, 41.0, 37.0, 35.0, 24.0, 23.0, 26.0, 23.0, 23.0, 23.0, 14.0, 11.0, 12.0, 12.0, 10.0, 10.0, 5.0, 7.0, 6.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.19677734375, -0.1908130645751953, -0.18484878540039062, -0.17888450622558594, -0.17292022705078125, -0.16695594787597656, -0.16099166870117188, -0.1550273895263672, -0.1490631103515625, -0.1430988311767578, -0.13713455200195312, -0.13117027282714844, -0.12520599365234375, -0.11924171447753906, -0.11327743530273438, -0.10731315612792969, -0.101348876953125, -0.09538459777832031, -0.08942031860351562, -0.08345603942871094, -0.07749176025390625, -0.07152748107910156, -0.06556320190429688, -0.05959892272949219, -0.0536346435546875, -0.04767036437988281, -0.041706085205078125, -0.03574180603027344, -0.02977752685546875, -0.023813247680664062, -0.017848968505859375, -0.011884689331054688, -0.00592041015625, 4.38690185546875e-05, 0.006008148193359375, 0.011972427368164062, 0.01793670654296875, 0.023900985717773438, 0.029865264892578125, 0.03582954406738281, 0.0417938232421875, 0.04775810241699219, 0.053722381591796875, 0.05968666076660156, 0.06565093994140625, 0.07161521911621094, 0.07757949829101562, 0.08354377746582031, 0.089508056640625, 0.09547233581542969, 0.10143661499023438, 0.10740089416503906, 0.11336517333984375, 0.11932945251464844, 0.12529373168945312, 0.1312580108642578, 0.1372222900390625, 0.1431865692138672, 0.14915084838867188, 0.15511512756347656, 0.16107940673828125, 0.16704368591308594, 0.17300796508789062, 0.1789722442626953, 0.1849365234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 10.0, 4.0, 11.0, 12.0, 14.0, 27.0, 37.0, 45.0, 78.0, 109.0, 147.0, 283.0, 476.0, 830.0, 1854.0, 4171.0, 12384.0, 50770.0, 346683.0, 2881796.0, 775854.0, 89562.0, 18721.0, 5716.0, 2191.0, 1063.0, 553.0, 315.0, 176.0, 121.0, 79.0, 47.0, 47.0, 29.0, 27.0, 19.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.6123046875, -0.5956039428710938, -0.5789031982421875, -0.5622024536132812, -0.545501708984375, -0.5288009643554688, -0.5121002197265625, -0.49539947509765625, -0.47869873046875, -0.46199798583984375, -0.4452972412109375, -0.42859649658203125, -0.411895751953125, -0.39519500732421875, -0.3784942626953125, -0.36179351806640625, -0.3450927734375, -0.32839202880859375, -0.3116912841796875, -0.29499053955078125, -0.278289794921875, -0.26158905029296875, -0.2448883056640625, -0.22818756103515625, -0.21148681640625, -0.19478607177734375, -0.1780853271484375, -0.16138458251953125, -0.144683837890625, -0.12798309326171875, -0.1112823486328125, -0.09458160400390625, -0.077880859375, -0.06118011474609375, -0.0444793701171875, -0.02777862548828125, -0.011077880859375, 0.00562286376953125, 0.0223236083984375, 0.03902435302734375, 0.05572509765625, 0.07242584228515625, 0.0891265869140625, 0.10582733154296875, 0.122528076171875, 0.13922882080078125, 0.1559295654296875, 0.17263031005859375, 0.1893310546875, 0.20603179931640625, 0.2227325439453125, 0.23943328857421875, 0.256134033203125, 0.27283477783203125, 0.2895355224609375, 0.30623626708984375, 0.32293701171875, 0.33963775634765625, 0.3563385009765625, 0.37303924560546875, 0.389739990234375, 0.40644073486328125, 0.4231414794921875, 0.43984222412109375, 0.45654296875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 15.0, 17.0, 20.0, 24.0, 32.0, 63.0, 73.0, 94.0, 133.0, 185.0, 245.0, 321.0, 409.0, 434.0, 429.0, 371.0, 331.0, 234.0, 164.0, 121.0, 107.0, 59.0, 44.0, 26.0, 28.0, 19.0, 17.0, 9.0, 6.0, 2.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414794921875, -0.3998985290527344, -0.38500213623046875, -0.3701057434082031, -0.3552093505859375, -0.3403129577636719, -0.32541656494140625, -0.3105201721191406, -0.295623779296875, -0.2807273864746094, -0.26583099365234375, -0.2509346008300781, -0.2360382080078125, -0.22114181518554688, -0.20624542236328125, -0.19134902954101562, -0.17645263671875, -0.16155624389648438, -0.14665985107421875, -0.13176345825195312, -0.1168670654296875, -0.10197067260742188, -0.08707427978515625, -0.07217788696289062, -0.057281494140625, -0.042385101318359375, -0.02748870849609375, -0.012592315673828125, 0.0023040771484375, 0.017200469970703125, 0.03209686279296875, 0.046993255615234375, 0.0618896484375, 0.07678604125976562, 0.09168243408203125, 0.10657882690429688, 0.1214752197265625, 0.13637161254882812, 0.15126800537109375, 0.16616439819335938, 0.181060791015625, 0.19595718383789062, 0.21085357666015625, 0.22574996948242188, 0.2406463623046875, 0.2555427551269531, 0.27043914794921875, 0.2853355407714844, 0.30023193359375, 0.3151283264160156, 0.33002471923828125, 0.3449211120605469, 0.3598175048828125, 0.3747138977050781, 0.38961029052734375, 0.4045066833496094, 0.419403076171875, 0.4342994689941406, 0.44919586181640625, 0.4640922546386719, 0.4789886474609375, 0.4938850402832031, 0.5087814331054688, 0.5236778259277344, 0.53857421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 6.0, 18.0, 14.0, 27.0, 40.0, 56.0, 70.0, 91.0, 101.0, 121.0, 118.0, 104.0, 62.0, 49.0, 41.0, 22.0, 16.0, 7.0, 3.0, 5.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986452102661133, -2.839566469192505, -2.692681074142456, -2.545795440673828, -2.3989100456237793, -2.2520244121551514, -2.1051387786865234, -1.958253264427185, -1.8113677501678467, -1.6644822359085083, -1.51759672164917, -1.370711088180542, -1.2238255739212036, -1.0769400596618652, -0.9300544857978821, -0.7831689119338989, -0.6362833976745605, -0.4893978536128998, -0.342512309551239, -0.19562676548957825, -0.04874122142791748, 0.0981442928314209, 0.24502986669540405, 0.3919154405593872, 0.5388009548187256, 0.685686469078064, 0.8325720429420471, 0.9794576168060303, 1.1263431310653687, 1.273228645324707, 1.420114278793335, 1.5669997930526733, 1.7138848304748535, 1.860770344734192, 2.0076558589935303, 2.154541492462158, 2.301426887512207, 2.448312520980835, 2.595198154449463, 2.7420835494995117, 2.8889691829681396, 3.0358548164367676, 3.1827402114868164, 3.3296258449554443, 3.4765114784240723, 3.623396873474121, 3.770282506942749, 3.917168140411377, 4.064053535461426, 4.210938930511475, 4.357824802398682, 4.5047101974487305, 4.651595592498779, 4.798480987548828, 4.945366859436035, 5.092252254486084, 5.239137649536133, 5.386023044586182, 5.532908916473389, 5.6797943115234375, 5.826679706573486, 5.973565101623535, 6.120450973510742, 6.267336368560791, 6.414222240447998]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 11.0, 7.0, 12.0, 21.0, 18.0, 15.0, 25.0, 30.0, 35.0, 39.0, 45.0, 44.0, 56.0, 54.0, 46.0, 60.0, 51.0, 46.0, 55.0, 49.0, 30.0, 52.0, 33.0, 34.0, 30.0, 19.0, 17.0, 14.0, 7.0, 13.0, 7.0, 2.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.424018621444702, -2.350886583328247, -2.277754545211792, -2.204622507095337, -2.131490707397461, -2.058358669281006, -1.9852266311645508, -1.9120945930480957, -1.8389625549316406, -1.7658305168151855, -1.6926984786987305, -1.619566559791565, -1.5464345216751099, -1.4733024835586548, -1.4001705646514893, -1.3270385265350342, -1.253906488418579, -1.180774450302124, -1.107642412185669, -1.0345104932785034, -0.9613784551620483, -0.8882464170455933, -0.815114438533783, -0.7419824600219727, -0.6688504219055176, -0.5957183837890625, -0.5225864052772522, -0.4494543969631195, -0.3763223886489868, -0.3031903803348541, -0.23005837202072144, -0.15692639350891113, -0.08379459381103516, -0.010662585496902466, 0.062469422817230225, 0.13560143113136292, 0.2087334394454956, 0.2818654477596283, 0.354997456073761, 0.4281294345855713, 0.5012614727020264, 0.5743935108184814, 0.6475254893302917, 0.720657467842102, 0.7937895059585571, 0.8669215440750122, 0.9400535225868225, 1.0131855010986328, 1.086317539215088, 1.159449577331543, 1.232581615447998, 1.3057135343551636, 1.3788455724716187, 1.4519776105880737, 1.5251095294952393, 1.5982415676116943, 1.6713736057281494, 1.7445056438446045, 1.8176376819610596, 1.890769600868225, 1.9639016389846802, 2.0370335578918457, 2.110165596008301, 2.183297634124756, 2.256429672241211]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 11.0, 8.0, 20.0, 26.0, 29.0, 53.0, 75.0, 116.0, 174.0, 266.0, 464.0, 712.0, 1261.0, 2223.0, 4181.0, 8475.0, 17478.0, 40869.0, 96047.0, 212725.0, 301375.0, 201031.0, 89548.0, 37684.0, 16849.0, 7787.0, 3874.0, 2088.0, 1232.0, 668.0, 416.0, 288.0, 151.0, 106.0, 75.0, 61.0, 31.0, 22.0, 19.0, 15.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.21106910705566406, -0.20277786254882812, -0.1944866180419922, -0.18619537353515625, -0.1779041290283203, -0.16961288452148438, -0.16132164001464844, -0.1530303955078125, -0.14473915100097656, -0.13644790649414062, -0.1281566619873047, -0.11986541748046875, -0.11157417297363281, -0.10328292846679688, -0.09499168395996094, -0.086700439453125, -0.07840919494628906, -0.07011795043945312, -0.06182670593261719, -0.05353546142578125, -0.04524421691894531, -0.036952972412109375, -0.028661727905273438, -0.0203704833984375, -0.012079238891601562, -0.003787994384765625, 0.0045032501220703125, 0.01279449462890625, 0.021085739135742188, 0.029376983642578125, 0.03766822814941406, 0.04595947265625, 0.05425071716308594, 0.06254196166992188, 0.07083320617675781, 0.07912445068359375, 0.08741569519042969, 0.09570693969726562, 0.10399818420410156, 0.1122894287109375, 0.12058067321777344, 0.12887191772460938, 0.1371631622314453, 0.14545440673828125, 0.1537456512451172, 0.16203689575195312, 0.17032814025878906, 0.178619384765625, 0.18691062927246094, 0.19520187377929688, 0.2034931182861328, 0.21178436279296875, 0.2200756072998047, 0.22836685180664062, 0.23665809631347656, 0.2449493408203125, 0.25324058532714844, 0.2615318298339844, 0.2698230743408203, 0.27811431884765625, 0.2864055633544922, 0.2946968078613281, 0.30298805236816406, 0.311279296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 11.0, 10.0, 12.0, 12.0, 15.0, 19.0, 37.0, 32.0, 33.0, 28.0, 52.0, 37.0, 49.0, 43.0, 47.0, 54.0, 60.0, 48.0, 33.0, 46.0, 41.0, 34.0, 38.0, 34.0, 31.0, 23.0, 29.0, 29.0, 16.0, 14.0, 8.0, 8.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.2524833679199219, -0.24349212646484375, -0.23450088500976562, -0.2255096435546875, -0.21651840209960938, -0.20752716064453125, -0.19853591918945312, -0.189544677734375, -0.18055343627929688, -0.17156219482421875, -0.16257095336914062, -0.1535797119140625, -0.14458847045898438, -0.13559722900390625, -0.12660598754882812, -0.11761474609375, -0.10862350463867188, -0.09963226318359375, -0.09064102172851562, -0.0816497802734375, -0.07265853881835938, -0.06366729736328125, -0.054676055908203125, -0.045684814453125, -0.036693572998046875, -0.02770233154296875, -0.018711090087890625, -0.0097198486328125, -0.000728607177734375, 0.00826263427734375, 0.017253875732421875, 0.0262451171875, 0.035236358642578125, 0.04422760009765625, 0.053218841552734375, 0.0622100830078125, 0.07120132446289062, 0.08019256591796875, 0.08918380737304688, 0.098175048828125, 0.10716629028320312, 0.11615753173828125, 0.12514877319335938, 0.1341400146484375, 0.14313125610351562, 0.15212249755859375, 0.16111373901367188, 0.17010498046875, 0.17909622192382812, 0.18808746337890625, 0.19707870483398438, 0.2060699462890625, 0.21506118774414062, 0.22405242919921875, 0.23304367065429688, 0.242034912109375, 0.2510261535644531, 0.26001739501953125, 0.2690086364746094, 0.2779998779296875, 0.2869911193847656, 0.29598236083984375, 0.3049736022949219, 0.31396484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 0.0, 7.0, 7.0, 10.0, 13.0, 14.0, 21.0, 27.0, 50.0, 60.0, 77.0, 136.0, 272.0, 561.0, 1287.0, 3541.0, 13048.0, 77235.0, 675398.0, 237287.0, 29301.0, 6357.0, 2065.0, 823.0, 374.0, 223.0, 129.0, 74.0, 55.0, 31.0, 12.0, 14.0, 11.0, 7.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.51708984375, -0.5013008117675781, -0.48551177978515625, -0.4697227478027344, -0.4539337158203125, -0.4381446838378906, -0.42235565185546875, -0.4065666198730469, -0.390777587890625, -0.3749885559082031, -0.35919952392578125, -0.3434104919433594, -0.3276214599609375, -0.3118324279785156, -0.29604339599609375, -0.2802543640136719, -0.26446533203125, -0.24867630004882812, -0.23288726806640625, -0.21709823608398438, -0.2013092041015625, -0.18552017211914062, -0.16973114013671875, -0.15394210815429688, -0.138153076171875, -0.12236404418945312, -0.10657501220703125, -0.09078598022460938, -0.0749969482421875, -0.059207916259765625, -0.04341888427734375, -0.027629852294921875, -0.0118408203125, 0.003948211669921875, 0.01973724365234375, 0.035526275634765625, 0.0513153076171875, 0.06710433959960938, 0.08289337158203125, 0.09868240356445312, 0.114471435546875, 0.13026046752929688, 0.14604949951171875, 0.16183853149414062, 0.1776275634765625, 0.19341659545898438, 0.20920562744140625, 0.22499465942382812, 0.24078369140625, 0.2565727233886719, 0.27236175537109375, 0.2881507873535156, 0.3039398193359375, 0.3197288513183594, 0.33551788330078125, 0.3513069152832031, 0.367095947265625, 0.3828849792480469, 0.39867401123046875, 0.4144630432128906, 0.4302520751953125, 0.4460411071777344, 0.46183013916015625, 0.4776191711425781, 0.493408203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 7.0, 13.0, 14.0, 19.0, 22.0, 18.0, 24.0, 38.0, 53.0, 39.0, 45.0, 38.0, 43.0, 56.0, 44.0, 60.0, 40.0, 66.0, 39.0, 41.0, 50.0, 40.0, 27.0, 34.0, 24.0, 9.0, 25.0, 10.0, 14.0, 11.0, 8.0, 1.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.69580078125, -0.6740951538085938, -0.6523895263671875, -0.6306838989257812, -0.608978271484375, -0.5872726440429688, -0.5655670166015625, -0.5438613891601562, -0.52215576171875, -0.5004501342773438, -0.4787445068359375, -0.45703887939453125, -0.435333251953125, -0.41362762451171875, -0.3919219970703125, -0.37021636962890625, -0.3485107421875, -0.32680511474609375, -0.3050994873046875, -0.28339385986328125, -0.261688232421875, -0.23998260498046875, -0.2182769775390625, -0.19657135009765625, -0.17486572265625, -0.15316009521484375, -0.1314544677734375, -0.10974884033203125, -0.088043212890625, -0.06633758544921875, -0.0446319580078125, -0.02292633056640625, -0.001220703125, 0.02048492431640625, 0.0421905517578125, 0.06389617919921875, 0.085601806640625, 0.10730743408203125, 0.1290130615234375, 0.15071868896484375, 0.17242431640625, 0.19412994384765625, 0.2158355712890625, 0.23754119873046875, 0.259246826171875, 0.28095245361328125, 0.3026580810546875, 0.32436370849609375, 0.3460693359375, 0.36777496337890625, 0.3894805908203125, 0.41118621826171875, 0.432891845703125, 0.45459747314453125, 0.4763031005859375, 0.49800872802734375, 0.51971435546875, 0.5414199829101562, 0.5631256103515625, 0.5848312377929688, 0.606536865234375, 0.6282424926757812, 0.6499481201171875, 0.6716537475585938, 0.693359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 9.0, 6.0, 16.0, 15.0, 44.0, 65.0, 99.0, 162.0, 335.0, 1063.0, 7554.0, 710396.0, 321567.0, 5695.0, 884.0, 260.0, 132.0, 89.0, 64.0, 35.0, 18.0, 11.0, 4.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.4278221130371094, -0.41399383544921875, -0.4001655578613281, -0.3863372802734375, -0.3725090026855469, -0.35868072509765625, -0.3448524475097656, -0.331024169921875, -0.3171958923339844, -0.30336761474609375, -0.2895393371582031, -0.2757110595703125, -0.2618827819824219, -0.24805450439453125, -0.23422622680664062, -0.22039794921875, -0.20656967163085938, -0.19274139404296875, -0.17891311645507812, -0.1650848388671875, -0.15125656127929688, -0.13742828369140625, -0.12360000610351562, -0.109771728515625, -0.09594345092773438, -0.08211517333984375, -0.06828689575195312, -0.0544586181640625, -0.040630340576171875, -0.02680206298828125, -0.012973785400390625, 0.0008544921875, 0.014682769775390625, 0.02851104736328125, 0.042339324951171875, 0.0561676025390625, 0.06999588012695312, 0.08382415771484375, 0.09765243530273438, 0.111480712890625, 0.12530899047851562, 0.13913726806640625, 0.15296554565429688, 0.1667938232421875, 0.18062210083007812, 0.19445037841796875, 0.20827865600585938, 0.22210693359375, 0.23593521118164062, 0.24976348876953125, 0.2635917663574219, 0.2774200439453125, 0.2912483215332031, 0.30507659912109375, 0.3189048767089844, 0.332733154296875, 0.3465614318847656, 0.36038970947265625, 0.3742179870605469, 0.3880462646484375, 0.4018745422363281, 0.41570281982421875, 0.4295310974121094, 0.443359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 9.0, 14.0, 17.0, 26.0, 40.0, 42.0, 74.0, 88.0, 104.0, 116.0, 108.0, 83.0, 65.0, 60.0, 44.0, 36.0, 21.0, 14.0, 7.0, 2.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.5462359189987183e-05, -2.4281442165374756e-05, -2.310052514076233e-05, -2.1919608116149902e-05, -2.0738691091537476e-05, -1.955777406692505e-05, -1.8376857042312622e-05, -1.7195940017700195e-05, -1.601502299308777e-05, -1.4834105968475342e-05, -1.3653188943862915e-05, -1.2472271919250488e-05, -1.1291354894638062e-05, -1.0110437870025635e-05, -8.929520845413208e-06, -7.748603820800781e-06, -6.5676867961883545e-06, -5.386769771575928e-06, -4.205852746963501e-06, -3.0249357223510742e-06, -1.8440186977386475e-06, -6.631016731262207e-07, 5.178153514862061e-07, 1.6987323760986328e-06, 2.8796494007110596e-06, 4.060566425323486e-06, 5.241483449935913e-06, 6.42240047454834e-06, 7.603317499160767e-06, 8.784234523773193e-06, 9.96515154838562e-06, 1.1146068572998047e-05, 1.2326985597610474e-05, 1.35079026222229e-05, 1.4688819646835327e-05, 1.5869736671447754e-05, 1.705065369606018e-05, 1.8231570720672607e-05, 1.9412487745285034e-05, 2.059340476989746e-05, 2.1774321794509888e-05, 2.2955238819122314e-05, 2.413615584373474e-05, 2.5317072868347168e-05, 2.6497989892959595e-05, 2.767890691757202e-05, 2.8859823942184448e-05, 3.0040740966796875e-05, 3.12216579914093e-05, 3.240257501602173e-05, 3.3583492040634155e-05, 3.476440906524658e-05, 3.594532608985901e-05, 3.7126243114471436e-05, 3.830716013908386e-05, 3.948807716369629e-05, 4.0668994188308716e-05, 4.184991121292114e-05, 4.303082823753357e-05, 4.4211745262145996e-05, 4.539266228675842e-05, 4.657357931137085e-05, 4.7754496335983276e-05, 4.89354133605957e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 12.0, 27.0, 55.0, 95.0, 244.0, 705.0, 3029.0, 44103.0, 959052.0, 37312.0, 2718.0, 687.0, 240.0, 115.0, 78.0, 36.0, 19.0, 17.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.437744140625, -0.4242668151855469, -0.41078948974609375, -0.3973121643066406, -0.3838348388671875, -0.3703575134277344, -0.35688018798828125, -0.3434028625488281, -0.329925537109375, -0.3164482116699219, -0.30297088623046875, -0.2894935607910156, -0.2760162353515625, -0.2625389099121094, -0.24906158447265625, -0.23558425903320312, -0.22210693359375, -0.20862960815429688, -0.19515228271484375, -0.18167495727539062, -0.1681976318359375, -0.15472030639648438, -0.14124298095703125, -0.12776565551757812, -0.114288330078125, -0.10081100463867188, -0.08733367919921875, -0.07385635375976562, -0.0603790283203125, -0.046901702880859375, -0.03342437744140625, -0.019947052001953125, -0.0064697265625, 0.007007598876953125, 0.02048492431640625, 0.033962249755859375, 0.0474395751953125, 0.060916900634765625, 0.07439422607421875, 0.08787155151367188, 0.101348876953125, 0.11482620239257812, 0.12830352783203125, 0.14178085327148438, 0.1552581787109375, 0.16873550415039062, 0.18221282958984375, 0.19569015502929688, 0.20916748046875, 0.22264480590820312, 0.23612213134765625, 0.24959945678710938, 0.2630767822265625, 0.2765541076660156, 0.29003143310546875, 0.3035087585449219, 0.316986083984375, 0.3304634094238281, 0.34394073486328125, 0.3574180603027344, 0.3708953857421875, 0.3843727111816406, 0.39785003662109375, 0.4113273620605469, 0.4248046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 15.0, 26.0, 45.0, 81.0, 156.0, 230.0, 217.0, 94.0, 56.0, 31.0, 12.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4721260070800781, -0.45719146728515625, -0.4422569274902344, -0.4273223876953125, -0.4123878479003906, -0.39745330810546875, -0.3825187683105469, -0.367584228515625, -0.3526496887207031, -0.33771514892578125, -0.3227806091308594, -0.3078460693359375, -0.2929115295410156, -0.27797698974609375, -0.2630424499511719, -0.24810791015625, -0.23317337036132812, -0.21823883056640625, -0.20330429077148438, -0.1883697509765625, -0.17343521118164062, -0.15850067138671875, -0.14356613159179688, -0.128631591796875, -0.11369705200195312, -0.09876251220703125, -0.08382797241210938, -0.0688934326171875, -0.053958892822265625, -0.03902435302734375, -0.024089813232421875, -0.0091552734375, 0.005779266357421875, 0.02071380615234375, 0.035648345947265625, 0.0505828857421875, 0.06551742553710938, 0.08045196533203125, 0.09538650512695312, 0.110321044921875, 0.12525558471679688, 0.14019012451171875, 0.15512466430664062, 0.1700592041015625, 0.18499374389648438, 0.19992828369140625, 0.21486282348632812, 0.22979736328125, 0.24473190307617188, 0.25966644287109375, 0.2746009826660156, 0.2895355224609375, 0.3044700622558594, 0.31940460205078125, 0.3343391418457031, 0.349273681640625, 0.3642082214355469, 0.37914276123046875, 0.3940773010253906, 0.4090118408203125, 0.4239463806152344, 0.43888092041015625, 0.4538154602050781, 0.46875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 16.0, 21.0, 24.0, 41.0, 72.0, 77.0, 134.0, 148.0, 128.0, 95.0, 79.0, 49.0, 39.0, 21.0, 14.0, 12.0, 7.0, 4.0, 5.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.244434356689453, -2.130798578262329, -2.017162799835205, -1.903527021408081, -1.7898913621902466, -1.6762555837631226, -1.5626198053359985, -1.448984146118164, -1.33534836769104, -1.221712589263916, -1.108076810836792, -0.9944410920143127, -0.8808053731918335, -0.7671695947647095, -0.6535338163375854, -0.5398980975151062, -0.4262622594833374, -0.31262651085853577, -0.19899074733257294, -0.08535498380661011, 0.02828076481819153, 0.14191651344299316, 0.2555522918701172, 0.36918801069259644, 0.48282378911972046, 0.5964595675468445, 0.7100952863693237, 0.8237310647964478, 0.9373668432235718, 1.0510025024414062, 1.1646382808685303, 1.2782740592956543, 1.3919098377227783, 1.5055456161499023, 1.6191813945770264, 1.7328171730041504, 1.8464528322219849, 1.9600886106491089, 2.0737242698669434, 2.1873600482940674, 2.3009958267211914, 2.4146316051483154, 2.5282673835754395, 2.6419031620025635, 2.7555389404296875, 2.8691744804382324, 2.9828104972839355, 3.0964460372924805, 3.2100820541381836, 3.3237178325653076, 3.4373536109924316, 3.5509893894195557, 3.6646251678466797, 3.7782607078552246, 3.8918967247009277, 4.005532264709473, 4.119167804718018, 4.2328033447265625, 4.346439361572266, 4.4600749015808105, 4.573710918426514, 4.687346458435059, 4.800982475280762, 4.914618015289307, 5.02825403213501]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 10.0, 19.0, 14.0, 16.0, 19.0, 19.0, 42.0, 47.0, 48.0, 74.0, 70.0, 68.0, 75.0, 69.0, 64.0, 66.0, 40.0, 50.0, 33.0, 30.0, 36.0, 24.0, 14.0, 11.0, 6.0, 8.0, 7.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9931352138519287, -2.894886016845703, -2.7966365814208984, -2.6983871459960938, -2.600137948989868, -2.5018887519836426, -2.403639316558838, -2.305389881134033, -2.2071406841278076, -2.108891487121582, -2.0106420516967773, -1.9123927354812622, -1.814143419265747, -1.715894103050232, -1.6176447868347168, -1.5193954706192017, -1.4211461544036865, -1.3228968381881714, -1.2246475219726562, -1.1263982057571411, -1.028148889541626, -0.9298995733261108, -0.8316502571105957, -0.7334009408950806, -0.6351516246795654, -0.5369023084640503, -0.43865299224853516, -0.34040367603302, -0.24215435981750488, -0.14390504360198975, -0.04565572738647461, 0.05259358882904053, 0.15084266662597656, 0.2490919828414917, 0.34734129905700684, 0.445590615272522, 0.5438399314880371, 0.6420892477035522, 0.7403385639190674, 0.8385878801345825, 0.9368371963500977, 1.0350865125656128, 1.133335828781128, 1.231585144996643, 1.3298344612121582, 1.4280837774276733, 1.5263330936431885, 1.6245824098587036, 1.7228317260742188, 1.8210810422897339, 1.919330358505249, 2.0175795555114746, 2.1158289909362793, 2.214078426361084, 2.3123276233673096, 2.410576820373535, 2.50882625579834, 2.6070756912231445, 2.70532488822937, 2.8035740852355957, 2.9018235206604004, 3.000072956085205, 3.0983221530914307, 3.1965713500976562, 3.294820785522461]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 14.0, 9.0, 6.0, 9.0, 14.0, 14.0, 26.0, 28.0, 31.0, 42.0, 52.0, 71.0, 148.0, 227.0, 80.0, 55.0, 32.0, 31.0, 28.0, 19.0, 8.0, 10.0, 8.0, 6.0, 10.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.381103515625, -0.3696098327636719, -0.35811614990234375, -0.3466224670410156, -0.3351287841796875, -0.3236351013183594, -0.31214141845703125, -0.3006477355957031, -0.289154052734375, -0.2776603698730469, -0.26616668701171875, -0.2546730041503906, -0.2431793212890625, -0.23168563842773438, -0.22019195556640625, -0.20869827270507812, -0.19720458984375, -0.18571090698242188, -0.17421722412109375, -0.16272354125976562, -0.1512298583984375, -0.13973617553710938, -0.12824249267578125, -0.11674880981445312, -0.105255126953125, -0.09376144409179688, -0.08226776123046875, -0.07077407836914062, -0.0592803955078125, -0.047786712646484375, -0.03629302978515625, -0.024799346923828125, -0.0133056640625, -0.001811981201171875, 0.00968170166015625, 0.021175384521484375, 0.0326690673828125, 0.044162750244140625, 0.05565643310546875, 0.06715011596679688, 0.078643798828125, 0.09013748168945312, 0.10163116455078125, 0.11312484741210938, 0.1246185302734375, 0.13611221313476562, 0.14760589599609375, 0.15909957885742188, 0.17059326171875, 0.18208694458007812, 0.19358062744140625, 0.20507431030273438, 0.2165679931640625, 0.22806167602539062, 0.23955535888671875, 0.2510490417480469, 0.262542724609375, 0.2740364074707031, 0.28553009033203125, 0.2970237731933594, 0.3085174560546875, 0.3200111389160156, 0.33150482177734375, 0.3429985046386719, 0.3544921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 8.0, 21.0, 22.0, 42.0, 65.0, 133.0, 228.0, 565.0, 1584.0, 6420.0, 74690.0, 8283641.0, 16336.0, 3053.0, 920.0, 371.0, 204.0, 114.0, 51.0, 38.0, 19.0, 14.0, 17.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9379535913467407, -1.8796736001968384, -1.8213937282562256, -1.7631137371063232, -1.7048338651657104, -1.646553874015808, -1.5882740020751953, -1.529994010925293, -1.4717140197753906, -1.4134340286254883, -1.3551541566848755, -1.2968741655349731, -1.2385942935943604, -1.180314302444458, -1.1220343112945557, -1.0637544393539429, -1.00547456741333, -0.9471946358680725, -0.8889147043228149, -0.8306347131729126, -0.772354781627655, -0.7140748500823975, -0.6557949185371399, -0.5975149869918823, -0.53923499584198, -0.4809550642967224, -0.42267510294914246, -0.3643951714038849, -0.30611521005630493, -0.24783527851104736, -0.1895553469657898, -0.13127538561820984, -0.07299542427062988, -0.014715481549501419, 0.043564461171627045, 0.10184440016746521, 0.16012434661388397, 0.21840429306030273, 0.2766842246055603, 0.33496418595314026, 0.3932441174983978, 0.4515240490436554, 0.5098040103912354, 0.5680839419364929, 0.6263638734817505, 0.6846438646316528, 0.7429237365722656, 0.801203727722168, 0.8594836592674255, 0.9177635908126831, 0.9760435223579407, 1.0343234539031982, 1.0926034450531006, 1.150883436203003, 1.2091633081436157, 1.267443299293518, 1.3257231712341309, 1.3840031623840332, 1.442283034324646, 1.5005630254745483, 1.5588428974151611, 1.6171228885650635, 1.6754028797149658, 1.7336827516555786, 1.791962742805481]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4320980310440063, -1.3883832693099976, -1.3446685075759888, -1.3009538650512695, -1.2572391033172607, -1.213524341583252, -1.1698095798492432, -1.1260948181152344, -1.0823800563812256, -1.0386652946472168, -0.9949505925178528, -0.951235830783844, -0.90752112865448, -0.8638063669204712, -0.8200916051864624, -0.7763768434524536, -0.7326622009277344, -0.6889474391937256, -0.6452327370643616, -0.6015179753303528, -0.5578032732009888, -0.51408851146698, -0.4703737497329712, -0.4266590178012848, -0.3829442858695984, -0.339229553937912, -0.2955148220062256, -0.2518000602722168, -0.2080853283405304, -0.164370596408844, -0.1206558346748352, -0.0769411027431488, -0.03322649002075195, 0.010488249361515045, 0.05420298874378204, 0.09791773557662964, 0.14163246750831604, 0.18534719944000244, 0.22906196117401123, 0.27277669310569763, 0.31649142503738403, 0.36020615696907043, 0.40392088890075684, 0.4476356506347656, 0.491350382566452, 0.5350651144981384, 0.5787798762321472, 0.6224945783615112, 0.66620934009552, 0.7099241018295288, 0.7536388039588928, 0.7973535656929016, 0.8410682678222656, 0.8847830295562744, 0.9284977912902832, 0.972212553024292, 1.0159273147583008, 1.0596420764923096, 1.1033568382263184, 1.1470715999603271, 1.1907862424850464, 1.2345010042190552, 1.278215765953064, 1.3219305276870728, 1.365645170211792]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 5.0, 8.0, 7.0, 16.0, 15.0, 20.0, 23.0, 31.0, 35.0, 37.0, 74.0, 57.0, 62.0, 68.0, 87.0, 70.0, 58.0, 78.0, 44.0, 46.0, 35.0, 37.0, 25.0, 17.0, 12.0, 7.0, 1.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279541015625, -0.27188873291015625, -0.2642364501953125, -0.25658416748046875, -0.248931884765625, -0.24127960205078125, -0.2336273193359375, -0.22597503662109375, -0.21832275390625, -0.21067047119140625, -0.2030181884765625, -0.19536590576171875, -0.187713623046875, -0.18006134033203125, -0.1724090576171875, -0.16475677490234375, -0.1571044921875, -0.14945220947265625, -0.1417999267578125, -0.13414764404296875, -0.126495361328125, -0.11884307861328125, -0.1111907958984375, -0.10353851318359375, -0.09588623046875, -0.08823394775390625, -0.0805816650390625, -0.07292938232421875, -0.065277099609375, -0.05762481689453125, -0.0499725341796875, -0.04232025146484375, -0.03466796875, -0.02701568603515625, -0.0193634033203125, -0.01171112060546875, -0.004058837890625, 0.00359344482421875, 0.0112457275390625, 0.01889801025390625, 0.02655029296875, 0.03420257568359375, 0.0418548583984375, 0.04950714111328125, 0.057159423828125, 0.06481170654296875, 0.0724639892578125, 0.08011627197265625, 0.0877685546875, 0.09542083740234375, 0.1030731201171875, 0.11072540283203125, 0.118377685546875, 0.12602996826171875, 0.1336822509765625, 0.14133453369140625, 0.14898681640625, 0.15663909912109375, 0.1642913818359375, 0.17194366455078125, 0.179595947265625, 0.18724822998046875, 0.1949005126953125, 0.20255279541015625, 0.210205078125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 13.0, 17.0, 29.0, 34.0, 54.0, 76.0, 122.0, 180.0, 311.0, 540.0, 966.0, 1754.0, 3615.0, 7624.0, 17935.0, 50805.0, 192073.0, 172171.0, 45460.0, 16354.0, 6953.0, 3319.0, 1690.0, 894.0, 477.0, 298.0, 168.0, 124.0, 78.0, 37.0, 29.0, 16.0, 13.0, 8.0, 11.0, 6.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.532928466796875, -2.42718505859375, -2.321441650390625, -2.2156982421875, -2.109954833984375, -2.00421142578125, -1.898468017578125, -1.792724609375, -1.686981201171875, -1.58123779296875, -1.475494384765625, -1.3697509765625, -1.264007568359375, -1.15826416015625, -1.052520751953125, -0.94677734375, -0.841033935546875, -0.73529052734375, -0.629547119140625, -0.5238037109375, -0.418060302734375, -0.31231689453125, -0.206573486328125, -0.100830078125, 0.004913330078125, 0.11065673828125, 0.216400146484375, 0.3221435546875, 0.427886962890625, 0.53363037109375, 0.639373779296875, 0.7451171875, 0.850860595703125, 0.95660400390625, 1.062347412109375, 1.1680908203125, 1.273834228515625, 1.37957763671875, 1.485321044921875, 1.591064453125, 1.696807861328125, 1.80255126953125, 1.908294677734375, 2.0140380859375, 2.119781494140625, 2.22552490234375, 2.331268310546875, 2.43701171875, 2.542755126953125, 2.64849853515625, 2.754241943359375, 2.8599853515625, 2.965728759765625, 3.07147216796875, 3.177215576171875, 3.282958984375, 3.388702392578125, 3.49444580078125, 3.600189208984375, 3.7059326171875, 3.811676025390625, 3.91741943359375, 4.023162841796875, 4.12890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 13.0, 17.0, 15.0, 17.0, 18.0, 18.0, 27.0, 27.0, 34.0, 33.0, 37.0, 56.0, 49.0, 59.0, 51.0, 52.0, 61.0, 44.0, 51.0, 33.0, 36.0, 29.0, 37.0, 24.0, 21.0, 24.0, 24.0, 22.0, 10.0, 13.0, 11.0, 4.0, 2.0, 9.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.2611961364746094, -0.25237274169921875, -0.24354934692382812, -0.2347259521484375, -0.22590255737304688, -0.21707916259765625, -0.20825576782226562, -0.199432373046875, -0.19060897827148438, -0.18178558349609375, -0.17296218872070312, -0.1641387939453125, -0.15531539916992188, -0.14649200439453125, -0.13766860961914062, -0.12884521484375, -0.12002182006835938, -0.11119842529296875, -0.10237503051757812, -0.0935516357421875, -0.08472824096679688, -0.07590484619140625, -0.06708145141601562, -0.058258056640625, -0.049434661865234375, -0.04061126708984375, -0.031787872314453125, -0.0229644775390625, -0.014141082763671875, -0.00531768798828125, 0.003505706787109375, 0.0123291015625, 0.021152496337890625, 0.02997589111328125, 0.038799285888671875, 0.0476226806640625, 0.056446075439453125, 0.06526947021484375, 0.07409286499023438, 0.082916259765625, 0.09173965454101562, 0.10056304931640625, 0.10938644409179688, 0.1182098388671875, 0.12703323364257812, 0.13585662841796875, 0.14468002319335938, 0.15350341796875, 0.16232681274414062, 0.17115020751953125, 0.17997360229492188, 0.1887969970703125, 0.19762039184570312, 0.20644378662109375, 0.21526718139648438, 0.224090576171875, 0.23291397094726562, 0.24173736572265625, 0.2505607604980469, 0.2593841552734375, 0.2682075500488281, 0.27703094482421875, 0.2858543395996094, 0.294677734375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 11.0, 8.0, 18.0, 12.0, 11.0, 21.0, 22.0, 33.0, 41.0, 37.0, 52.0, 43.0, 39.0, 30.0, 22.0, 20.0, 13.0, 6.0, 13.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0747687816619873, -1.0402421951293945, -1.0057154893875122, -0.9711889028549194, -0.9366622567176819, -0.9021356105804443, -0.8676090240478516, -0.833082377910614, -0.7985557317733765, -0.7640290856361389, -0.7295024991035461, -0.6949758529663086, -0.660449206829071, -0.6259225606918335, -0.5913959741592407, -0.5568693280220032, -0.5223427414894104, -0.48781612515449524, -0.4532894790172577, -0.41876286268234253, -0.384236216545105, -0.3497096002101898, -0.31518298387527466, -0.2806563377380371, -0.24612972140312195, -0.2116030901670456, -0.17707645893096924, -0.14254984259605408, -0.10802321135997772, -0.07349658012390137, -0.038969963788986206, -0.004443332552909851, 0.030083298683166504, 0.06460992991924286, 0.09913655370473862, 0.13366317749023438, 0.16818980872631073, 0.20271643996238708, 0.23724305629730225, 0.2717697024345398, 0.30629631876945496, 0.3408229351043701, 0.37534958124160767, 0.4098761975765228, 0.444402813911438, 0.47892946004867554, 0.5134561061859131, 0.5479826927185059, 0.5825093388557434, 0.617035984992981, 0.6515625715255737, 0.6860892176628113, 0.7206158638000488, 0.7551424503326416, 0.7896690964698792, 0.8241957426071167, 0.8587223291397095, 0.893248975276947, 0.9277755618095398, 0.9623022079467773, 0.9968288540840149, 1.0313555002212524, 1.0658820867538452, 1.100408673286438, 1.1349353790283203]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 5.0, 1.0, 13.0, 1.0, 9.0, 11.0, 15.0, 16.0, 19.0, 23.0, 35.0, 34.0, 47.0, 40.0, 52.0, 33.0, 27.0, 17.0, 15.0, 8.0, 8.0, 4.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.28456449508667, -1.245125412940979, -1.205686330795288, -1.1662472486495972, -1.1268081665039062, -1.0873689651489258, -1.0479298830032349, -1.008490800857544, -0.969051718711853, -0.9296126365661621, -0.8901735544204712, -0.8507344126701355, -0.8112953305244446, -0.7718562483787537, -0.732417106628418, -0.692978024482727, -0.6535389423370361, -0.6140998601913452, -0.5746607780456543, -0.5352216362953186, -0.4957825541496277, -0.45634347200393677, -0.41690436005592346, -0.37746524810791016, -0.33802616596221924, -0.2985870838165283, -0.259147971868515, -0.2197088748216629, -0.1802697777748108, -0.14083068072795868, -0.10139158368110657, -0.06195247173309326, -0.022513389587402344, 0.016925707459449768, 0.05636480450630188, 0.09580390155315399, 0.1352429986000061, 0.17468209564685822, 0.21412119269371033, 0.25356030464172363, 0.29299938678741455, 0.33243846893310547, 0.3718775808811188, 0.4113166928291321, 0.450755774974823, 0.4901948571205139, 0.5296339988708496, 0.5690730810165405, 0.6085121631622314, 0.6479512453079224, 0.6873903274536133, 0.726829469203949, 0.7662685513496399, 0.8057076334953308, 0.8451467752456665, 0.8845858573913574, 0.9240249395370483, 0.9634640216827393, 1.0029031038284302, 1.042342185974121, 1.0817813873291016, 1.1212204694747925, 1.1606595516204834, 1.2000986337661743, 1.2395377159118652]}, "eval/loss": 3.0510671138763428, "eval/bleu": 1.5827445667544166e-18, "eval/runtime": 2619.9089, "eval/samples_per_second": 5.634, "eval/steps_per_second": 0.704, "train/train_runtime": 93795.5595, "train/train_samples_per_second": 6.633, "train/train_steps_per_second": 0.104, "train/total_flos": 0.0, "train/train_loss": 3.260483605049765, "_wandb": {"runtime": 94192}} \ No newline at end of file