diff --git "a/wandb/run-20220327_210229-2wif55w7/files/wandb-summary.json" "b/wandb/run-20220327_210229-2wif55w7/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220327_210229-2wif55w7/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.9509, "train/learning_rate": 2.976e-05, "train/epoch": 2.24, "train/global_step": 500, "_runtime": 11469, "_timestamp": 1648426418, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 877.0, 134.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.84069061279297, -15.51488208770752, -7.18907356262207, 1.1367340087890625, 9.462543487548828, 17.788352966308594, 26.114158630371094, 34.43996810913086, 42.765777587890625, 51.09158706665039, 59.417396545410156, 67.74320220947266, 76.06901550292969, 84.39482116699219, 92.72062683105469, 101.04643249511719, 109.37224578857422, 117.69805145263672, 126.02386474609375, 134.34967041015625, 142.67547607421875, 151.00128173828125, 159.32708740234375, 167.6529083251953, 175.9787139892578, 184.3045196533203, 192.6303253173828, 200.95614624023438, 209.28195190429688, 217.60775756835938, 225.93356323242188, 234.25936889648438, 242.585205078125, 250.9110107421875, 259.23681640625, 267.5626220703125, 275.888427734375, 284.2142333984375, 292.5400390625, 300.8658752441406, 309.1916809082031, 317.5174865722656, 325.8432922363281, 334.1690979003906, 342.4949035644531, 350.82073974609375, 359.14654541015625, 367.47235107421875, 375.79815673828125, 384.12396240234375, 392.44976806640625, 400.77557373046875, 409.10137939453125, 417.42718505859375, 425.75299072265625, 434.0788269042969, 442.40460205078125, 450.73040771484375, 459.05621337890625, 467.38201904296875, 475.70782470703125, 484.03363037109375, 492.35943603515625, 500.6852722167969, 509.0110778808594]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 16.0, 35.0, 32.0, 45.0, 84.0, 94.0, 115.0, 126.0, 117.0, 92.0, 75.0, 65.0, 35.0, 23.0, 9.0, 9.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-50.390655517578125, -49.18394470214844, -47.97723388671875, -46.77052307128906, -45.563812255859375, -44.35710144042969, -43.150390625, -41.94367980957031, -40.736968994140625, -39.53025817871094, -38.32354736328125, -37.11683654785156, -35.910125732421875, -34.70341491699219, -33.4967041015625, -32.28999328613281, -31.083282470703125, -29.876571655273438, -28.66986083984375, -27.463150024414062, -26.256439208984375, -25.049728393554688, -23.843017578125, -22.636306762695312, -21.429595947265625, -20.222885131835938, -19.01617431640625, -17.809463500976562, -16.602752685546875, -15.396041870117188, -14.1893310546875, -12.982620239257812, -11.77590560913086, -10.569194793701172, -9.362483978271484, -8.155773162841797, -6.949062347412109, -5.742351531982422, -4.535640716552734, -3.328929901123047, -2.1222190856933594, -0.9155082702636719, 0.2912025451660156, 1.4979133605957031, 2.7046241760253906, 3.911334991455078, 5.118045806884766, 6.324756622314453, 7.531467437744141, 8.738178253173828, 9.944889068603516, 11.151599884033203, 12.35831069946289, 13.565021514892578, 14.771732330322266, 15.978443145751953, 17.18515396118164, 18.391864776611328, 19.598575592041016, 20.805286407470703, 22.01199722290039, 23.218708038330078, 24.425418853759766, 25.632129669189453, 26.83884048461914]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 5.0, 3.0, 10.0, 20.0, 24.0, 40.0, 65.0, 114.0, 248.0, 9231.0, 2012982.0, 2150358.0, 17216.0, 3708.0, 105.0, 59.0, 39.0, 16.0, 15.0, 3.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-120.0625, -117.134765625, -114.20703125, -111.279296875, -108.3515625, -105.423828125, -102.49609375, -99.568359375, -96.640625, -93.712890625, -90.78515625, -87.857421875, -84.9296875, -82.001953125, -79.07421875, -76.146484375, -73.21875, -70.291015625, -67.36328125, -64.435546875, -61.5078125, -58.580078125, -55.65234375, -52.724609375, -49.796875, -46.869140625, -43.94140625, -41.013671875, -38.0859375, -35.158203125, -32.23046875, -29.302734375, -26.375, -23.447265625, -20.51953125, -17.591796875, -14.6640625, -11.736328125, -8.80859375, -5.880859375, -2.953125, -0.025390625, 2.90234375, 5.830078125, 8.7578125, 11.685546875, 14.61328125, 17.541015625, 20.46875, 23.396484375, 26.32421875, 29.251953125, 32.1796875, 35.107421875, 38.03515625, 40.962890625, 43.890625, 46.818359375, 49.74609375, 52.673828125, 55.6015625, 58.529296875, 61.45703125, 64.384765625, 67.3125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 21.0, 37.0, 37.0, 42.0, 88.0, 94.0, 107.0, 121.0, 107.0, 106.0, 71.0, 65.0, 29.0, 20.0, 17.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-55.1875, -53.82080078125, -52.4541015625, -51.08740234375, -49.720703125, -48.35400390625, -46.9873046875, -45.62060546875, -44.25390625, -42.88720703125, -41.5205078125, -40.15380859375, -38.787109375, -37.42041015625, -36.0537109375, -34.68701171875, -33.3203125, -31.95361328125, -30.5869140625, -29.22021484375, -27.853515625, -26.48681640625, -25.1201171875, -23.75341796875, -22.38671875, -21.02001953125, -19.6533203125, -18.28662109375, -16.919921875, -15.55322265625, -14.1865234375, -12.81982421875, -11.453125, -10.08642578125, -8.7197265625, -7.35302734375, -5.986328125, -4.61962890625, -3.2529296875, -1.88623046875, -0.51953125, 0.84716796875, 2.2138671875, 3.58056640625, 4.947265625, 6.31396484375, 7.6806640625, 9.04736328125, 10.4140625, 11.78076171875, 13.1474609375, 14.51416015625, 15.880859375, 17.24755859375, 18.6142578125, 19.98095703125, 21.34765625, 22.71435546875, 24.0810546875, 25.44775390625, 26.814453125, 28.18115234375, 29.5478515625, 30.91455078125, 32.28125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 15.0, 513.0, 4193660.0, 82.0, 16.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-4800.0, -4714.734375, -4629.46875, -4544.203125, -4458.9375, -4373.671875, -4288.40625, -4203.140625, -4117.875, -4032.609375, -3947.34375, -3862.078125, -3776.8125, -3691.546875, -3606.28125, -3521.015625, -3435.75, -3350.484375, -3265.21875, -3179.953125, -3094.6875, -3009.421875, -2924.15625, -2838.890625, -2753.625, -2668.359375, -2583.09375, -2497.828125, -2412.5625, -2327.296875, -2242.03125, -2156.765625, -2071.5, -1986.234375, -1900.96875, -1815.703125, -1730.4375, -1645.171875, -1559.90625, -1474.640625, -1389.375, -1304.109375, -1218.84375, -1133.578125, -1048.3125, -963.046875, -877.78125, -792.515625, -707.25, -621.984375, -536.71875, -451.453125, -366.1875, -280.921875, -195.65625, -110.390625, -25.125, 60.140625, 145.40625, 230.671875, 315.9375, 401.203125, 486.46875, 571.734375, 657.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 59.0, 3932.0, 77.0, 10.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-143.0, -140.470947265625, -137.94189453125, -135.412841796875, -132.8837890625, -130.354736328125, -127.82568359375, -125.296630859375, -122.767578125, -120.238525390625, -117.70947265625, -115.180419921875, -112.6513671875, -110.122314453125, -107.59326171875, -105.064208984375, -102.53515625, -100.006103515625, -97.47705078125, -94.947998046875, -92.4189453125, -89.889892578125, -87.36083984375, -84.831787109375, -82.302734375, -79.773681640625, -77.24462890625, -74.715576171875, -72.1865234375, -69.657470703125, -67.12841796875, -64.599365234375, -62.0703125, -59.541259765625, -57.01220703125, -54.483154296875, -51.9541015625, -49.425048828125, -46.89599609375, -44.366943359375, -41.837890625, -39.308837890625, -36.77978515625, -34.250732421875, -31.7216796875, -29.192626953125, -26.66357421875, -24.134521484375, -21.60546875, -19.076416015625, -16.54736328125, -14.018310546875, -11.4892578125, -8.960205078125, -6.43115234375, -3.902099609375, -1.373046875, 1.156005859375, 3.68505859375, 6.214111328125, 8.7431640625, 11.272216796875, 13.80126953125, 16.330322265625, 18.859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 12.0, 19.0, 33.0, 79.0, 159.0, 257.0, 219.0, 119.0, 56.0, 21.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0], "bins": [-36.846946716308594, -36.138763427734375, -35.43058395385742, -34.7224006652832, -34.01422119140625, -33.30603790283203, -32.59785461425781, -31.88967514038086, -31.181493759155273, -30.473312377929688, -29.7651309967041, -29.056949615478516, -28.348766326904297, -27.64058494567871, -26.932403564453125, -26.22422218322754, -25.516040802001953, -24.807859420776367, -24.09967803955078, -23.391494750976562, -22.683313369750977, -21.97513198852539, -21.266950607299805, -20.55876922607422, -19.8505859375, -19.142404556274414, -18.434223175048828, -17.72603988647461, -17.017858505249023, -16.309677124023438, -15.601495742797852, -14.893314361572266, -14.18513298034668, -13.476951599121094, -12.768769264221191, -12.060587882995605, -11.35240650177002, -10.644224166870117, -9.936042785644531, -9.227861404418945, -8.51968002319336, -7.811498165130615, -7.103316783905029, -6.395134925842285, -5.686953544616699, -4.978771686553955, -4.270589828491211, -3.562408447265625, -2.8542261123657227, -2.1460444927215576, -1.437862753868103, -0.7296810150146484, -0.0214993953704834, 0.6866822242736816, 1.3948640823364258, 2.1030454635620117, 2.811227321624756, 3.519408941268921, 4.227590560913086, 4.93577241897583, 5.643954277038574, 6.35213565826416, 7.060317516326904, 7.76849889755249, 8.476680755615234]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 11.0, 12.0, 13.0, 20.0, 20.0, 34.0, 47.0, 50.0, 45.0, 62.0, 66.0, 57.0, 72.0, 62.0, 58.0, 58.0, 64.0, 48.0, 40.0, 26.0, 25.0, 29.0, 12.0, 16.0, 13.0, 1.0, 6.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.440315246582031, -12.05218505859375, -11.664053916931152, -11.275923728942871, -10.88779354095459, -10.499662399291992, -10.111532211303711, -9.72340202331543, -9.335271835327148, -8.947141647338867, -8.55901050567627, -8.170880317687988, -7.782750129699707, -7.394619464874268, -7.006488800048828, -6.618358612060547, -6.230227470397949, -5.84209680557251, -5.4539666175842285, -5.065835952758789, -4.677705764770508, -4.289575099945068, -3.901444435119629, -3.5133140087127686, -3.125183582305908, -2.737053155899048, -2.3489227294921875, -1.960792064666748, -1.5726616382598877, -1.1845312118530273, -0.7964005470275879, -0.40827012062072754, -0.020140647888183594, 0.36798983812332153, 0.7561203241348267, 1.1442508697509766, 1.532381296157837, 1.9205117225646973, 2.3086423873901367, 2.696772813796997, 3.0849032402038574, 3.4730336666107178, 3.861164093017578, 4.249294757843018, 4.637425422668457, 5.025555610656738, 5.413686275482178, 5.801816940307617, 6.189947128295898, 6.578077793121338, 6.966207981109619, 7.354338645935059, 7.74246883392334, 8.130599975585938, 8.518730163574219, 8.9068603515625, 9.294990539550781, 9.683120727539062, 10.07125186920166, 10.459382057189941, 10.847512245178223, 11.23564338684082, 11.623773574829102, 12.011903762817383, 12.40003490447998]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 13.0, 19.0, 34.0, 46.0, 74.0, 116.0, 208.0, 421.0, 1006.0, 2612.0, 10652.0, 92965.0, 845962.0, 80158.0, 9960.0, 2499.0, 883.0, 400.0, 210.0, 130.0, 66.0, 40.0, 26.0, 12.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.48046875, -4.34661865234375, -4.2127685546875, -4.07891845703125, -3.945068359375, -3.81121826171875, -3.6773681640625, -3.54351806640625, -3.40966796875, -3.27581787109375, -3.1419677734375, -3.00811767578125, -2.874267578125, -2.74041748046875, -2.6065673828125, -2.47271728515625, -2.3388671875, -2.20501708984375, -2.0711669921875, -1.93731689453125, -1.803466796875, -1.66961669921875, -1.5357666015625, -1.40191650390625, -1.26806640625, -1.13421630859375, -1.0003662109375, -0.86651611328125, -0.732666015625, -0.59881591796875, -0.4649658203125, -0.33111572265625, -0.197265625, -0.06341552734375, 0.0704345703125, 0.20428466796875, 0.338134765625, 0.47198486328125, 0.6058349609375, 0.73968505859375, 0.87353515625, 1.00738525390625, 1.1412353515625, 1.27508544921875, 1.408935546875, 1.54278564453125, 1.6766357421875, 1.81048583984375, 1.9443359375, 2.07818603515625, 2.2120361328125, 2.34588623046875, 2.479736328125, 2.61358642578125, 2.7474365234375, 2.88128662109375, 3.01513671875, 3.14898681640625, 3.2828369140625, 3.41668701171875, 3.550537109375, 3.68438720703125, 3.8182373046875, 3.95208740234375, 4.0859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 22.0, 25.0, 37.0, 64.0, 84.0, 95.0, 107.0, 112.0, 106.0, 103.0, 70.0, 59.0, 40.0, 18.0, 17.0, 5.0, 9.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.609375, -15.097900390625, -14.58642578125, -14.074951171875, -13.5634765625, -13.052001953125, -12.54052734375, -12.029052734375, -11.517578125, -11.006103515625, -10.49462890625, -9.983154296875, -9.4716796875, -8.960205078125, -8.44873046875, -7.937255859375, -7.42578125, -6.914306640625, -6.40283203125, -5.891357421875, -5.3798828125, -4.868408203125, -4.35693359375, -3.845458984375, -3.333984375, -2.822509765625, -2.31103515625, -1.799560546875, -1.2880859375, -0.776611328125, -0.26513671875, 0.246337890625, 0.7578125, 1.269287109375, 1.78076171875, 2.292236328125, 2.8037109375, 3.315185546875, 3.82666015625, 4.338134765625, 4.849609375, 5.361083984375, 5.87255859375, 6.384033203125, 6.8955078125, 7.406982421875, 7.91845703125, 8.429931640625, 8.94140625, 9.452880859375, 9.96435546875, 10.475830078125, 10.9873046875, 11.498779296875, 12.01025390625, 12.521728515625, 13.033203125, 13.544677734375, 14.05615234375, 14.567626953125, 15.0791015625, 15.590576171875, 16.10205078125, 16.613525390625, 17.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 7.0, 15.0, 15.0, 22.0, 33.0, 51.0, 64.0, 112.0, 210.0, 301.0, 563.0, 978.0, 1845.0, 3708.0, 8191.0, 19991.0, 58306.0, 228857.0, 538614.0, 123753.0, 37140.0, 13738.0, 5852.0, 2807.0, 1453.0, 801.0, 409.0, 243.0, 160.0, 92.0, 86.0, 41.0, 29.0, 15.0, 12.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4091796875, -1.3655548095703125, -1.321929931640625, -1.2783050537109375, -1.23468017578125, -1.1910552978515625, -1.147430419921875, -1.1038055419921875, -1.0601806640625, -1.0165557861328125, -0.972930908203125, -0.9293060302734375, -0.88568115234375, -0.8420562744140625, -0.798431396484375, -0.7548065185546875, -0.711181640625, -0.6675567626953125, -0.623931884765625, -0.5803070068359375, -0.53668212890625, -0.4930572509765625, -0.449432373046875, -0.4058074951171875, -0.3621826171875, -0.3185577392578125, -0.274932861328125, -0.2313079833984375, -0.18768310546875, -0.1440582275390625, -0.100433349609375, -0.0568084716796875, -0.01318359375, 0.0304412841796875, 0.074066162109375, 0.1176910400390625, 0.16131591796875, 0.2049407958984375, 0.248565673828125, 0.2921905517578125, 0.3358154296875, 0.3794403076171875, 0.423065185546875, 0.4666900634765625, 0.51031494140625, 0.5539398193359375, 0.597564697265625, 0.6411895751953125, 0.684814453125, 0.7284393310546875, 0.772064208984375, 0.8156890869140625, 0.85931396484375, 0.9029388427734375, 0.946563720703125, 0.9901885986328125, 1.0338134765625, 1.0774383544921875, 1.121063232421875, 1.1646881103515625, 1.20831298828125, 1.2519378662109375, 1.295562744140625, 1.3391876220703125, 1.3828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 7.0, 7.0, 5.0, 11.0, 20.0, 17.0, 28.0, 32.0, 34.0, 41.0, 54.0, 49.0, 46.0, 47.0, 47.0, 54.0, 72.0, 54.0, 42.0, 56.0, 42.0, 52.0, 28.0, 21.0, 19.0, 19.0, 15.0, 19.0, 10.0, 9.0, 6.0, 3.0, 2.0, 5.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-15.5390625, -15.0885009765625, -14.637939453125, -14.1873779296875, -13.73681640625, -13.2862548828125, -12.835693359375, -12.3851318359375, -11.9345703125, -11.4840087890625, -11.033447265625, -10.5828857421875, -10.13232421875, -9.6817626953125, -9.231201171875, -8.7806396484375, -8.330078125, -7.8795166015625, -7.428955078125, -6.9783935546875, -6.52783203125, -6.0772705078125, -5.626708984375, -5.1761474609375, -4.7255859375, -4.2750244140625, -3.824462890625, -3.3739013671875, -2.92333984375, -2.4727783203125, -2.022216796875, -1.5716552734375, -1.12109375, -0.6705322265625, -0.219970703125, 0.2305908203125, 0.68115234375, 1.1317138671875, 1.582275390625, 2.0328369140625, 2.4833984375, 2.9339599609375, 3.384521484375, 3.8350830078125, 4.28564453125, 4.7362060546875, 5.186767578125, 5.6373291015625, 6.087890625, 6.5384521484375, 6.989013671875, 7.4395751953125, 7.89013671875, 8.3406982421875, 8.791259765625, 9.2418212890625, 9.6923828125, 10.1429443359375, 10.593505859375, 11.0440673828125, 11.49462890625, 11.9451904296875, 12.395751953125, 12.8463134765625, 13.296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 5.0, 7.0, 12.0, 19.0, 25.0, 31.0, 55.0, 77.0, 123.0, 184.0, 343.0, 549.0, 988.0, 1673.0, 3090.0, 6134.0, 14530.0, 42333.0, 192771.0, 563892.0, 158682.0, 37051.0, 13256.0, 5794.0, 3075.0, 1569.0, 950.0, 515.0, 323.0, 178.0, 114.0, 81.0, 38.0, 33.0, 20.0, 8.0, 7.0, 6.0, 6.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.195068359375, -0.18923568725585938, -0.18340301513671875, -0.17757034301757812, -0.1717376708984375, -0.16590499877929688, -0.16007232666015625, -0.15423965454101562, -0.148406982421875, -0.14257431030273438, -0.13674163818359375, -0.13090896606445312, -0.1250762939453125, -0.11924362182617188, -0.11341094970703125, -0.10757827758789062, -0.10174560546875, -0.09591293334960938, -0.09008026123046875, -0.08424758911132812, -0.0784149169921875, -0.07258224487304688, -0.06674957275390625, -0.060916900634765625, -0.055084228515625, -0.049251556396484375, -0.04341888427734375, -0.037586212158203125, -0.0317535400390625, -0.025920867919921875, -0.02008819580078125, -0.014255523681640625, -0.0084228515625, -0.002590179443359375, 0.00324249267578125, 0.009075164794921875, 0.0149078369140625, 0.020740509033203125, 0.02657318115234375, 0.032405853271484375, 0.038238525390625, 0.044071197509765625, 0.04990386962890625, 0.055736541748046875, 0.0615692138671875, 0.06740188598632812, 0.07323455810546875, 0.07906723022460938, 0.08489990234375, 0.09073257446289062, 0.09656524658203125, 0.10239791870117188, 0.1082305908203125, 0.11406326293945312, 0.11989593505859375, 0.12572860717773438, 0.131561279296875, 0.13739395141601562, 0.14322662353515625, 0.14905929565429688, 0.1548919677734375, 0.16072463989257812, 0.16655731201171875, 0.17238998413085938, 0.17822265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 12.0, 5.0, 14.0, 28.0, 29.0, 46.0, 36.0, 85.0, 91.0, 111.0, 110.0, 133.0, 77.0, 67.0, 47.0, 25.0, 28.0, 16.0, 9.0, 11.0, 8.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011372566223144531, -0.0001104092225432396, -0.00010709278285503387, -0.00010377634316682816, -0.00010045990347862244, -9.714346379041672e-05, -9.3827024102211e-05, -9.051058441400528e-05, -8.719414472579956e-05, -8.387770503759384e-05, -8.056126534938812e-05, -7.72448256611824e-05, -7.392838597297668e-05, -7.061194628477097e-05, -6.729550659656525e-05, -6.397906690835953e-05, -6.066262722015381e-05, -5.734618753194809e-05, -5.402974784374237e-05, -5.071330815553665e-05, -4.739686846733093e-05, -4.4080428779125214e-05, -4.0763989090919495e-05, -3.7447549402713776e-05, -3.413110971450806e-05, -3.081467002630234e-05, -2.749823033809662e-05, -2.41817906498909e-05, -2.086535096168518e-05, -1.754891127347946e-05, -1.4232471585273743e-05, -1.0916031897068024e-05, -7.599592208862305e-06, -4.283152520656586e-06, -9.667128324508667e-07, 2.3497268557548523e-06, 5.666166543960571e-06, 8.98260623216629e-06, 1.229904592037201e-05, 1.5615485608577728e-05, 1.8931925296783447e-05, 2.2248364984989166e-05, 2.5564804673194885e-05, 2.8881244361400604e-05, 3.219768404960632e-05, 3.551412373781204e-05, 3.883056342601776e-05, 4.214700311422348e-05, 4.54634428024292e-05, 4.877988249063492e-05, 5.209632217884064e-05, 5.5412761867046356e-05, 5.8729201555252075e-05, 6.20456412434578e-05, 6.536208093166351e-05, 6.867852061986923e-05, 7.199496030807495e-05, 7.531139999628067e-05, 7.862783968448639e-05, 8.194427937269211e-05, 8.526071906089783e-05, 8.857715874910355e-05, 9.189359843730927e-05, 9.521003812551498e-05, 9.85264778137207e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 11.0, 9.0, 13.0, 35.0, 58.0, 82.0, 133.0, 348.0, 2699.0, 543946.0, 497914.0, 2564.0, 355.0, 126.0, 54.0, 36.0, 22.0, 28.0, 21.0, 21.0, 14.0, 9.0, 6.0, 4.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66357421875, -0.6398696899414062, -0.6161651611328125, -0.5924606323242188, -0.568756103515625, -0.5450515747070312, -0.5213470458984375, -0.49764251708984375, -0.47393798828125, -0.45023345947265625, -0.4265289306640625, -0.40282440185546875, -0.379119873046875, -0.35541534423828125, -0.3317108154296875, -0.30800628662109375, -0.2843017578125, -0.26059722900390625, -0.2368927001953125, -0.21318817138671875, -0.189483642578125, -0.16577911376953125, -0.1420745849609375, -0.11837005615234375, -0.09466552734375, -0.07096099853515625, -0.0472564697265625, -0.02355194091796875, 0.000152587890625, 0.02385711669921875, 0.0475616455078125, 0.07126617431640625, 0.094970703125, 0.11867523193359375, 0.1423797607421875, 0.16608428955078125, 0.189788818359375, 0.21349334716796875, 0.2371978759765625, 0.26090240478515625, 0.28460693359375, 0.30831146240234375, 0.3320159912109375, 0.35572052001953125, 0.379425048828125, 0.40312957763671875, 0.4268341064453125, 0.45053863525390625, 0.4742431640625, 0.49794769287109375, 0.5216522216796875, 0.5453567504882812, 0.569061279296875, 0.5927658081054688, 0.6164703369140625, 0.6401748657226562, 0.66387939453125, 0.6875839233398438, 0.7112884521484375, 0.7349929809570312, 0.758697509765625, 0.7824020385742188, 0.8061065673828125, 0.8298110961914062, 0.853515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 10.0, 20.0, 30.0, 45.0, 54.0, 61.0, 96.0, 114.0, 132.0, 127.0, 79.0, 71.0, 36.0, 19.0, 21.0, 10.0, 9.0, 17.0, 5.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0687255859375, -0.06628990173339844, -0.06385421752929688, -0.06141853332519531, -0.05898284912109375, -0.05654716491699219, -0.054111480712890625, -0.05167579650878906, -0.0492401123046875, -0.04680442810058594, -0.044368743896484375, -0.04193305969238281, -0.03949737548828125, -0.03706169128417969, -0.034626007080078125, -0.03219032287597656, -0.029754638671875, -0.027318954467773438, -0.024883270263671875, -0.022447586059570312, -0.02001190185546875, -0.017576217651367188, -0.015140533447265625, -0.012704849243164062, -0.0102691650390625, -0.007833480834960938, -0.005397796630859375, -0.0029621124267578125, -0.00052642822265625, 0.0019092559814453125, 0.004344940185546875, 0.0067806243896484375, 0.00921630859375, 0.011651992797851562, 0.014087677001953125, 0.016523361206054688, 0.01895904541015625, 0.021394729614257812, 0.023830413818359375, 0.026266098022460938, 0.0287017822265625, 0.031137466430664062, 0.033573150634765625, 0.03600883483886719, 0.03844451904296875, 0.04088020324707031, 0.043315887451171875, 0.04575157165527344, 0.048187255859375, 0.05062294006347656, 0.053058624267578125, 0.05549430847167969, 0.05792999267578125, 0.06036567687988281, 0.06280136108398438, 0.06523704528808594, 0.0676727294921875, 0.07010841369628906, 0.07254409790039062, 0.07497978210449219, 0.07741546630859375, 0.07985115051269531, 0.08228683471679688, 0.08472251892089844, 0.087158203125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 9.0, 8.0, 22.0, 76.0, 230.0, 328.0, 219.0, 65.0, 31.0, 5.0, 4.0, 4.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.306140899658203, -27.570613861083984, -26.835086822509766, -26.099559783935547, -25.364032745361328, -24.62850570678711, -23.89297866821289, -23.157451629638672, -22.421924591064453, -21.686397552490234, -20.950870513916016, -20.215343475341797, -19.479816436767578, -18.74428939819336, -18.00876235961914, -17.273235321044922, -16.537710189819336, -15.802183151245117, -15.066656112670898, -14.33112907409668, -13.595602035522461, -12.860074996948242, -12.12454891204834, -11.389021873474121, -10.653494834899902, -9.917967796325684, -9.182440757751465, -8.446914672851562, -7.7113871574401855, -6.975860118865967, -6.240333557128906, -5.5048065185546875, -4.769277572631836, -4.033750534057617, -3.2982237339019775, -2.562696933746338, -1.8271698951721191, -1.0916428565979004, -0.35611629486083984, 0.3794107437133789, 1.1149377822875977, 1.8504647016525269, 2.585991621017456, 3.3215184211730957, 4.0570454597473145, 4.792572498321533, 5.528099060058594, 6.2636260986328125, 6.999153137207031, 7.73468017578125, 8.470207214355469, 9.205734252929688, 9.941261291503906, 10.676788330078125, 11.412314414978027, 12.147841453552246, 12.883368492126465, 13.618895530700684, 14.354422569274902, 15.089948654174805, 15.825475692749023, 16.561002731323242, 17.29652976989746, 18.03205680847168, 18.7675838470459]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 6.0, 21.0, 27.0, 27.0, 72.0, 80.0, 88.0, 114.0, 112.0, 99.0, 110.0, 75.0, 52.0, 41.0, 23.0, 19.0, 6.0, 8.0, 7.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.959997177124023, -14.454948425292969, -13.949899673461914, -13.44485092163086, -12.939802169799805, -12.43475341796875, -11.929704666137695, -11.42465591430664, -10.919607162475586, -10.414558410644531, -9.909509658813477, -9.404460906982422, -8.899412155151367, -8.394363403320312, -7.889314651489258, -7.384265899658203, -6.879217147827148, -6.374168395996094, -5.869119644165039, -5.364070892333984, -4.85902214050293, -4.353973388671875, -3.8489246368408203, -3.3438758850097656, -2.838827133178711, -2.3337783813476562, -1.8287296295166016, -1.3236808776855469, -0.8186321258544922, -0.3135833740234375, 0.1914653778076172, 0.6965141296386719, 1.2015609741210938, 1.7066097259521484, 2.211658477783203, 2.716707229614258, 3.2217559814453125, 3.726804733276367, 4.231853485107422, 4.736902236938477, 5.241950988769531, 5.746999740600586, 6.252048492431641, 6.757097244262695, 7.26214599609375, 7.767194747924805, 8.27224349975586, 8.777292251586914, 9.282341003417969, 9.787389755249023, 10.292438507080078, 10.797487258911133, 11.302536010742188, 11.807584762573242, 12.312633514404297, 12.817682266235352, 13.322731018066406, 13.827779769897461, 14.332828521728516, 14.83787727355957, 15.342926025390625, 15.84797477722168, 16.353023529052734, 16.85807228088379, 17.363121032714844]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 10.0, 6.0, 22.0, 24.0, 25.0, 57.0, 94.0, 158.0, 337.0, 645.0, 1524.0, 3851.0, 11333.0, 44608.0, 253775.0, 570410.0, 124359.0, 25163.0, 7469.0, 2626.0, 1005.0, 503.0, 217.0, 130.0, 65.0, 40.0, 23.0, 21.0, 10.0, 5.0, 4.0, 4.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.09765625, -5.9342041015625, -5.770751953125, -5.6072998046875, -5.44384765625, -5.2803955078125, -5.116943359375, -4.9534912109375, -4.7900390625, -4.6265869140625, -4.463134765625, -4.2996826171875, -4.13623046875, -3.9727783203125, -3.809326171875, -3.6458740234375, -3.482421875, -3.3189697265625, -3.155517578125, -2.9920654296875, -2.82861328125, -2.6651611328125, -2.501708984375, -2.3382568359375, -2.1748046875, -2.0113525390625, -1.847900390625, -1.6844482421875, -1.52099609375, -1.3575439453125, -1.194091796875, -1.0306396484375, -0.8671875, -0.7037353515625, -0.540283203125, -0.3768310546875, -0.21337890625, -0.0499267578125, 0.113525390625, 0.2769775390625, 0.4404296875, 0.6038818359375, 0.767333984375, 0.9307861328125, 1.09423828125, 1.2576904296875, 1.421142578125, 1.5845947265625, 1.748046875, 1.9114990234375, 2.074951171875, 2.2384033203125, 2.40185546875, 2.5653076171875, 2.728759765625, 2.8922119140625, 3.0556640625, 3.2191162109375, 3.382568359375, 3.5460205078125, 3.70947265625, 3.8729248046875, 4.036376953125, 4.1998291015625, 4.36328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 7.0, 9.0, 7.0, 14.0, 8.0, 13.0, 27.0, 38.0, 39.0, 42.0, 60.0, 63.0, 64.0, 63.0, 56.0, 65.0, 64.0, 54.0, 44.0, 53.0, 51.0, 36.0, 33.0, 23.0, 12.0, 11.0, 10.0, 4.0, 14.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1015625, -12.4742431640625, -11.846923828125, -11.2196044921875, -10.59228515625, -9.9649658203125, -9.337646484375, -8.7103271484375, -8.0830078125, -7.4556884765625, -6.828369140625, -6.2010498046875, -5.57373046875, -4.9464111328125, -4.319091796875, -3.6917724609375, -3.064453125, -2.4371337890625, -1.809814453125, -1.1824951171875, -0.55517578125, 0.0721435546875, 0.699462890625, 1.3267822265625, 1.9541015625, 2.5814208984375, 3.208740234375, 3.8360595703125, 4.46337890625, 5.0906982421875, 5.718017578125, 6.3453369140625, 6.97265625, 7.5999755859375, 8.227294921875, 8.8546142578125, 9.48193359375, 10.1092529296875, 10.736572265625, 11.3638916015625, 11.9912109375, 12.6185302734375, 13.245849609375, 13.8731689453125, 14.50048828125, 15.1278076171875, 15.755126953125, 16.3824462890625, 17.009765625, 17.6370849609375, 18.264404296875, 18.8917236328125, 19.51904296875, 20.1463623046875, 20.773681640625, 21.4010009765625, 22.0283203125, 22.6556396484375, 23.282958984375, 23.9102783203125, 24.53759765625, 25.1649169921875, 25.792236328125, 26.4195556640625, 27.046875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 6.0, 5.0, 8.0, 9.0, 17.0, 14.0, 22.0, 18.0, 34.0, 55.0, 57.0, 66.0, 94.0, 118.0, 169.0, 381.0, 1085.0, 8481.0, 554701.0, 473591.0, 7431.0, 1030.0, 384.0, 203.0, 141.0, 112.0, 70.0, 62.0, 34.0, 44.0, 17.0, 15.0, 15.0, 13.0, 8.0, 11.0, 3.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-15.3359375, -14.8409423828125, -14.345947265625, -13.8509521484375, -13.35595703125, -12.8609619140625, -12.365966796875, -11.8709716796875, -11.3759765625, -10.8809814453125, -10.385986328125, -9.8909912109375, -9.39599609375, -8.9010009765625, -8.406005859375, -7.9110107421875, -7.416015625, -6.9210205078125, -6.426025390625, -5.9310302734375, -5.43603515625, -4.9410400390625, -4.446044921875, -3.9510498046875, -3.4560546875, -2.9610595703125, -2.466064453125, -1.9710693359375, -1.47607421875, -0.9810791015625, -0.486083984375, 0.0089111328125, 0.50390625, 0.9989013671875, 1.493896484375, 1.9888916015625, 2.48388671875, 2.9788818359375, 3.473876953125, 3.9688720703125, 4.4638671875, 4.9588623046875, 5.453857421875, 5.9488525390625, 6.44384765625, 6.9388427734375, 7.433837890625, 7.9288330078125, 8.423828125, 8.9188232421875, 9.413818359375, 9.9088134765625, 10.40380859375, 10.8988037109375, 11.393798828125, 11.8887939453125, 12.3837890625, 12.8787841796875, 13.373779296875, 13.8687744140625, 14.36376953125, 14.8587646484375, 15.353759765625, 15.8487548828125, 16.34375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 4.0, 5.0, 8.0, 8.0, 6.0, 9.0, 16.0, 11.0, 24.0, 30.0, 22.0, 28.0, 34.0, 51.0, 47.0, 44.0, 36.0, 57.0, 45.0, 45.0, 61.0, 45.0, 43.0, 35.0, 36.0, 37.0, 29.0, 20.0, 28.0, 30.0, 18.0, 16.0, 12.0, 10.0, 9.0, 4.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2578125, -10.8546142578125, -10.451416015625, -10.0482177734375, -9.64501953125, -9.2418212890625, -8.838623046875, -8.4354248046875, -8.0322265625, -7.6290283203125, -7.225830078125, -6.8226318359375, -6.41943359375, -6.0162353515625, -5.613037109375, -5.2098388671875, -4.806640625, -4.4034423828125, -4.000244140625, -3.5970458984375, -3.19384765625, -2.7906494140625, -2.387451171875, -1.9842529296875, -1.5810546875, -1.1778564453125, -0.774658203125, -0.3714599609375, 0.03173828125, 0.4349365234375, 0.838134765625, 1.2413330078125, 1.64453125, 2.0477294921875, 2.450927734375, 2.8541259765625, 3.25732421875, 3.6605224609375, 4.063720703125, 4.4669189453125, 4.8701171875, 5.2733154296875, 5.676513671875, 6.0797119140625, 6.48291015625, 6.8861083984375, 7.289306640625, 7.6925048828125, 8.095703125, 8.4989013671875, 8.902099609375, 9.3052978515625, 9.70849609375, 10.1116943359375, 10.514892578125, 10.9180908203125, 11.3212890625, 11.7244873046875, 12.127685546875, 12.5308837890625, 12.93408203125, 13.3372802734375, 13.740478515625, 14.1436767578125, 14.546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 15.0, 27.0, 131.0, 857.0, 1034757.0, 12283.0, 328.0, 80.0, 22.0, 13.0, 8.0, 4.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-32.15625, -31.469482421875, -30.78271484375, -30.095947265625, -29.4091796875, -28.722412109375, -28.03564453125, -27.348876953125, -26.662109375, -25.975341796875, -25.28857421875, -24.601806640625, -23.9150390625, -23.228271484375, -22.54150390625, -21.854736328125, -21.16796875, -20.481201171875, -19.79443359375, -19.107666015625, -18.4208984375, -17.734130859375, -17.04736328125, -16.360595703125, -15.673828125, -14.987060546875, -14.30029296875, -13.613525390625, -12.9267578125, -12.239990234375, -11.55322265625, -10.866455078125, -10.1796875, -9.492919921875, -8.80615234375, -8.119384765625, -7.4326171875, -6.745849609375, -6.05908203125, -5.372314453125, -4.685546875, -3.998779296875, -3.31201171875, -2.625244140625, -1.9384765625, -1.251708984375, -0.56494140625, 0.121826171875, 0.80859375, 1.495361328125, 2.18212890625, 2.868896484375, 3.5556640625, 4.242431640625, 4.92919921875, 5.615966796875, 6.302734375, 6.989501953125, 7.67626953125, 8.363037109375, 9.0498046875, 9.736572265625, 10.42333984375, 11.110107421875, 11.796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 14.0, 26.0, 104.0, 342.0, 334.0, 113.0, 39.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005459785461425781, -0.0005271360278129578, -0.0005082935094833374, -0.000489450991153717, -0.0004706084728240967, -0.0004517659544944763, -0.00043292343616485596, -0.0004140809178352356, -0.00039523839950561523, -0.0003763958811759949, -0.0003575533628463745, -0.00033871084451675415, -0.0003198683261871338, -0.00030102580785751343, -0.00028218328952789307, -0.0002633407711982727, -0.00024449825286865234, -0.00022565573453903198, -0.00020681321620941162, -0.00018797069787979126, -0.0001691281795501709, -0.00015028566122055054, -0.00013144314289093018, -0.00011260062456130981, -9.375810623168945e-05, -7.491558790206909e-05, -5.607306957244873e-05, -3.723055124282837e-05, -1.8388032913208008e-05, 4.544854164123535e-07, 1.9297003746032715e-05, 3.8139522075653076e-05, 5.698204040527344e-05, 7.58245587348938e-05, 9.466707706451416e-05, 0.00011350959539413452, 0.00013235211372375488, 0.00015119463205337524, 0.0001700371503829956, 0.00018887966871261597, 0.00020772218704223633, 0.0002265647053718567, 0.00024540722370147705, 0.0002642497420310974, 0.0002830922603607178, 0.00030193477869033813, 0.0003207772970199585, 0.00033961981534957886, 0.0003584623336791992, 0.0003773048520088196, 0.00039614737033843994, 0.0004149898886680603, 0.00043383240699768066, 0.000452674925327301, 0.0004715174436569214, 0.0004903599619865417, 0.0005092024803161621, 0.0005280449986457825, 0.0005468875169754028, 0.0005657300353050232, 0.0005845725536346436, 0.0006034150719642639, 0.0006222575902938843, 0.0006411001086235046, 0.000659942626953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 11.0, 7.0, 31.0, 40.0, 83.0, 112.0, 314.0, 1223.0, 10096.0, 982822.0, 50473.0, 2367.0, 550.0, 168.0, 83.0, 47.0, 24.0, 22.0, 9.0, 5.0, 9.0, 7.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.45703125, -4.30169677734375, -4.1463623046875, -3.99102783203125, -3.835693359375, -3.68035888671875, -3.5250244140625, -3.36968994140625, -3.21435546875, -3.05902099609375, -2.9036865234375, -2.74835205078125, -2.593017578125, -2.43768310546875, -2.2823486328125, -2.12701416015625, -1.9716796875, -1.81634521484375, -1.6610107421875, -1.50567626953125, -1.350341796875, -1.19500732421875, -1.0396728515625, -0.88433837890625, -0.72900390625, -0.57366943359375, -0.4183349609375, -0.26300048828125, -0.107666015625, 0.04766845703125, 0.2030029296875, 0.35833740234375, 0.513671875, 0.66900634765625, 0.8243408203125, 0.97967529296875, 1.135009765625, 1.29034423828125, 1.4456787109375, 1.60101318359375, 1.75634765625, 1.91168212890625, 2.0670166015625, 2.22235107421875, 2.377685546875, 2.53302001953125, 2.6883544921875, 2.84368896484375, 2.9990234375, 3.15435791015625, 3.3096923828125, 3.46502685546875, 3.620361328125, 3.77569580078125, 3.9310302734375, 4.08636474609375, 4.24169921875, 4.39703369140625, 4.5523681640625, 4.70770263671875, 4.863037109375, 5.01837158203125, 5.1737060546875, 5.32904052734375, 5.484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 9.0, 24.0, 27.0, 35.0, 55.0, 105.0, 126.0, 164.0, 147.0, 90.0, 71.0, 43.0, 28.0, 14.0, 12.0, 7.0, 4.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77197265625, -0.7449111938476562, -0.7178497314453125, -0.6907882690429688, -0.663726806640625, -0.6366653442382812, -0.6096038818359375, -0.5825424194335938, -0.55548095703125, -0.5284194946289062, -0.5013580322265625, -0.47429656982421875, -0.447235107421875, -0.42017364501953125, -0.3931121826171875, -0.36605072021484375, -0.3389892578125, -0.31192779541015625, -0.2848663330078125, -0.25780487060546875, -0.230743408203125, -0.20368194580078125, -0.1766204833984375, -0.14955902099609375, -0.12249755859375, -0.09543609619140625, -0.0683746337890625, -0.04131317138671875, -0.014251708984375, 0.01280975341796875, 0.0398712158203125, 0.06693267822265625, 0.093994140625, 0.12105560302734375, 0.1481170654296875, 0.17517852783203125, 0.202239990234375, 0.22930145263671875, 0.2563629150390625, 0.28342437744140625, 0.31048583984375, 0.33754730224609375, 0.3646087646484375, 0.39167022705078125, 0.418731689453125, 0.44579315185546875, 0.4728546142578125, 0.49991607666015625, 0.5269775390625, 0.5540390014648438, 0.5811004638671875, 0.6081619262695312, 0.635223388671875, 0.6622848510742188, 0.6893463134765625, 0.7164077758789062, 0.74346923828125, 0.7705307006835938, 0.7975921630859375, 0.8246536254882812, 0.851715087890625, 0.8787765502929688, 0.9058380126953125, 0.9328994750976562, 0.9599609375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 13.0, 895.0, 103.0, 9.0], "bins": [-408.661865234375, -402.04071044921875, -395.4195861816406, -388.7984313964844, -382.1772766113281, -375.55615234375, -368.93499755859375, -362.3138427734375, -355.69268798828125, -349.071533203125, -342.4504089355469, -335.8292541503906, -329.2080993652344, -322.58697509765625, -315.9658203125, -309.34466552734375, -302.7235412597656, -296.1023864746094, -289.48126220703125, -282.860107421875, -276.23895263671875, -269.6177978515625, -262.9966735839844, -256.3755187988281, -249.75437927246094, -243.13323974609375, -236.5120849609375, -229.8909454345703, -223.26980590820312, -216.64865112304688, -210.0275115966797, -203.4063720703125, -196.78521728515625, -190.16407775878906, -183.5429229736328, -176.92178344726562, -170.30062866210938, -163.6794891357422, -157.058349609375, -150.43719482421875, -143.8160400390625, -137.1949005126953, -130.57374572753906, -123.95260620117188, -117.33145904541016, -110.71031188964844, -104.08917236328125, -97.46802520751953, -90.84688568115234, -84.22573852539062, -77.60459899902344, -70.98345184326172, -64.3623046875, -57.74115753173828, -51.12001419067383, -44.498870849609375, -37.877723693847656, -31.25657844543457, -24.635433197021484, -18.0142879486084, -11.393142700195312, -4.771995544433594, 1.8491477966308594, 8.470291137695312, 15.091438293457031]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 7.0, 11.0, 16.0, 6.0, 19.0, 20.0, 27.0, 29.0, 26.0, 23.0, 36.0, 43.0, 51.0, 67.0, 60.0, 67.0, 59.0, 52.0, 47.0, 43.0, 51.0, 40.0, 38.0, 31.0, 24.0, 19.0, 20.0, 15.0, 10.0, 11.0, 9.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.82306671142578, -21.034130096435547, -20.245193481445312, -19.456256866455078, -18.66731834411621, -17.878381729125977, -17.089445114135742, -16.300508499145508, -15.511570930480957, -14.722634315490723, -13.933696746826172, -13.144760131835938, -12.355823516845703, -11.566885948181152, -10.777949333190918, -9.989011764526367, -9.200075149536133, -8.411138534545898, -7.622200965881348, -6.833264350891113, -6.044327259063721, -5.255390167236328, -4.466453552246094, -3.677516460418701, -2.8885793685913086, -2.099642276763916, -1.3107054233551025, -0.5217685699462891, 0.2671685218811035, 1.056105613708496, 1.8450422286987305, 2.633979320526123, 3.422914505004883, 4.211851596832275, 5.000788688659668, 5.789725303649902, 6.578662395477295, 7.3675994873046875, 8.156536102294922, 8.945472717285156, 9.734410285949707, 10.523346900939941, 11.312284469604492, 12.101221084594727, 12.890157699584961, 13.679095268249512, 14.468031883239746, 15.256969451904297, 16.04590606689453, 16.834842681884766, 17.623779296875, 18.412715911865234, 19.2016544342041, 19.990591049194336, 20.77952766418457, 21.568464279174805, 22.357402801513672, 23.146339416503906, 23.93527603149414, 24.724212646484375, 25.513151168823242, 26.302087783813477, 27.09102439880371, 27.879961013793945, 28.66889762878418]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 13.0, 34.0, 32.0, 45.0, 74.0, 190.0, 3711.0, 1899120.0, 2289505.0, 1139.0, 184.0, 96.0, 51.0, 27.0, 20.0, 13.0, 9.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.46875, -36.86669921875, -35.2646484375, -33.66259765625, -32.060546875, -30.45849609375, -28.8564453125, -27.25439453125, -25.65234375, -24.05029296875, -22.4482421875, -20.84619140625, -19.244140625, -17.64208984375, -16.0400390625, -14.43798828125, -12.8359375, -11.23388671875, -9.6318359375, -8.02978515625, -6.427734375, -4.82568359375, -3.2236328125, -1.62158203125, -0.01953125, 1.58251953125, 3.1845703125, 4.78662109375, 6.388671875, 7.99072265625, 9.5927734375, 11.19482421875, 12.796875, 14.39892578125, 16.0009765625, 17.60302734375, 19.205078125, 20.80712890625, 22.4091796875, 24.01123046875, 25.61328125, 27.21533203125, 28.8173828125, 30.41943359375, 32.021484375, 33.62353515625, 35.2255859375, 36.82763671875, 38.4296875, 40.03173828125, 41.6337890625, 43.23583984375, 44.837890625, 46.43994140625, 48.0419921875, 49.64404296875, 51.24609375, 52.84814453125, 54.4501953125, 56.05224609375, 57.654296875, 59.25634765625, 60.8583984375, 62.46044921875, 64.0625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 7.0, 14.0, 23.0, 38.0, 51.0, 60.0, 89.0, 96.0, 107.0, 103.0, 109.0, 92.0, 66.0, 64.0, 31.0, 10.0, 13.0, 7.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.7298583984375, -9.248779296875, -8.7677001953125, -8.28662109375, -7.8055419921875, -7.324462890625, -6.8433837890625, -6.3623046875, -5.8812255859375, -5.400146484375, -4.9190673828125, -4.43798828125, -3.9569091796875, -3.475830078125, -2.9947509765625, -2.513671875, -2.0325927734375, -1.551513671875, -1.0704345703125, -0.58935546875, -0.1082763671875, 0.372802734375, 0.8538818359375, 1.3349609375, 1.8160400390625, 2.297119140625, 2.7781982421875, 3.25927734375, 3.7403564453125, 4.221435546875, 4.7025146484375, 5.18359375, 5.6646728515625, 6.145751953125, 6.6268310546875, 7.10791015625, 7.5889892578125, 8.070068359375, 8.5511474609375, 9.0322265625, 9.5133056640625, 9.994384765625, 10.4754638671875, 10.95654296875, 11.4376220703125, 11.918701171875, 12.3997802734375, 12.880859375, 13.3619384765625, 13.843017578125, 14.3240966796875, 14.80517578125, 15.2862548828125, 15.767333984375, 16.2484130859375, 16.7294921875, 17.2105712890625, 17.691650390625, 18.1727294921875, 18.65380859375, 19.1348876953125, 19.615966796875, 20.0970458984375, 20.578125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 5.0, 5.0, 7.0, 2.0, 13.0, 21.0, 37.0, 105.0, 448.0, 5075.0, 4183871.0, 4001.0, 421.0, 100.0, 46.0, 34.0, 24.0, 14.0, 11.0, 6.0, 9.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.5625, -78.080078125, -75.59765625, -73.115234375, -70.6328125, -68.150390625, -65.66796875, -63.185546875, -60.703125, -58.220703125, -55.73828125, -53.255859375, -50.7734375, -48.291015625, -45.80859375, -43.326171875, -40.84375, -38.361328125, -35.87890625, -33.396484375, -30.9140625, -28.431640625, -25.94921875, -23.466796875, -20.984375, -18.501953125, -16.01953125, -13.537109375, -11.0546875, -8.572265625, -6.08984375, -3.607421875, -1.125, 1.357421875, 3.83984375, 6.322265625, 8.8046875, 11.287109375, 13.76953125, 16.251953125, 18.734375, 21.216796875, 23.69921875, 26.181640625, 28.6640625, 31.146484375, 33.62890625, 36.111328125, 38.59375, 41.076171875, 43.55859375, 46.041015625, 48.5234375, 51.005859375, 53.48828125, 55.970703125, 58.453125, 60.935546875, 63.41796875, 65.900390625, 68.3828125, 70.865234375, 73.34765625, 75.830078125, 78.3125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 11.0, 26.0, 97.0, 697.0, 2433.0, 645.0, 102.0, 29.0, 11.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.9560546875, -11.576171875, -11.1962890625, -10.81640625, -10.4365234375, -10.056640625, -9.6767578125, -9.296875, -8.9169921875, -8.537109375, -8.1572265625, -7.77734375, -7.3974609375, -7.017578125, -6.6376953125, -6.2578125, -5.8779296875, -5.498046875, -5.1181640625, -4.73828125, -4.3583984375, -3.978515625, -3.5986328125, -3.21875, -2.8388671875, -2.458984375, -2.0791015625, -1.69921875, -1.3193359375, -0.939453125, -0.5595703125, -0.1796875, 0.2001953125, 0.580078125, 0.9599609375, 1.33984375, 1.7197265625, 2.099609375, 2.4794921875, 2.859375, 3.2392578125, 3.619140625, 3.9990234375, 4.37890625, 4.7587890625, 5.138671875, 5.5185546875, 5.8984375, 6.2783203125, 6.658203125, 7.0380859375, 7.41796875, 7.7978515625, 8.177734375, 8.5576171875, 8.9375, 9.3173828125, 9.697265625, 10.0771484375, 10.45703125, 10.8369140625, 11.216796875, 11.5966796875, 11.9765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 15.0, 39.0, 162.0, 377.0, 264.0, 87.0, 35.0, 6.0, 14.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.142328262329102, -13.239542961120605, -12.33675765991211, -11.433971405029297, -10.531187057495117, -9.628400802612305, -8.725615501403809, -7.8228302001953125, -6.920044898986816, -6.01725959777832, -5.114474296569824, -4.21168851852417, -3.308903217315674, -2.4061179161071777, -1.5033321380615234, -0.6005468368530273, 0.30223846435546875, 1.2050238847732544, 2.10780930519104, 3.0105948448181152, 3.9133801460266113, 4.816165447235107, 5.718951225280762, 6.621736526489258, 7.524521827697754, 8.42730712890625, 9.330092430114746, 10.232877731323242, 11.135663986206055, 12.038448333740234, 12.941234588623047, 13.844019889831543, 14.746803283691406, 15.649588584899902, 16.5523738861084, 17.45516014099121, 18.35794448852539, 19.260730743408203, 20.163516998291016, 21.066301345825195, 21.969085693359375, 22.871871948242188, 23.774656295776367, 24.67744255065918, 25.58022689819336, 26.483013153076172, 27.385799407958984, 28.288583755493164, 29.191370010375977, 30.09415626525879, 30.99694061279297, 31.89972686767578, 32.802513122558594, 33.70529556274414, 34.60808181762695, 35.510868072509766, 36.41365432739258, 37.31644058227539, 38.2192268371582, 39.12200927734375, 40.02479553222656, 40.927581787109375, 41.83036804199219, 42.733154296875, 43.63593673706055]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 11.0, 19.0, 32.0, 30.0, 35.0, 63.0, 75.0, 67.0, 88.0, 85.0, 75.0, 83.0, 79.0, 49.0, 55.0, 41.0, 36.0, 19.0, 8.0, 12.0, 9.0, 7.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.069784164428711, -7.676638603210449, -7.2834930419921875, -6.890347480773926, -6.497201919555664, -6.104056358337402, -5.710910797119141, -5.317765235900879, -4.924619674682617, -4.5314741134643555, -4.138328552246094, -3.745182991027832, -3.3520374298095703, -2.9588918685913086, -2.565746545791626, -2.1726009845733643, -1.7794556617736816, -1.38631010055542, -0.993164598941803, -0.600019097328186, -0.20687353610992432, 0.1862720251083374, 0.5794174671173096, 0.9725630283355713, 1.365708589553833, 1.7588541507720947, 2.1519997119903564, 2.545145034790039, 2.938290596008301, 3.3314361572265625, 3.724581718444824, 4.117727279663086, 4.510872840881348, 4.904018402099609, 5.297163963317871, 5.690309524536133, 6.0834550857543945, 6.476600646972656, 6.869746208190918, 7.26289176940918, 7.656037330627441, 8.049182891845703, 8.442328453063965, 8.835474014282227, 9.228619575500488, 9.62176513671875, 10.014910697937012, 10.408056259155273, 10.801200866699219, 11.19434642791748, 11.587491989135742, 11.980637550354004, 12.373783111572266, 12.766928672790527, 13.160074234008789, 13.55321979522705, 13.946365356445312, 14.339510917663574, 14.732656478881836, 15.125802040100098, 15.51894760131836, 15.912093162536621, 16.305238723754883, 16.698383331298828, 17.091529846191406]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 12.0, 18.0, 29.0, 47.0, 86.0, 196.0, 406.0, 899.0, 2260.0, 7732.0, 93525.0, 904756.0, 30902.0, 4831.0, 1578.0, 646.0, 283.0, 157.0, 83.0, 40.0, 19.0, 13.0, 9.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.814453125, -3.688690185546875, -3.56292724609375, -3.437164306640625, -3.3114013671875, -3.185638427734375, -3.05987548828125, -2.934112548828125, -2.808349609375, -2.682586669921875, -2.55682373046875, -2.431060791015625, -2.3052978515625, -2.179534912109375, -2.05377197265625, -1.928009033203125, -1.80224609375, -1.676483154296875, -1.55072021484375, -1.424957275390625, -1.2991943359375, -1.173431396484375, -1.04766845703125, -0.921905517578125, -0.796142578125, -0.670379638671875, -0.54461669921875, -0.418853759765625, -0.2930908203125, -0.167327880859375, -0.04156494140625, 0.084197998046875, 0.2099609375, 0.335723876953125, 0.46148681640625, 0.587249755859375, 0.7130126953125, 0.838775634765625, 0.96453857421875, 1.090301513671875, 1.216064453125, 1.341827392578125, 1.46759033203125, 1.593353271484375, 1.7191162109375, 1.844879150390625, 1.97064208984375, 2.096405029296875, 2.22216796875, 2.347930908203125, 2.47369384765625, 2.599456787109375, 2.7252197265625, 2.850982666015625, 2.97674560546875, 3.102508544921875, 3.228271484375, 3.354034423828125, 3.47979736328125, 3.605560302734375, 3.7313232421875, 3.857086181640625, 3.98284912109375, 4.108612060546875, 4.234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 12.0, 12.0, 25.0, 38.0, 47.0, 61.0, 87.0, 100.0, 119.0, 109.0, 92.0, 90.0, 66.0, 58.0, 26.0, 19.0, 16.0, 8.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.171875, -6.8468017578125, -6.521728515625, -6.1966552734375, -5.87158203125, -5.5465087890625, -5.221435546875, -4.8963623046875, -4.5712890625, -4.2462158203125, -3.921142578125, -3.5960693359375, -3.27099609375, -2.9459228515625, -2.620849609375, -2.2957763671875, -1.970703125, -1.6456298828125, -1.320556640625, -0.9954833984375, -0.67041015625, -0.3453369140625, -0.020263671875, 0.3048095703125, 0.6298828125, 0.9549560546875, 1.280029296875, 1.6051025390625, 1.93017578125, 2.2552490234375, 2.580322265625, 2.9053955078125, 3.23046875, 3.5555419921875, 3.880615234375, 4.2056884765625, 4.53076171875, 4.8558349609375, 5.180908203125, 5.5059814453125, 5.8310546875, 6.1561279296875, 6.481201171875, 6.8062744140625, 7.13134765625, 7.4564208984375, 7.781494140625, 8.1065673828125, 8.431640625, 8.7567138671875, 9.081787109375, 9.4068603515625, 9.73193359375, 10.0570068359375, 10.382080078125, 10.7071533203125, 11.0322265625, 11.3572998046875, 11.682373046875, 12.0074462890625, 12.33251953125, 12.6575927734375, 12.982666015625, 13.3077392578125, 13.6328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 5.0, 3.0, 7.0, 14.0, 21.0, 31.0, 46.0, 75.0, 122.0, 211.0, 386.0, 664.0, 1364.0, 2978.0, 7049.0, 19132.0, 57323.0, 217904.0, 538683.0, 137220.0, 40823.0, 14090.0, 5521.0, 2333.0, 1185.0, 579.0, 308.0, 171.0, 109.0, 66.0, 36.0, 36.0, 22.0, 13.0, 10.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8974609375, -0.871337890625, -0.84521484375, -0.819091796875, -0.79296875, -0.766845703125, -0.74072265625, -0.714599609375, -0.6884765625, -0.662353515625, -0.63623046875, -0.610107421875, -0.583984375, -0.557861328125, -0.53173828125, -0.505615234375, -0.4794921875, -0.453369140625, -0.42724609375, -0.401123046875, -0.375, -0.348876953125, -0.32275390625, -0.296630859375, -0.2705078125, -0.244384765625, -0.21826171875, -0.192138671875, -0.166015625, -0.139892578125, -0.11376953125, -0.087646484375, -0.0615234375, -0.035400390625, -0.00927734375, 0.016845703125, 0.04296875, 0.069091796875, 0.09521484375, 0.121337890625, 0.1474609375, 0.173583984375, 0.19970703125, 0.225830078125, 0.251953125, 0.278076171875, 0.30419921875, 0.330322265625, 0.3564453125, 0.382568359375, 0.40869140625, 0.434814453125, 0.4609375, 0.487060546875, 0.51318359375, 0.539306640625, 0.5654296875, 0.591552734375, 0.61767578125, 0.643798828125, 0.669921875, 0.696044921875, 0.72216796875, 0.748291015625, 0.7744140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 6.0, 13.0, 18.0, 26.0, 26.0, 49.0, 38.0, 46.0, 37.0, 48.0, 56.0, 56.0, 59.0, 63.0, 55.0, 56.0, 49.0, 58.0, 23.0, 31.0, 32.0, 28.0, 17.0, 19.0, 21.0, 10.0, 14.0, 11.0, 7.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.10302734375, -8.8310546875, -8.55908203125, -8.287109375, -8.01513671875, -7.7431640625, -7.47119140625, -7.19921875, -6.92724609375, -6.6552734375, -6.38330078125, -6.111328125, -5.83935546875, -5.5673828125, -5.29541015625, -5.0234375, -4.75146484375, -4.4794921875, -4.20751953125, -3.935546875, -3.66357421875, -3.3916015625, -3.11962890625, -2.84765625, -2.57568359375, -2.3037109375, -2.03173828125, -1.759765625, -1.48779296875, -1.2158203125, -0.94384765625, -0.671875, -0.39990234375, -0.1279296875, 0.14404296875, 0.416015625, 0.68798828125, 0.9599609375, 1.23193359375, 1.50390625, 1.77587890625, 2.0478515625, 2.31982421875, 2.591796875, 2.86376953125, 3.1357421875, 3.40771484375, 3.6796875, 3.95166015625, 4.2236328125, 4.49560546875, 4.767578125, 5.03955078125, 5.3115234375, 5.58349609375, 5.85546875, 6.12744140625, 6.3994140625, 6.67138671875, 6.943359375, 7.21533203125, 7.4873046875, 7.75927734375, 8.03125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 4.0, 10.0, 16.0, 14.0, 22.0, 27.0, 68.0, 79.0, 127.0, 200.0, 277.0, 504.0, 692.0, 1241.0, 2372.0, 4888.0, 11649.0, 31868.0, 106791.0, 356402.0, 365317.0, 110604.0, 32751.0, 11831.0, 4984.0, 2493.0, 1264.0, 704.0, 446.0, 297.0, 197.0, 126.0, 94.0, 67.0, 58.0, 23.0, 17.0, 10.0, 8.0, 6.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.08477783203125, -0.08235645294189453, -0.07993507385253906, -0.0775136947631836, -0.07509231567382812, -0.07267093658447266, -0.07024955749511719, -0.06782817840576172, -0.06540679931640625, -0.06298542022705078, -0.06056404113769531, -0.058142662048339844, -0.055721282958984375, -0.053299903869628906, -0.05087852478027344, -0.04845714569091797, -0.0460357666015625, -0.04361438751220703, -0.04119300842285156, -0.038771629333496094, -0.036350250244140625, -0.033928871154785156, -0.03150749206542969, -0.02908611297607422, -0.02666473388671875, -0.02424335479736328, -0.021821975708007812, -0.019400596618652344, -0.016979217529296875, -0.014557838439941406, -0.012136459350585938, -0.009715080261230469, -0.007293701171875, -0.004872322082519531, -0.0024509429931640625, -2.956390380859375e-05, 0.002391815185546875, 0.004813194274902344, 0.0072345733642578125, 0.009655952453613281, 0.01207733154296875, 0.014498710632324219, 0.016920089721679688, 0.019341468811035156, 0.021762847900390625, 0.024184226989746094, 0.026605606079101562, 0.02902698516845703, 0.0314483642578125, 0.03386974334716797, 0.03629112243652344, 0.038712501525878906, 0.041133880615234375, 0.043555259704589844, 0.04597663879394531, 0.04839801788330078, 0.05081939697265625, 0.05324077606201172, 0.05566215515136719, 0.058083534240722656, 0.060504913330078125, 0.0629262924194336, 0.06534767150878906, 0.06776905059814453, 0.0701904296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 3.0, 3.0, 10.0, 9.0, 15.0, 19.0, 17.0, 39.0, 38.0, 66.0, 84.0, 80.0, 78.0, 102.0, 92.0, 101.0, 50.0, 67.0, 34.0, 25.0, 20.0, 8.0, 13.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.92605972290039e-05, -6.723683327436447e-05, -6.521306931972504e-05, -6.31893053650856e-05, -6.116554141044617e-05, -5.914177745580673e-05, -5.71180135011673e-05, -5.509424954652786e-05, -5.307048559188843e-05, -5.104672163724899e-05, -4.902295768260956e-05, -4.699919372797012e-05, -4.497542977333069e-05, -4.2951665818691254e-05, -4.092790186405182e-05, -3.8904137909412384e-05, -3.688037395477295e-05, -3.4856610000133514e-05, -3.283284604549408e-05, -3.0809082090854645e-05, -2.878531813621521e-05, -2.6761554181575775e-05, -2.473779022693634e-05, -2.2714026272296906e-05, -2.069026231765747e-05, -1.8666498363018036e-05, -1.66427344083786e-05, -1.4618970453739166e-05, -1.2595206499099731e-05, -1.0571442544460297e-05, -8.547678589820862e-06, -6.523914635181427e-06, -4.500150680541992e-06, -2.4763867259025574e-06, -4.5262277126312256e-07, 1.5711411833763123e-06, 3.594905138015747e-06, 5.618669092655182e-06, 7.642433047294617e-06, 9.666197001934052e-06, 1.1689960956573486e-05, 1.3713724911212921e-05, 1.5737488865852356e-05, 1.776125282049179e-05, 1.9785016775131226e-05, 2.180878072977066e-05, 2.3832544684410095e-05, 2.585630863904953e-05, 2.7880072593688965e-05, 2.99038365483284e-05, 3.1927600502967834e-05, 3.395136445760727e-05, 3.5975128412246704e-05, 3.799889236688614e-05, 4.0022656321525574e-05, 4.204642027616501e-05, 4.407018423080444e-05, 4.609394818544388e-05, 4.811771214008331e-05, 5.014147609472275e-05, 5.216524004936218e-05, 5.418900400400162e-05, 5.621276795864105e-05, 5.823653191328049e-05, 6.026029586791992e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 4.0, 13.0, 22.0, 28.0, 42.0, 92.0, 160.0, 721.0, 13075.0, 962970.0, 69276.0, 1648.0, 228.0, 89.0, 50.0, 38.0, 28.0, 9.0, 13.0, 12.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2600135803222656, -0.24903106689453125, -0.23804855346679688, -0.2270660400390625, -0.21608352661132812, -0.20510101318359375, -0.19411849975585938, -0.183135986328125, -0.17215347290039062, -0.16117095947265625, -0.15018844604492188, -0.1392059326171875, -0.12822341918945312, -0.11724090576171875, -0.10625839233398438, -0.09527587890625, -0.08429336547851562, -0.07331085205078125, -0.062328338623046875, -0.0513458251953125, -0.040363311767578125, -0.02938079833984375, -0.018398284912109375, -0.007415771484375, 0.003566741943359375, 0.01454925537109375, 0.025531768798828125, 0.0365142822265625, 0.047496795654296875, 0.05847930908203125, 0.06946182250976562, 0.0804443359375, 0.09142684936523438, 0.10240936279296875, 0.11339187622070312, 0.1243743896484375, 0.13535690307617188, 0.14633941650390625, 0.15732192993164062, 0.168304443359375, 0.17928695678710938, 0.19026947021484375, 0.20125198364257812, 0.2122344970703125, 0.22321701049804688, 0.23419952392578125, 0.24518203735351562, 0.25616455078125, 0.2671470642089844, 0.27812957763671875, 0.2891120910644531, 0.3000946044921875, 0.3110771179199219, 0.32205963134765625, 0.3330421447753906, 0.344024658203125, 0.3550071716308594, 0.36598968505859375, 0.3769721984863281, 0.3879547119140625, 0.3989372253417969, 0.40991973876953125, 0.4209022521972656, 0.431884765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 10.0, 12.0, 16.0, 28.0, 36.0, 63.0, 76.0, 105.0, 128.0, 130.0, 95.0, 90.0, 44.0, 41.0, 32.0, 19.0, 18.0, 8.0, 11.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027313232421875, -0.0262603759765625, -0.02520751953125, -0.0241546630859375, -0.023101806640625, -0.0220489501953125, -0.02099609375, -0.0199432373046875, -0.018890380859375, -0.0178375244140625, -0.01678466796875, -0.0157318115234375, -0.014678955078125, -0.0136260986328125, -0.0125732421875, -0.0115203857421875, -0.010467529296875, -0.0094146728515625, -0.00836181640625, -0.0073089599609375, -0.006256103515625, -0.0052032470703125, -0.004150390625, -0.0030975341796875, -0.002044677734375, -0.0009918212890625, 6.103515625e-05, 0.0011138916015625, 0.002166748046875, 0.0032196044921875, 0.0042724609375, 0.0053253173828125, 0.006378173828125, 0.0074310302734375, 0.00848388671875, 0.0095367431640625, 0.010589599609375, 0.0116424560546875, 0.0126953125, 0.0137481689453125, 0.014801025390625, 0.0158538818359375, 0.01690673828125, 0.0179595947265625, 0.019012451171875, 0.0200653076171875, 0.0211181640625, 0.0221710205078125, 0.023223876953125, 0.0242767333984375, 0.02532958984375, 0.0263824462890625, 0.027435302734375, 0.0284881591796875, 0.029541015625, 0.0305938720703125, 0.031646728515625, 0.0326995849609375, 0.03375244140625, 0.0348052978515625, 0.035858154296875, 0.0369110107421875, 0.0379638671875, 0.0390167236328125, 0.040069580078125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 10.0, 10.0, 23.0, 63.0, 100.0, 210.0, 223.0, 176.0, 80.0, 51.0, 17.0, 11.0, 9.0, 6.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.386265754699707, -13.06292724609375, -12.739587783813477, -12.41624927520752, -12.092910766601562, -11.769572257995605, -11.446233749389648, -11.122894287109375, -10.799555778503418, -10.476217269897461, -10.152877807617188, -9.82953929901123, -9.506200790405273, -9.182862281799316, -8.85952377319336, -8.536184310913086, -8.212845802307129, -7.889507293701172, -7.566168308258057, -7.242829322814941, -6.919490814208984, -6.596152305603027, -6.272813320159912, -5.949474334716797, -5.62613582611084, -5.302797317504883, -4.979458332061768, -4.656119346618652, -4.332780838012695, -4.009442329406738, -3.686103343963623, -3.362764596939087, -3.039426803588867, -2.716088056564331, -2.392749309539795, -2.069410562515259, -1.7460718154907227, -1.4227330684661865, -1.0993943214416504, -0.7760555744171143, -0.4527168273925781, -0.129378080368042, 0.19396066665649414, 0.5172994136810303, 0.8406381607055664, 1.1639769077301025, 1.4873156547546387, 1.8106544017791748, 2.133993148803711, 2.457331895828247, 2.780670642852783, 3.1040093898773193, 3.4273481369018555, 3.7506868839263916, 4.074025630950928, 4.397364616394043, 4.720703125, 5.044041633605957, 5.367380619049072, 5.6907196044921875, 6.0140581130981445, 6.337396621704102, 6.660735607147217, 6.984074592590332, 7.307413101196289]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 11.0, 13.0, 26.0, 39.0, 38.0, 64.0, 98.0, 92.0, 109.0, 101.0, 105.0, 82.0, 75.0, 51.0, 40.0, 17.0, 12.0, 12.0, 11.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.702004432678223, -6.386074542999268, -6.0701446533203125, -5.754215240478516, -5.4382853507995605, -5.1223554611206055, -4.806426048278809, -4.4904961585998535, -4.174566268920898, -3.8586363792419434, -3.5427067279815674, -3.2267770767211914, -2.9108471870422363, -2.5949172973632812, -2.2789876461029053, -1.9630579948425293, -1.6471281051635742, -1.3311983346939087, -1.0152685642242432, -0.6993387937545776, -0.3834090232849121, -0.06747925281524658, 0.24845051765441895, 0.5643801689147949, 0.88031005859375, 1.1962398290634155, 1.512169599533081, 1.8280993700027466, 2.144029140472412, 2.459959030151367, 2.775888681411743, 3.091818332672119, 3.4077491760253906, 3.7236790657043457, 4.039608955383301, 4.355538368225098, 4.671468257904053, 4.987398147583008, 5.303327560424805, 5.61925745010376, 5.935187339782715, 6.25111722946167, 6.567047119140625, 6.882976531982422, 7.198906421661377, 7.514836311340332, 7.830765724182129, 8.146696090698242, 8.462625503540039, 8.778554916381836, 9.09448528289795, 9.410414695739746, 9.72634506225586, 10.042274475097656, 10.358203887939453, 10.67413330078125, 10.990063667297363, 11.30599308013916, 11.621923446655273, 11.93785285949707, 12.253782272338867, 12.56971263885498, 12.885642051696777, 13.20157241821289, 13.517501831054688]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 12.0, 11.0, 16.0, 19.0, 62.0, 83.0, 163.0, 384.0, 758.0, 1891.0, 5122.0, 17634.0, 90579.0, 570821.0, 301015.0, 43738.0, 10474.0, 3272.0, 1251.0, 615.0, 274.0, 138.0, 74.0, 46.0, 23.0, 20.0, 12.0, 6.0, 6.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.1796875, -5.99127197265625, -5.8028564453125, -5.61444091796875, -5.426025390625, -5.23760986328125, -5.0491943359375, -4.86077880859375, -4.67236328125, -4.48394775390625, -4.2955322265625, -4.10711669921875, -3.918701171875, -3.73028564453125, -3.5418701171875, -3.35345458984375, -3.1650390625, -2.97662353515625, -2.7882080078125, -2.59979248046875, -2.411376953125, -2.22296142578125, -2.0345458984375, -1.84613037109375, -1.65771484375, -1.46929931640625, -1.2808837890625, -1.09246826171875, -0.904052734375, -0.71563720703125, -0.5272216796875, -0.33880615234375, -0.150390625, 0.03802490234375, 0.2264404296875, 0.41485595703125, 0.603271484375, 0.79168701171875, 0.9801025390625, 1.16851806640625, 1.35693359375, 1.54534912109375, 1.7337646484375, 1.92218017578125, 2.110595703125, 2.29901123046875, 2.4874267578125, 2.67584228515625, 2.8642578125, 3.05267333984375, 3.2410888671875, 3.42950439453125, 3.617919921875, 3.80633544921875, 3.9947509765625, 4.18316650390625, 4.37158203125, 4.55999755859375, 4.7484130859375, 4.93682861328125, 5.125244140625, 5.31365966796875, 5.5020751953125, 5.69049072265625, 5.87890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 9.0, 14.0, 19.0, 23.0, 33.0, 32.0, 59.0, 53.0, 64.0, 76.0, 72.0, 81.0, 63.0, 74.0, 73.0, 61.0, 39.0, 42.0, 26.0, 27.0, 15.0, 11.0, 10.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.421875, -7.990966796875, -7.56005859375, -7.129150390625, -6.6982421875, -6.267333984375, -5.83642578125, -5.405517578125, -4.974609375, -4.543701171875, -4.11279296875, -3.681884765625, -3.2509765625, -2.820068359375, -2.38916015625, -1.958251953125, -1.52734375, -1.096435546875, -0.66552734375, -0.234619140625, 0.1962890625, 0.627197265625, 1.05810546875, 1.489013671875, 1.919921875, 2.350830078125, 2.78173828125, 3.212646484375, 3.6435546875, 4.074462890625, 4.50537109375, 4.936279296875, 5.3671875, 5.798095703125, 6.22900390625, 6.659912109375, 7.0908203125, 7.521728515625, 7.95263671875, 8.383544921875, 8.814453125, 9.245361328125, 9.67626953125, 10.107177734375, 10.5380859375, 10.968994140625, 11.39990234375, 11.830810546875, 12.26171875, 12.692626953125, 13.12353515625, 13.554443359375, 13.9853515625, 14.416259765625, 14.84716796875, 15.278076171875, 15.708984375, 16.139892578125, 16.57080078125, 17.001708984375, 17.4326171875, 17.863525390625, 18.29443359375, 18.725341796875, 19.15625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 5.0, 4.0, 10.0, 18.0, 20.0, 22.0, 41.0, 38.0, 49.0, 75.0, 107.0, 130.0, 193.0, 260.0, 637.0, 5009.0, 902936.0, 135723.0, 1981.0, 436.0, 239.0, 161.0, 114.0, 79.0, 60.0, 48.0, 30.0, 27.0, 12.0, 20.0, 17.0, 6.0, 9.0, 3.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-27.953125, -27.173095703125, -26.39306640625, -25.613037109375, -24.8330078125, -24.052978515625, -23.27294921875, -22.492919921875, -21.712890625, -20.932861328125, -20.15283203125, -19.372802734375, -18.5927734375, -17.812744140625, -17.03271484375, -16.252685546875, -15.47265625, -14.692626953125, -13.91259765625, -13.132568359375, -12.3525390625, -11.572509765625, -10.79248046875, -10.012451171875, -9.232421875, -8.452392578125, -7.67236328125, -6.892333984375, -6.1123046875, -5.332275390625, -4.55224609375, -3.772216796875, -2.9921875, -2.212158203125, -1.43212890625, -0.652099609375, 0.1279296875, 0.907958984375, 1.68798828125, 2.468017578125, 3.248046875, 4.028076171875, 4.80810546875, 5.588134765625, 6.3681640625, 7.148193359375, 7.92822265625, 8.708251953125, 9.48828125, 10.268310546875, 11.04833984375, 11.828369140625, 12.6083984375, 13.388427734375, 14.16845703125, 14.948486328125, 15.728515625, 16.508544921875, 17.28857421875, 18.068603515625, 18.8486328125, 19.628662109375, 20.40869140625, 21.188720703125, 21.96875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 8.0, 12.0, 11.0, 12.0, 21.0, 30.0, 23.0, 43.0, 44.0, 46.0, 57.0, 44.0, 42.0, 41.0, 72.0, 57.0, 63.0, 61.0, 53.0, 36.0, 45.0, 34.0, 27.0, 21.0, 16.0, 14.0, 17.0, 13.0, 8.0, 4.0, 7.0, 7.0, 1.0, 0.0, 1.0, 6.0, 2.0, 1.0, 1.0], "bins": [-15.5390625, -15.1502685546875, -14.761474609375, -14.3726806640625, -13.98388671875, -13.5950927734375, -13.206298828125, -12.8175048828125, -12.4287109375, -12.0399169921875, -11.651123046875, -11.2623291015625, -10.87353515625, -10.4847412109375, -10.095947265625, -9.7071533203125, -9.318359375, -8.9295654296875, -8.540771484375, -8.1519775390625, -7.76318359375, -7.3743896484375, -6.985595703125, -6.5968017578125, -6.2080078125, -5.8192138671875, -5.430419921875, -5.0416259765625, -4.65283203125, -4.2640380859375, -3.875244140625, -3.4864501953125, -3.09765625, -2.7088623046875, -2.320068359375, -1.9312744140625, -1.54248046875, -1.1536865234375, -0.764892578125, -0.3760986328125, 0.0126953125, 0.4014892578125, 0.790283203125, 1.1790771484375, 1.56787109375, 1.9566650390625, 2.345458984375, 2.7342529296875, 3.123046875, 3.5118408203125, 3.900634765625, 4.2894287109375, 4.67822265625, 5.0670166015625, 5.455810546875, 5.8446044921875, 6.2333984375, 6.6221923828125, 7.010986328125, 7.3997802734375, 7.78857421875, 8.1773681640625, 8.566162109375, 8.9549560546875, 9.34375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 4.0, 9.0, 11.0, 14.0, 13.0, 20.0, 34.0, 54.0, 82.0, 180.0, 388.0, 1361.0, 9906.0, 1003305.0, 30167.0, 1945.0, 539.0, 196.0, 119.0, 64.0, 31.0, 25.0, 23.0, 17.0, 10.0, 8.0, 8.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8984375, -9.575439453125, -9.25244140625, -8.929443359375, -8.6064453125, -8.283447265625, -7.96044921875, -7.637451171875, -7.314453125, -6.991455078125, -6.66845703125, -6.345458984375, -6.0224609375, -5.699462890625, -5.37646484375, -5.053466796875, -4.73046875, -4.407470703125, -4.08447265625, -3.761474609375, -3.4384765625, -3.115478515625, -2.79248046875, -2.469482421875, -2.146484375, -1.823486328125, -1.50048828125, -1.177490234375, -0.8544921875, -0.531494140625, -0.20849609375, 0.114501953125, 0.4375, 0.760498046875, 1.08349609375, 1.406494140625, 1.7294921875, 2.052490234375, 2.37548828125, 2.698486328125, 3.021484375, 3.344482421875, 3.66748046875, 3.990478515625, 4.3134765625, 4.636474609375, 4.95947265625, 5.282470703125, 5.60546875, 5.928466796875, 6.25146484375, 6.574462890625, 6.8974609375, 7.220458984375, 7.54345703125, 7.866455078125, 8.189453125, 8.512451171875, 8.83544921875, 9.158447265625, 9.4814453125, 9.804443359375, 10.12744140625, 10.450439453125, 10.7734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 7.0, 8.0, 12.0, 33.0, 34.0, 79.0, 84.0, 125.0, 149.0, 135.0, 97.0, 77.0, 50.0, 44.0, 18.0, 13.0, 11.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037407875061035156, -0.00036438554525375366, -0.00035469233989715576, -0.00034499913454055786, -0.00033530592918395996, -0.00032561272382736206, -0.00031591951847076416, -0.00030622631311416626, -0.00029653310775756836, -0.00028683990240097046, -0.00027714669704437256, -0.00026745349168777466, -0.00025776028633117676, -0.00024806708097457886, -0.00023837387561798096, -0.00022868067026138306, -0.00021898746490478516, -0.00020929425954818726, -0.00019960105419158936, -0.00018990784883499146, -0.00018021464347839355, -0.00017052143812179565, -0.00016082823276519775, -0.00015113502740859985, -0.00014144182205200195, -0.00013174861669540405, -0.00012205541133880615, -0.00011236220598220825, -0.00010266900062561035, -9.297579526901245e-05, -8.328258991241455e-05, -7.358938455581665e-05, -6.389617919921875e-05, -5.420297384262085e-05, -4.450976848602295e-05, -3.481656312942505e-05, -2.512335777282715e-05, -1.5430152416229248e-05, -5.736947059631348e-06, 3.956258296966553e-06, 1.3649463653564453e-05, 2.3342669010162354e-05, 3.3035874366760254e-05, 4.2729079723358154e-05, 5.2422285079956055e-05, 6.211549043655396e-05, 7.180869579315186e-05, 8.150190114974976e-05, 9.119510650634766e-05, 0.00010088831186294556, 0.00011058151721954346, 0.00012027472257614136, 0.00012996792793273926, 0.00013966113328933716, 0.00014935433864593506, 0.00015904754400253296, 0.00016874074935913086, 0.00017843395471572876, 0.00018812716007232666, 0.00019782036542892456, 0.00020751357078552246, 0.00021720677614212036, 0.00022689998149871826, 0.00023659318685531616, 0.00024628639221191406]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 15.0, 17.0, 21.0, 27.0, 58.0, 61.0, 117.0, 294.0, 844.0, 9189.0, 995698.0, 39639.0, 1743.0, 375.0, 174.0, 77.0, 49.0, 42.0, 25.0, 25.0, 13.0, 10.0, 5.0, 4.0, 6.0, 6.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.8984375, -9.5859375, -9.2734375, -8.9609375, -8.6484375, -8.3359375, -8.0234375, -7.7109375, -7.3984375, -7.0859375, -6.7734375, -6.4609375, -6.1484375, -5.8359375, -5.5234375, -5.2109375, -4.8984375, -4.5859375, -4.2734375, -3.9609375, -3.6484375, -3.3359375, -3.0234375, -2.7109375, -2.3984375, -2.0859375, -1.7734375, -1.4609375, -1.1484375, -0.8359375, -0.5234375, -0.2109375, 0.1015625, 0.4140625, 0.7265625, 1.0390625, 1.3515625, 1.6640625, 1.9765625, 2.2890625, 2.6015625, 2.9140625, 3.2265625, 3.5390625, 3.8515625, 4.1640625, 4.4765625, 4.7890625, 5.1015625, 5.4140625, 5.7265625, 6.0390625, 6.3515625, 6.6640625, 6.9765625, 7.2890625, 7.6015625, 7.9140625, 8.2265625, 8.5390625, 8.8515625, 9.1640625, 9.4765625, 9.7890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 14.0, 18.0, 16.0, 17.0, 36.0, 65.0, 94.0, 142.0, 203.0, 130.0, 66.0, 53.0, 35.0, 19.0, 24.0, 9.0, 12.0, 9.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6171875, -1.553619384765625, -1.49005126953125, -1.426483154296875, -1.3629150390625, -1.299346923828125, -1.23577880859375, -1.172210693359375, -1.108642578125, -1.045074462890625, -0.98150634765625, -0.917938232421875, -0.8543701171875, -0.790802001953125, -0.72723388671875, -0.663665771484375, -0.60009765625, -0.536529541015625, -0.47296142578125, -0.409393310546875, -0.3458251953125, -0.282257080078125, -0.21868896484375, -0.155120849609375, -0.091552734375, -0.027984619140625, 0.03558349609375, 0.099151611328125, 0.1627197265625, 0.226287841796875, 0.28985595703125, 0.353424072265625, 0.4169921875, 0.480560302734375, 0.54412841796875, 0.607696533203125, 0.6712646484375, 0.734832763671875, 0.79840087890625, 0.861968994140625, 0.925537109375, 0.989105224609375, 1.05267333984375, 1.116241455078125, 1.1798095703125, 1.243377685546875, 1.30694580078125, 1.370513916015625, 1.43408203125, 1.497650146484375, 1.56121826171875, 1.624786376953125, 1.6883544921875, 1.751922607421875, 1.81549072265625, 1.879058837890625, 1.942626953125, 2.006195068359375, 2.06976318359375, 2.133331298828125, 2.1968994140625, 2.260467529296875, 2.32403564453125, 2.387603759765625, 2.451171875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 30.0, 754.0, 224.0, 9.0, 1.0], "bins": [-245.9085235595703, -241.86376953125, -237.8190155029297, -233.77426147460938, -229.7294921875, -225.6847381591797, -221.63998413085938, -217.59523010253906, -213.55047607421875, -209.50572204589844, -205.46096801757812, -201.4162139892578, -197.3714599609375, -193.32669067382812, -189.2819366455078, -185.2371826171875, -181.1924285888672, -177.14767456054688, -173.10292053222656, -169.05816650390625, -165.01339721679688, -160.96864318847656, -156.92388916015625, -152.87913513183594, -148.83438110351562, -144.7896270751953, -140.744873046875, -136.7001190185547, -132.65536499023438, -128.610595703125, -124.56584167480469, -120.52108764648438, -116.47633361816406, -112.43157958984375, -108.38682556152344, -104.3420639038086, -100.29730987548828, -96.25255584716797, -92.20779418945312, -88.16304016113281, -84.1182861328125, -80.07353210449219, -76.02877807617188, -71.98401641845703, -67.93926239013672, -63.894508361816406, -59.84975051879883, -55.80499267578125, -51.7602424621582, -47.715484619140625, -43.67073059082031, -39.6259765625, -35.58121871948242, -31.536462783813477, -27.49170684814453, -23.446950912475586, -19.40219497680664, -15.357439041137695, -11.31268310546875, -7.267927169799805, -3.2231712341308594, 0.8215847015380859, 4.866340637207031, 8.911096572875977, 12.955853462219238]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 12.0, 11.0, 9.0, 13.0, 15.0, 21.0, 19.0, 26.0, 23.0, 34.0, 32.0, 41.0, 35.0, 37.0, 42.0, 57.0, 52.0, 44.0, 35.0, 44.0, 53.0, 48.0, 34.0, 29.0, 26.0, 32.0, 28.0, 21.0, 19.0, 14.0, 18.0, 19.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.335044860839844, -10.931319236755371, -10.527593612670898, -10.123868942260742, -9.72014331817627, -9.316417694091797, -8.91269302368164, -8.508967399597168, -8.105241775512695, -7.701516151428223, -7.297791004180908, -6.894065856933594, -6.490340232849121, -6.086614608764648, -5.682889461517334, -5.2791643142700195, -4.875438690185547, -4.471713066101074, -4.06798791885376, -3.664262533187866, -3.2605371475219727, -2.856811761856079, -2.4530863761901855, -2.049360990524292, -1.6456356048583984, -1.2419102191925049, -0.8381848335266113, -0.4344594478607178, -0.03073406219482422, 0.37299132347106934, 0.7767167091369629, 1.1804420948028564, 1.58416748046875, 1.9878928661346436, 2.391618251800537, 2.7953436374664307, 3.199069023132324, 3.6027944087982178, 4.006519794464111, 4.410244941711426, 4.813970565795898, 5.217696189880371, 5.6214213371276855, 6.025146484375, 6.428872108459473, 6.832597732543945, 7.23632287979126, 7.640048027038574, 8.043773651123047, 8.44749927520752, 8.851224899291992, 9.254949569702148, 9.658675193786621, 10.062400817871094, 10.46612548828125, 10.869851112365723, 11.273576736450195, 11.677302360534668, 12.08102798461914, 12.484752655029297, 12.88847827911377, 13.292203903198242, 13.695928573608398, 14.099654197692871, 14.503379821777344]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 12.0, 7.0, 15.0, 22.0, 25.0, 38.0, 53.0, 104.0, 172.0, 354.0, 1657.0, 4285.0, 26019.0, 791880.0, 3052432.0, 300550.0, 13833.0, 1630.0, 547.0, 252.0, 118.0, 90.0, 53.0, 39.0, 24.0, 22.0, 18.0, 12.0, 3.0, 10.0, 0.0, 2.0, 3.0, 2.0], "bins": [-17.859375, -17.45672607421875, -17.0540771484375, -16.65142822265625, -16.248779296875, -15.84613037109375, -15.4434814453125, -15.04083251953125, -14.63818359375, -14.23553466796875, -13.8328857421875, -13.43023681640625, -13.027587890625, -12.62493896484375, -12.2222900390625, -11.81964111328125, -11.4169921875, -11.01434326171875, -10.6116943359375, -10.20904541015625, -9.806396484375, -9.40374755859375, -9.0010986328125, -8.59844970703125, -8.19580078125, -7.79315185546875, -7.3905029296875, -6.98785400390625, -6.585205078125, -6.18255615234375, -5.7799072265625, -5.37725830078125, -4.974609375, -4.57196044921875, -4.1693115234375, -3.76666259765625, -3.364013671875, -2.96136474609375, -2.5587158203125, -2.15606689453125, -1.75341796875, -1.35076904296875, -0.9481201171875, -0.54547119140625, -0.142822265625, 0.25982666015625, 0.6624755859375, 1.06512451171875, 1.4677734375, 1.87042236328125, 2.2730712890625, 2.67572021484375, 3.078369140625, 3.48101806640625, 3.8836669921875, 4.28631591796875, 4.68896484375, 5.09161376953125, 5.4942626953125, 5.89691162109375, 6.299560546875, 6.70220947265625, 7.1048583984375, 7.50750732421875, 7.91015625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 8.0, 23.0, 22.0, 29.0, 41.0, 59.0, 71.0, 56.0, 102.0, 75.0, 74.0, 84.0, 72.0, 75.0, 53.0, 37.0, 33.0, 24.0, 17.0, 13.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9765625, -7.6575927734375, -7.338623046875, -7.0196533203125, -6.70068359375, -6.3817138671875, -6.062744140625, -5.7437744140625, -5.4248046875, -5.1058349609375, -4.786865234375, -4.4678955078125, -4.14892578125, -3.8299560546875, -3.510986328125, -3.1920166015625, -2.873046875, -2.5540771484375, -2.235107421875, -1.9161376953125, -1.59716796875, -1.2781982421875, -0.959228515625, -0.6402587890625, -0.3212890625, -0.0023193359375, 0.316650390625, 0.6356201171875, 0.95458984375, 1.2735595703125, 1.592529296875, 1.9114990234375, 2.23046875, 2.5494384765625, 2.868408203125, 3.1873779296875, 3.50634765625, 3.8253173828125, 4.144287109375, 4.4632568359375, 4.7822265625, 5.1011962890625, 5.420166015625, 5.7391357421875, 6.05810546875, 6.3770751953125, 6.696044921875, 7.0150146484375, 7.333984375, 7.6529541015625, 7.971923828125, 8.2908935546875, 8.60986328125, 8.9288330078125, 9.247802734375, 9.5667724609375, 9.8857421875, 10.2047119140625, 10.523681640625, 10.8426513671875, 11.16162109375, 11.4805908203125, 11.799560546875, 12.1185302734375, 12.4375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 6.0, 8.0, 12.0, 19.0, 30.0, 49.0, 140.0, 597.0, 15211.0, 4176027.0, 1734.0, 280.0, 95.0, 39.0, 20.0, 9.0, 9.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-109.75, -107.4755859375, -105.201171875, -102.9267578125, -100.65234375, -98.3779296875, -96.103515625, -93.8291015625, -91.5546875, -89.2802734375, -87.005859375, -84.7314453125, -82.45703125, -80.1826171875, -77.908203125, -75.6337890625, -73.359375, -71.0849609375, -68.810546875, -66.5361328125, -64.26171875, -61.9873046875, -59.712890625, -57.4384765625, -55.1640625, -52.8896484375, -50.615234375, -48.3408203125, -46.06640625, -43.7919921875, -41.517578125, -39.2431640625, -36.96875, -34.6943359375, -32.419921875, -30.1455078125, -27.87109375, -25.5966796875, -23.322265625, -21.0478515625, -18.7734375, -16.4990234375, -14.224609375, -11.9501953125, -9.67578125, -7.4013671875, -5.126953125, -2.8525390625, -0.578125, 1.6962890625, 3.970703125, 6.2451171875, 8.51953125, 10.7939453125, 13.068359375, 15.3427734375, 17.6171875, 19.8916015625, 22.166015625, 24.4404296875, 26.71484375, 28.9892578125, 31.263671875, 33.5380859375, 35.8125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 7.0, 14.0, 36.0, 67.0, 176.0, 676.0, 1679.0, 1033.0, 226.0, 73.0, 43.0, 18.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.2734375, -9.03338623046875, -8.7933349609375, -8.55328369140625, -8.313232421875, -8.07318115234375, -7.8331298828125, -7.59307861328125, -7.35302734375, -7.11297607421875, -6.8729248046875, -6.63287353515625, -6.392822265625, -6.15277099609375, -5.9127197265625, -5.67266845703125, -5.4326171875, -5.19256591796875, -4.9525146484375, -4.71246337890625, -4.472412109375, -4.23236083984375, -3.9923095703125, -3.75225830078125, -3.51220703125, -3.27215576171875, -3.0321044921875, -2.79205322265625, -2.552001953125, -2.31195068359375, -2.0718994140625, -1.83184814453125, -1.591796875, -1.35174560546875, -1.1116943359375, -0.87164306640625, -0.631591796875, -0.39154052734375, -0.1514892578125, 0.08856201171875, 0.32861328125, 0.56866455078125, 0.8087158203125, 1.04876708984375, 1.288818359375, 1.52886962890625, 1.7689208984375, 2.00897216796875, 2.2490234375, 2.48907470703125, 2.7291259765625, 2.96917724609375, 3.209228515625, 3.44927978515625, 3.6893310546875, 3.92938232421875, 4.16943359375, 4.40948486328125, 4.6495361328125, 4.88958740234375, 5.129638671875, 5.36968994140625, 5.6097412109375, 5.84979248046875, 6.08984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 11.0, 7.0, 13.0, 25.0, 37.0, 42.0, 91.0, 118.0, 136.0, 151.0, 122.0, 82.0, 62.0, 27.0, 27.0, 12.0, 14.0, 9.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.673105239868164, -9.359976768493652, -9.04684829711914, -8.733719825744629, -8.420591354370117, -8.107461929321289, -7.794333457946777, -7.481204986572266, -7.168076515197754, -6.854948043823242, -6.5418195724487305, -6.2286906242370605, -5.915562152862549, -5.602433681488037, -5.289304733276367, -4.9761762619018555, -4.663047790527344, -4.349919319152832, -4.03679084777832, -3.7236618995666504, -3.4105334281921387, -3.097404956817627, -2.784276247024536, -2.4711475372314453, -2.1580190658569336, -1.8448904752731323, -1.531761884689331, -1.2186332941055298, -0.9055047035217285, -0.5923761129379272, -0.279247522354126, 0.033881187438964844, 0.34701061248779297, 0.6601392030715942, 0.9732677936553955, 1.2863963842391968, 1.599524974822998, 1.9126535654067993, 2.2257821559906006, 2.5389108657836914, 2.852039337158203, 3.165167808532715, 3.4782965183258057, 3.7914252281188965, 4.104553699493408, 4.41768217086792, 4.73081111907959, 5.043939590454102, 5.357068061828613, 5.670196533203125, 5.983325004577637, 6.296453952789307, 6.609582424163818, 6.92271089553833, 7.23583984375, 7.548968315124512, 7.862096786499023, 8.175225257873535, 8.488353729248047, 8.801482200622559, 9.11461067199707, 9.427740097045898, 9.74086856842041, 10.053997039794922, 10.367125511169434]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 6.0, 16.0, 15.0, 20.0, 19.0, 21.0, 27.0, 37.0, 55.0, 60.0, 73.0, 62.0, 74.0, 48.0, 54.0, 72.0, 69.0, 57.0, 45.0, 33.0, 32.0, 24.0, 22.0, 20.0, 12.0, 10.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.829596519470215, -6.547545909881592, -6.265495300292969, -5.983444690704346, -5.701394081115723, -5.419343948364258, -5.137293338775635, -4.855242729187012, -4.573192119598389, -4.291141510009766, -4.009090900421143, -3.7270405292510986, -3.4449899196624756, -3.1629393100738525, -2.8808889389038086, -2.5988383293151855, -2.3167877197265625, -2.0347371101379395, -1.752686619758606, -1.4706361293792725, -1.1885855197906494, -0.9065349102020264, -0.6244844198226929, -0.3424339294433594, -0.06038331985473633, 0.22166723012924194, 0.5037177801132202, 0.7857683300971985, 1.0678188800811768, 1.3498694896697998, 1.6319199800491333, 1.9139704704284668, 2.1960220336914062, 2.4780726432800293, 2.7601232528686523, 3.0421736240386963, 3.3242242336273193, 3.6062748432159424, 3.8883252143859863, 4.170375823974609, 4.452426433563232, 4.7344770431518555, 5.0165276527404785, 5.298578262329102, 5.580628395080566, 5.862679481506348, 6.1447296142578125, 6.4267802238464355, 6.708830833435059, 6.990881443023682, 7.272932052612305, 7.554982662200928, 7.837033271789551, 8.119083404541016, 8.401134490966797, 8.683184623718262, 8.965234756469727, 9.247284889221191, 9.529335975646973, 9.811386108398438, 10.093437194824219, 10.375487327575684, 10.657538414001465, 10.93958854675293, 11.221639633178711]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 9.0, 8.0, 22.0, 17.0, 38.0, 50.0, 81.0, 178.0, 339.0, 770.0, 1722.0, 4201.0, 15477.0, 256909.0, 733281.0, 25991.0, 5468.0, 2115.0, 960.0, 435.0, 181.0, 116.0, 49.0, 38.0, 29.0, 18.0, 15.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.623046875, -3.53045654296875, -3.4378662109375, -3.34527587890625, -3.252685546875, -3.16009521484375, -3.0675048828125, -2.97491455078125, -2.88232421875, -2.78973388671875, -2.6971435546875, -2.60455322265625, -2.511962890625, -2.41937255859375, -2.3267822265625, -2.23419189453125, -2.1416015625, -2.04901123046875, -1.9564208984375, -1.86383056640625, -1.771240234375, -1.67864990234375, -1.5860595703125, -1.49346923828125, -1.40087890625, -1.30828857421875, -1.2156982421875, -1.12310791015625, -1.030517578125, -0.93792724609375, -0.8453369140625, -0.75274658203125, -0.66015625, -0.56756591796875, -0.4749755859375, -0.38238525390625, -0.289794921875, -0.19720458984375, -0.1046142578125, -0.01202392578125, 0.08056640625, 0.17315673828125, 0.2657470703125, 0.35833740234375, 0.450927734375, 0.54351806640625, 0.6361083984375, 0.72869873046875, 0.8212890625, 0.91387939453125, 1.0064697265625, 1.09906005859375, 1.191650390625, 1.28424072265625, 1.3768310546875, 1.46942138671875, 1.56201171875, 1.65460205078125, 1.7471923828125, 1.83978271484375, 1.932373046875, 2.02496337890625, 2.1175537109375, 2.21014404296875, 2.302734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 18.0, 16.0, 28.0, 25.0, 42.0, 45.0, 70.0, 78.0, 92.0, 86.0, 81.0, 92.0, 72.0, 68.0, 40.0, 40.0, 34.0, 18.0, 21.0, 12.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.12506103515625, -4.9102783203125, -4.69549560546875, -4.480712890625, -4.26593017578125, -4.0511474609375, -3.83636474609375, -3.62158203125, -3.40679931640625, -3.1920166015625, -2.97723388671875, -2.762451171875, -2.54766845703125, -2.3328857421875, -2.11810302734375, -1.9033203125, -1.68853759765625, -1.4737548828125, -1.25897216796875, -1.044189453125, -0.82940673828125, -0.6146240234375, -0.39984130859375, -0.18505859375, 0.02972412109375, 0.2445068359375, 0.45928955078125, 0.674072265625, 0.88885498046875, 1.1036376953125, 1.31842041015625, 1.533203125, 1.74798583984375, 1.9627685546875, 2.17755126953125, 2.392333984375, 2.60711669921875, 2.8218994140625, 3.03668212890625, 3.25146484375, 3.46624755859375, 3.6810302734375, 3.89581298828125, 4.110595703125, 4.32537841796875, 4.5401611328125, 4.75494384765625, 4.9697265625, 5.18450927734375, 5.3992919921875, 5.61407470703125, 5.828857421875, 6.04364013671875, 6.2584228515625, 6.47320556640625, 6.68798828125, 6.90277099609375, 7.1175537109375, 7.33233642578125, 7.547119140625, 7.76190185546875, 7.9766845703125, 8.19146728515625, 8.40625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 8.0, 6.0, 10.0, 11.0, 11.0, 26.0, 33.0, 47.0, 76.0, 119.0, 195.0, 341.0, 548.0, 992.0, 1910.0, 3823.0, 8420.0, 20049.0, 51799.0, 162348.0, 504775.0, 193809.0, 58770.0, 22227.0, 9309.0, 4294.0, 2036.0, 1026.0, 598.0, 341.0, 216.0, 124.0, 82.0, 59.0, 37.0, 27.0, 11.0, 10.0, 7.0, 10.0, 4.0, 10.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60400390625, -0.5835723876953125, -0.563140869140625, -0.5427093505859375, -0.52227783203125, -0.5018463134765625, -0.481414794921875, -0.4609832763671875, -0.4405517578125, -0.4201202392578125, -0.399688720703125, -0.3792572021484375, -0.35882568359375, -0.3383941650390625, -0.317962646484375, -0.2975311279296875, -0.277099609375, -0.2566680908203125, -0.236236572265625, -0.2158050537109375, -0.19537353515625, -0.1749420166015625, -0.154510498046875, -0.1340789794921875, -0.1136474609375, -0.0932159423828125, -0.072784423828125, -0.0523529052734375, -0.03192138671875, -0.0114898681640625, 0.008941650390625, 0.0293731689453125, 0.0498046875, 0.0702362060546875, 0.090667724609375, 0.1110992431640625, 0.13153076171875, 0.1519622802734375, 0.172393798828125, 0.1928253173828125, 0.2132568359375, 0.2336883544921875, 0.254119873046875, 0.2745513916015625, 0.29498291015625, 0.3154144287109375, 0.335845947265625, 0.3562774658203125, 0.376708984375, 0.3971405029296875, 0.417572021484375, 0.4380035400390625, 0.45843505859375, 0.4788665771484375, 0.499298095703125, 0.5197296142578125, 0.5401611328125, 0.5605926513671875, 0.581024169921875, 0.6014556884765625, 0.62188720703125, 0.6423187255859375, 0.662750244140625, 0.6831817626953125, 0.70361328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 9.0, 7.0, 4.0, 10.0, 5.0, 8.0, 21.0, 29.0, 31.0, 23.0, 34.0, 31.0, 30.0, 44.0, 43.0, 45.0, 55.0, 47.0, 51.0, 56.0, 53.0, 38.0, 42.0, 36.0, 27.0, 31.0, 39.0, 29.0, 25.0, 16.0, 18.0, 14.0, 8.0, 12.0, 3.0, 5.0, 3.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65234375, -5.43792724609375, -5.2235107421875, -5.00909423828125, -4.794677734375, -4.58026123046875, -4.3658447265625, -4.15142822265625, -3.93701171875, -3.72259521484375, -3.5081787109375, -3.29376220703125, -3.079345703125, -2.86492919921875, -2.6505126953125, -2.43609619140625, -2.2216796875, -2.00726318359375, -1.7928466796875, -1.57843017578125, -1.364013671875, -1.14959716796875, -0.9351806640625, -0.72076416015625, -0.50634765625, -0.29193115234375, -0.0775146484375, 0.13690185546875, 0.351318359375, 0.56573486328125, 0.7801513671875, 0.99456787109375, 1.208984375, 1.42340087890625, 1.6378173828125, 1.85223388671875, 2.066650390625, 2.28106689453125, 2.4954833984375, 2.70989990234375, 2.92431640625, 3.13873291015625, 3.3531494140625, 3.56756591796875, 3.781982421875, 3.99639892578125, 4.2108154296875, 4.42523193359375, 4.6396484375, 4.85406494140625, 5.0684814453125, 5.28289794921875, 5.497314453125, 5.71173095703125, 5.9261474609375, 6.14056396484375, 6.35498046875, 6.56939697265625, 6.7838134765625, 6.99822998046875, 7.212646484375, 7.42706298828125, 7.6414794921875, 7.85589599609375, 8.0703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 8.0, 17.0, 27.0, 30.0, 35.0, 51.0, 61.0, 104.0, 149.0, 243.0, 436.0, 973.0, 2015.0, 7173.0, 65899.0, 894411.0, 65509.0, 7148.0, 2092.0, 936.0, 512.0, 266.0, 145.0, 97.0, 64.0, 46.0, 24.0, 24.0, 14.0, 13.0, 11.0, 9.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.345458984375, -0.3354454040527344, -0.32543182373046875, -0.3154182434082031, -0.3054046630859375, -0.2953910827636719, -0.28537750244140625, -0.2753639221191406, -0.265350341796875, -0.2553367614746094, -0.24532318115234375, -0.23530960083007812, -0.2252960205078125, -0.21528244018554688, -0.20526885986328125, -0.19525527954101562, -0.18524169921875, -0.17522811889648438, -0.16521453857421875, -0.15520095825195312, -0.1451873779296875, -0.13517379760742188, -0.12516021728515625, -0.11514663696289062, -0.105133056640625, -0.09511947631835938, -0.08510589599609375, -0.07509231567382812, -0.0650787353515625, -0.055065155029296875, -0.04505157470703125, -0.035037994384765625, -0.0250244140625, -0.015010833740234375, -0.00499725341796875, 0.005016326904296875, 0.0150299072265625, 0.025043487548828125, 0.03505706787109375, 0.045070648193359375, 0.055084228515625, 0.06509780883789062, 0.07511138916015625, 0.08512496948242188, 0.0951385498046875, 0.10515213012695312, 0.11516571044921875, 0.12517929077148438, 0.13519287109375, 0.14520645141601562, 0.15522003173828125, 0.16523361206054688, 0.1752471923828125, 0.18526077270507812, 0.19527435302734375, 0.20528793334960938, 0.215301513671875, 0.22531509399414062, 0.23532867431640625, 0.24534225463867188, 0.2553558349609375, 0.2653694152832031, 0.27538299560546875, 0.2853965759277344, 0.29541015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 14.0, 15.0, 24.0, 43.0, 59.0, 69.0, 70.0, 92.0, 119.0, 98.0, 96.0, 78.0, 57.0, 42.0, 25.0, 23.0, 19.0, 11.0, 5.0, 11.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.556510925292969e-05, -6.367452442646027e-05, -6.178393959999084e-05, -5.989335477352142e-05, -5.8002769947052e-05, -5.611218512058258e-05, -5.422160029411316e-05, -5.233101546764374e-05, -5.0440430641174316e-05, -4.8549845814704895e-05, -4.6659260988235474e-05, -4.476867616176605e-05, -4.287809133529663e-05, -4.098750650882721e-05, -3.909692168235779e-05, -3.720633685588837e-05, -3.5315752029418945e-05, -3.3425167202949524e-05, -3.15345823764801e-05, -2.964399755001068e-05, -2.775341272354126e-05, -2.586282789707184e-05, -2.3972243070602417e-05, -2.2081658244132996e-05, -2.0191073417663574e-05, -1.8300488591194153e-05, -1.640990376472473e-05, -1.451931893825531e-05, -1.2628734111785889e-05, -1.0738149285316467e-05, -8.847564458847046e-06, -6.9569796323776245e-06, -5.066394805908203e-06, -3.1758099794387817e-06, -1.2852251529693604e-06, 6.05359673500061e-07, 2.4959444999694824e-06, 4.386529326438904e-06, 6.277114152908325e-06, 8.167698979377747e-06, 1.0058283805847168e-05, 1.194886863231659e-05, 1.383945345878601e-05, 1.5730038285255432e-05, 1.7620623111724854e-05, 1.9511207938194275e-05, 2.1401792764663696e-05, 2.3292377591133118e-05, 2.518296241760254e-05, 2.707354724407196e-05, 2.8964132070541382e-05, 3.08547168970108e-05, 3.2745301723480225e-05, 3.4635886549949646e-05, 3.652647137641907e-05, 3.841705620288849e-05, 4.030764102935791e-05, 4.219822585582733e-05, 4.408881068229675e-05, 4.5979395508766174e-05, 4.7869980335235596e-05, 4.976056516170502e-05, 5.165114998817444e-05, 5.354173481464386e-05, 5.543231964111328e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 8.0, 11.0, 12.0, 23.0, 44.0, 100.0, 348.0, 1745.0, 36931.0, 1004283.0, 4105.0, 647.0, 171.0, 43.0, 29.0, 16.0, 9.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.798828125, -0.7705078125, -0.7421875, -0.7138671875, -0.685546875, -0.6572265625, -0.62890625, -0.6005859375, -0.572265625, -0.5439453125, -0.515625, -0.4873046875, -0.458984375, -0.4306640625, -0.40234375, -0.3740234375, -0.345703125, -0.3173828125, -0.2890625, -0.2607421875, -0.232421875, -0.2041015625, -0.17578125, -0.1474609375, -0.119140625, -0.0908203125, -0.0625, -0.0341796875, -0.005859375, 0.0224609375, 0.05078125, 0.0791015625, 0.107421875, 0.1357421875, 0.1640625, 0.1923828125, 0.220703125, 0.2490234375, 0.27734375, 0.3056640625, 0.333984375, 0.3623046875, 0.390625, 0.4189453125, 0.447265625, 0.4755859375, 0.50390625, 0.5322265625, 0.560546875, 0.5888671875, 0.6171875, 0.6455078125, 0.673828125, 0.7021484375, 0.73046875, 0.7587890625, 0.787109375, 0.8154296875, 0.84375, 0.8720703125, 0.900390625, 0.9287109375, 0.95703125, 0.9853515625, 1.013671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 12.0, 20.0, 44.0, 90.0, 229.0, 259.0, 160.0, 95.0, 32.0, 16.0, 12.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083740234375, -0.08078861236572266, -0.07783699035644531, -0.07488536834716797, -0.07193374633789062, -0.06898212432861328, -0.06603050231933594, -0.0630788803100586, -0.06012725830078125, -0.057175636291503906, -0.05422401428222656, -0.05127239227294922, -0.048320770263671875, -0.04536914825439453, -0.04241752624511719, -0.039465904235839844, -0.0365142822265625, -0.033562660217285156, -0.030611038208007812, -0.02765941619873047, -0.024707794189453125, -0.02175617218017578, -0.018804550170898438, -0.015852928161621094, -0.01290130615234375, -0.009949684143066406, -0.0069980621337890625, -0.004046440124511719, -0.001094818115234375, 0.0018568038940429688, 0.0048084259033203125, 0.007760047912597656, 0.010711669921875, 0.013663291931152344, 0.016614913940429688, 0.01956653594970703, 0.022518157958984375, 0.02546977996826172, 0.028421401977539062, 0.031373023986816406, 0.03432464599609375, 0.037276268005371094, 0.04022789001464844, 0.04317951202392578, 0.046131134033203125, 0.04908275604248047, 0.05203437805175781, 0.054986000061035156, 0.0579376220703125, 0.060889244079589844, 0.06384086608886719, 0.06679248809814453, 0.06974411010742188, 0.07269573211669922, 0.07564735412597656, 0.0785989761352539, 0.08155059814453125, 0.0845022201538086, 0.08745384216308594, 0.09040546417236328, 0.09335708618164062, 0.09630870819091797, 0.09926033020019531, 0.10221195220947266, 0.10516357421875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 23.0, 67.0, 337.0, 425.0, 120.0, 25.0, 4.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.27359390258789, -24.610843658447266, -23.948091506958008, -23.285341262817383, -22.622591018676758, -21.9598388671875, -21.297088623046875, -20.63433837890625, -19.971586227416992, -19.308835983276367, -18.64608383178711, -17.983333587646484, -17.32058334350586, -16.6578311920166, -15.995080947875977, -15.332329750061035, -14.66957950592041, -14.006828308105469, -13.344078063964844, -12.681326866149902, -12.018575668334961, -11.355825424194336, -10.693074226379395, -10.030323028564453, -9.367572784423828, -8.704821586608887, -8.042071342468262, -7.37932014465332, -6.716568946838379, -6.053818225860596, -5.3910675048828125, -4.728316307067871, -4.06556510925293, -3.4028141498565674, -2.740063190460205, -2.077312469482422, -1.4145615100860596, -0.7518105506896973, -0.08905982971191406, 0.5736913681030273, 1.2364420890808105, 1.8991930484771729, 2.561944007873535, 3.2246947288513184, 3.8874456882476807, 4.550196647644043, 5.212947368621826, 5.875698566436768, 6.538449287414551, 7.201200008392334, 7.863951206207275, 8.526701927185059, 9.189453125, 9.852203369140625, 10.514954566955566, 11.177705764770508, 11.840456008911133, 12.503207206726074, 13.1659574508667, 13.82870864868164, 14.491459846496582, 15.154211044311523, 15.816961288452148, 16.479713439941406, 17.14246368408203]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 8.0, 16.0, 19.0, 27.0, 18.0, 34.0, 49.0, 52.0, 95.0, 82.0, 84.0, 69.0, 70.0, 84.0, 69.0, 56.0, 39.0, 32.0, 31.0, 23.0, 14.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.827327728271484, -4.627806663513184, -4.428285121917725, -4.228764057159424, -4.029242515563965, -3.829721450805664, -3.6302003860473633, -3.4306790828704834, -3.2311577796936035, -3.0316364765167236, -2.8321151733398438, -2.632594108581543, -2.433072805404663, -2.233551502227783, -2.0340304374694824, -1.8345091342926025, -1.6349878311157227, -1.4354665279388428, -1.2359453439712524, -1.036424160003662, -0.8369028568267822, -0.6373816132545471, -0.437860369682312, -0.23833918571472168, -0.0388178825378418, 0.1607033610343933, 0.3602246046066284, 0.5597458481788635, 0.7592670917510986, 0.9587883353233337, 1.1583095788955688, 1.3578307628631592, 1.5573525428771973, 1.7568738460540771, 1.9563950300216675, 2.155916213989258, 2.3554375171661377, 2.5549588203430176, 2.7544798851013184, 2.9540011882781982, 3.153522491455078, 3.353043794631958, 3.552565097808838, 3.7520861625671387, 3.9516074657440186, 4.151128768920898, 4.350649833679199, 4.5501708984375, 4.749692440032959, 4.94921350479126, 5.148735046386719, 5.3482561111450195, 5.54777717590332, 5.747298717498779, 5.94681978225708, 6.146341323852539, 6.34586238861084, 6.545383453369141, 6.7449049949646, 6.9444260597229, 7.143947601318359, 7.34346866607666, 7.542989730834961, 7.742510795593262, 7.942032337188721]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 20.0, 17.0, 28.0, 36.0, 87.0, 152.0, 277.0, 606.0, 1362.0, 4074.0, 16488.0, 99666.0, 579280.0, 294071.0, 40213.0, 8057.0, 2349.0, 888.0, 378.0, 198.0, 102.0, 80.0, 47.0, 27.0, 13.0, 9.0, 6.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.166259765625, -4.99267578125, -4.819091796875, -4.6455078125, -4.471923828125, -4.29833984375, -4.124755859375, -3.951171875, -3.777587890625, -3.60400390625, -3.430419921875, -3.2568359375, -3.083251953125, -2.90966796875, -2.736083984375, -2.5625, -2.388916015625, -2.21533203125, -2.041748046875, -1.8681640625, -1.694580078125, -1.52099609375, -1.347412109375, -1.173828125, -1.000244140625, -0.82666015625, -0.653076171875, -0.4794921875, -0.305908203125, -0.13232421875, 0.041259765625, 0.21484375, 0.388427734375, 0.56201171875, 0.735595703125, 0.9091796875, 1.082763671875, 1.25634765625, 1.429931640625, 1.603515625, 1.777099609375, 1.95068359375, 2.124267578125, 2.2978515625, 2.471435546875, 2.64501953125, 2.818603515625, 2.9921875, 3.165771484375, 3.33935546875, 3.512939453125, 3.6865234375, 3.860107421875, 4.03369140625, 4.207275390625, 4.380859375, 4.554443359375, 4.72802734375, 4.901611328125, 5.0751953125, 5.248779296875, 5.42236328125, 5.595947265625, 5.76953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 20.0, 12.0, 19.0, 19.0, 21.0, 24.0, 27.0, 30.0, 49.0, 62.0, 52.0, 58.0, 74.0, 59.0, 66.0, 61.0, 43.0, 48.0, 41.0, 54.0, 29.0, 21.0, 24.0, 17.0, 14.0, 14.0, 9.0, 5.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.69342041015625, -6.4298095703125, -6.16619873046875, -5.902587890625, -5.63897705078125, -5.3753662109375, -5.11175537109375, -4.84814453125, -4.58453369140625, -4.3209228515625, -4.05731201171875, -3.793701171875, -3.53009033203125, -3.2664794921875, -3.00286865234375, -2.7392578125, -2.47564697265625, -2.2120361328125, -1.94842529296875, -1.684814453125, -1.42120361328125, -1.1575927734375, -0.89398193359375, -0.63037109375, -0.36676025390625, -0.1031494140625, 0.16046142578125, 0.424072265625, 0.68768310546875, 0.9512939453125, 1.21490478515625, 1.478515625, 1.74212646484375, 2.0057373046875, 2.26934814453125, 2.532958984375, 2.79656982421875, 3.0601806640625, 3.32379150390625, 3.58740234375, 3.85101318359375, 4.1146240234375, 4.37823486328125, 4.641845703125, 4.90545654296875, 5.1690673828125, 5.43267822265625, 5.6962890625, 5.95989990234375, 6.2235107421875, 6.48712158203125, 6.750732421875, 7.01434326171875, 7.2779541015625, 7.54156494140625, 7.80517578125, 8.06878662109375, 8.3323974609375, 8.59600830078125, 8.859619140625, 9.12322998046875, 9.3868408203125, 9.65045166015625, 9.9140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 8.0, 24.0, 23.0, 21.0, 23.0, 46.0, 51.0, 59.0, 74.0, 93.0, 131.0, 227.0, 539.0, 5735.0, 1012444.0, 27461.0, 725.0, 250.0, 123.0, 91.0, 73.0, 67.0, 48.0, 27.0, 34.0, 26.0, 23.0, 11.0, 9.0, 15.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.109375, -21.36328125, -20.6171875, -19.87109375, -19.125, -18.37890625, -17.6328125, -16.88671875, -16.140625, -15.39453125, -14.6484375, -13.90234375, -13.15625, -12.41015625, -11.6640625, -10.91796875, -10.171875, -9.42578125, -8.6796875, -7.93359375, -7.1875, -6.44140625, -5.6953125, -4.94921875, -4.203125, -3.45703125, -2.7109375, -1.96484375, -1.21875, -0.47265625, 0.2734375, 1.01953125, 1.765625, 2.51171875, 3.2578125, 4.00390625, 4.75, 5.49609375, 6.2421875, 6.98828125, 7.734375, 8.48046875, 9.2265625, 9.97265625, 10.71875, 11.46484375, 12.2109375, 12.95703125, 13.703125, 14.44921875, 15.1953125, 15.94140625, 16.6875, 17.43359375, 18.1796875, 18.92578125, 19.671875, 20.41796875, 21.1640625, 21.91015625, 22.65625, 23.40234375, 24.1484375, 24.89453125, 25.640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 3.0, 11.0, 6.0, 16.0, 26.0, 17.0, 19.0, 33.0, 37.0, 43.0, 55.0, 43.0, 53.0, 44.0, 55.0, 62.0, 62.0, 43.0, 51.0, 40.0, 37.0, 48.0, 27.0, 36.0, 28.0, 25.0, 23.0, 11.0, 11.0, 10.0, 9.0, 3.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6796875, -8.4229736328125, -8.166259765625, -7.9095458984375, -7.65283203125, -7.3961181640625, -7.139404296875, -6.8826904296875, -6.6259765625, -6.3692626953125, -6.112548828125, -5.8558349609375, -5.59912109375, -5.3424072265625, -5.085693359375, -4.8289794921875, -4.572265625, -4.3155517578125, -4.058837890625, -3.8021240234375, -3.54541015625, -3.2886962890625, -3.031982421875, -2.7752685546875, -2.5185546875, -2.2618408203125, -2.005126953125, -1.7484130859375, -1.49169921875, -1.2349853515625, -0.978271484375, -0.7215576171875, -0.46484375, -0.2081298828125, 0.048583984375, 0.3052978515625, 0.56201171875, 0.8187255859375, 1.075439453125, 1.3321533203125, 1.5888671875, 1.8455810546875, 2.102294921875, 2.3590087890625, 2.61572265625, 2.8724365234375, 3.129150390625, 3.3858642578125, 3.642578125, 3.8992919921875, 4.156005859375, 4.4127197265625, 4.66943359375, 4.9261474609375, 5.182861328125, 5.4395751953125, 5.6962890625, 5.9530029296875, 6.209716796875, 6.4664306640625, 6.72314453125, 6.9798583984375, 7.236572265625, 7.4932861328125, 7.75]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 10.0, 5.0, 11.0, 19.0, 28.0, 33.0, 99.0, 286.0, 1643.0, 796039.0, 248608.0, 1322.0, 244.0, 94.0, 36.0, 13.0, 16.0, 5.0, 6.0, 6.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.011474609375, -8.71044921875, -8.409423828125, -8.1083984375, -7.807373046875, -7.50634765625, -7.205322265625, -6.904296875, -6.603271484375, -6.30224609375, -6.001220703125, -5.7001953125, -5.399169921875, -5.09814453125, -4.797119140625, -4.49609375, -4.195068359375, -3.89404296875, -3.593017578125, -3.2919921875, -2.990966796875, -2.68994140625, -2.388916015625, -2.087890625, -1.786865234375, -1.48583984375, -1.184814453125, -0.8837890625, -0.582763671875, -0.28173828125, 0.019287109375, 0.3203125, 0.621337890625, 0.92236328125, 1.223388671875, 1.5244140625, 1.825439453125, 2.12646484375, 2.427490234375, 2.728515625, 3.029541015625, 3.33056640625, 3.631591796875, 3.9326171875, 4.233642578125, 4.53466796875, 4.835693359375, 5.13671875, 5.437744140625, 5.73876953125, 6.039794921875, 6.3408203125, 6.641845703125, 6.94287109375, 7.243896484375, 7.544921875, 7.845947265625, 8.14697265625, 8.447998046875, 8.7490234375, 9.050048828125, 9.35107421875, 9.652099609375, 9.953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 17.0, 34.0, 54.0, 79.0, 134.0, 159.0, 187.0, 138.0, 102.0, 52.0, 24.0, 11.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004165172576904297, -0.00040461495518684387, -0.00039271265268325806, -0.00038081035017967224, -0.0003689080476760864, -0.0003570057451725006, -0.0003451034426689148, -0.000333201140165329, -0.00032129883766174316, -0.00030939653515815735, -0.00029749423265457153, -0.0002855919301509857, -0.0002736896276473999, -0.0002617873251438141, -0.00024988502264022827, -0.00023798272013664246, -0.00022608041763305664, -0.00021417811512947083, -0.000202275812625885, -0.0001903735101222992, -0.00017847120761871338, -0.00016656890511512756, -0.00015466660261154175, -0.00014276430010795593, -0.00013086199760437012, -0.0001189596951007843, -0.00010705739259719849, -9.515509009361267e-05, -8.325278759002686e-05, -7.135048508644104e-05, -5.9448182582855225e-05, -4.754588007926941e-05, -3.5643577575683594e-05, -2.374127507209778e-05, -1.1838972568511963e-05, 6.332993507385254e-08, 1.1965632438659668e-05, 2.3867934942245483e-05, 3.57702374458313e-05, 4.7672539949417114e-05, 5.957484245300293e-05, 7.147714495658875e-05, 8.337944746017456e-05, 9.528174996376038e-05, 0.00010718405246734619, 0.00011908635497093201, 0.00013098865747451782, 0.00014289095997810364, 0.00015479326248168945, 0.00016669556498527527, 0.00017859786748886108, 0.0001905001699924469, 0.00020240247249603271, 0.00021430477499961853, 0.00022620707750320435, 0.00023810938000679016, 0.000250011682510376, 0.0002619139850139618, 0.0002738162875175476, 0.0002857185900211334, 0.00029762089252471924, 0.00030952319502830505, 0.00032142549753189087, 0.0003333278000354767, 0.0003452301025390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 5.0, 5.0, 3.0, 4.0, 7.0, 8.0, 12.0, 10.0, 16.0, 38.0, 83.0, 201.0, 699.0, 8116.0, 1003072.0, 34471.0, 1319.0, 263.0, 96.0, 54.0, 20.0, 14.0, 16.0, 7.0, 8.0, 5.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.7734375, -8.55224609375, -8.3310546875, -8.10986328125, -7.888671875, -7.66748046875, -7.4462890625, -7.22509765625, -7.00390625, -6.78271484375, -6.5615234375, -6.34033203125, -6.119140625, -5.89794921875, -5.6767578125, -5.45556640625, -5.234375, -5.01318359375, -4.7919921875, -4.57080078125, -4.349609375, -4.12841796875, -3.9072265625, -3.68603515625, -3.46484375, -3.24365234375, -3.0224609375, -2.80126953125, -2.580078125, -2.35888671875, -2.1376953125, -1.91650390625, -1.6953125, -1.47412109375, -1.2529296875, -1.03173828125, -0.810546875, -0.58935546875, -0.3681640625, -0.14697265625, 0.07421875, 0.29541015625, 0.5166015625, 0.73779296875, 0.958984375, 1.18017578125, 1.4013671875, 1.62255859375, 1.84375, 2.06494140625, 2.2861328125, 2.50732421875, 2.728515625, 2.94970703125, 3.1708984375, 3.39208984375, 3.61328125, 3.83447265625, 4.0556640625, 4.27685546875, 4.498046875, 4.71923828125, 4.9404296875, 5.16162109375, 5.3828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 7.0, 4.0, 9.0, 17.0, 25.0, 44.0, 106.0, 154.0, 198.0, 169.0, 116.0, 60.0, 22.0, 14.0, 14.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.06640625, -2.0142669677734375, -1.962127685546875, -1.9099884033203125, -1.85784912109375, -1.8057098388671875, -1.753570556640625, -1.7014312744140625, -1.6492919921875, -1.5971527099609375, -1.545013427734375, -1.4928741455078125, -1.44073486328125, -1.3885955810546875, -1.336456298828125, -1.2843170166015625, -1.232177734375, -1.1800384521484375, -1.127899169921875, -1.0757598876953125, -1.02362060546875, -0.9714813232421875, -0.919342041015625, -0.8672027587890625, -0.8150634765625, -0.7629241943359375, -0.710784912109375, -0.6586456298828125, -0.60650634765625, -0.5543670654296875, -0.502227783203125, -0.4500885009765625, -0.39794921875, -0.3458099365234375, -0.293670654296875, -0.2415313720703125, -0.18939208984375, -0.1372528076171875, -0.085113525390625, -0.0329742431640625, 0.0191650390625, 0.0713043212890625, 0.123443603515625, 0.1755828857421875, 0.22772216796875, 0.2798614501953125, 0.332000732421875, 0.3841400146484375, 0.436279296875, 0.4884185791015625, 0.540557861328125, 0.5926971435546875, 0.64483642578125, 0.6969757080078125, 0.749114990234375, 0.8012542724609375, 0.8533935546875, 0.9055328369140625, 0.957672119140625, 1.0098114013671875, 1.06195068359375, 1.1140899658203125, 1.166229248046875, 1.2183685302734375, 1.2705078125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 12.0, 106.0, 765.0, 126.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-153.80059814453125, -151.1250457763672, -148.44949340820312, -145.77394104003906, -143.098388671875, -140.42283630371094, -137.74728393554688, -135.07171630859375, -132.3961639404297, -129.72061157226562, -127.04505920410156, -124.3695068359375, -121.6939468383789, -119.01839447021484, -116.34284210205078, -113.66728973388672, -110.99174499511719, -108.31619262695312, -105.64064025878906, -102.965087890625, -100.2895278930664, -97.61397552490234, -94.93842315673828, -92.26287078857422, -89.58731079101562, -86.91175842285156, -84.2362060546875, -81.56065368652344, -78.88509368896484, -76.20954132080078, -73.53398895263672, -70.85843658447266, -68.1828842163086, -65.50733184814453, -62.8317756652832, -60.15622329711914, -57.48067092895508, -54.80511474609375, -52.12956237792969, -49.454010009765625, -46.7784538269043, -44.102901458740234, -41.427345275878906, -38.751792907714844, -36.07624053955078, -33.40068817138672, -30.72513198852539, -28.049579620361328, -25.374025344848633, -22.698471069335938, -20.022918701171875, -17.34736442565918, -14.6718111038208, -11.996257781982422, -9.320703506469727, -6.645151138305664, -3.9695968627929688, -1.2940433025360107, 1.3815102577209473, 4.057064056396484, 6.732617378234863, 9.408170700073242, 12.083724975585938, 14.75927734375, 17.434831619262695]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 6.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 6.0, 14.0, 10.0, 18.0, 23.0, 22.0, 21.0, 20.0, 27.0, 41.0, 25.0, 28.0, 39.0, 39.0, 36.0, 33.0, 37.0, 39.0, 31.0, 38.0, 44.0, 43.0, 36.0, 29.0, 42.0, 34.0, 27.0, 37.0, 23.0, 20.0, 20.0, 14.0, 12.0, 9.0, 11.0, 7.0, 8.0, 3.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-10.17807388305664, -9.901121139526367, -9.624167442321777, -9.347214698791504, -9.070261001586914, -8.79330825805664, -8.51635456085205, -8.239401817321777, -7.962448596954346, -7.685495376586914, -7.408542156219482, -7.131588935852051, -6.854636192321777, -6.5776824951171875, -6.300729751586914, -6.023776531219482, -5.746823310852051, -5.469870090484619, -5.1929168701171875, -4.915963649749756, -4.639010429382324, -4.362057685852051, -4.085104465484619, -3.8081512451171875, -3.531198024749756, -3.254244804382324, -2.9772915840148926, -2.70033860206604, -2.4233853816986084, -2.1464321613311768, -1.8694790601730347, -1.5925259590148926, -1.3155732154846191, -1.0386199951171875, -0.7616668939590454, -0.48471373319625854, -0.20776057243347168, 0.06919264793395996, 0.34614574909210205, 0.6230988502502441, 0.9000520706176758, 1.1770052909851074, 1.4539583921432495, 1.7309114933013916, 2.0078647136688232, 2.284817934036255, 2.5617709159851074, 2.838724136352539, 3.1156773567199707, 3.3926305770874023, 3.669583797454834, 3.9465367794036865, 4.223489761352539, 4.500443458557129, 4.777396202087402, 5.054349422454834, 5.331302642822266, 5.608255863189697, 5.885209083557129, 6.1621623039245605, 6.439115524291992, 6.716068267822266, 6.993021488189697, 7.269974708557129, 7.5469279289245605]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 17.0, 25.0, 34.0, 65.0, 133.0, 243.0, 551.0, 1468.0, 2808.0, 5818.0, 51823.0, 873984.0, 2673286.0, 537677.0, 38889.0, 5570.0, 1208.0, 303.0, 146.0, 91.0, 49.0, 27.0, 22.0, 9.0, 6.0, 7.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.64453125, -7.35504150390625, -7.0655517578125, -6.77606201171875, -6.486572265625, -6.19708251953125, -5.9075927734375, -5.61810302734375, -5.32861328125, -5.03912353515625, -4.7496337890625, -4.46014404296875, -4.170654296875, -3.88116455078125, -3.5916748046875, -3.30218505859375, -3.0126953125, -2.72320556640625, -2.4337158203125, -2.14422607421875, -1.854736328125, -1.56524658203125, -1.2757568359375, -0.98626708984375, -0.69677734375, -0.40728759765625, -0.1177978515625, 0.17169189453125, 0.461181640625, 0.75067138671875, 1.0401611328125, 1.32965087890625, 1.619140625, 1.90863037109375, 2.1981201171875, 2.48760986328125, 2.777099609375, 3.06658935546875, 3.3560791015625, 3.64556884765625, 3.93505859375, 4.22454833984375, 4.5140380859375, 4.80352783203125, 5.093017578125, 5.38250732421875, 5.6719970703125, 5.96148681640625, 6.2509765625, 6.54046630859375, 6.8299560546875, 7.11944580078125, 7.408935546875, 7.69842529296875, 7.9879150390625, 8.27740478515625, 8.56689453125, 8.85638427734375, 9.1458740234375, 9.43536376953125, 9.724853515625, 10.01434326171875, 10.3038330078125, 10.59332275390625, 10.8828125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 10.0, 18.0, 20.0, 27.0, 40.0, 48.0, 70.0, 71.0, 91.0, 89.0, 88.0, 93.0, 71.0, 75.0, 57.0, 49.0, 22.0, 17.0, 17.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.0546875, -8.7301025390625, -8.405517578125, -8.0809326171875, -7.75634765625, -7.4317626953125, -7.107177734375, -6.7825927734375, -6.4580078125, -6.1334228515625, -5.808837890625, -5.4842529296875, -5.15966796875, -4.8350830078125, -4.510498046875, -4.1859130859375, -3.861328125, -3.5367431640625, -3.212158203125, -2.8875732421875, -2.56298828125, -2.2384033203125, -1.913818359375, -1.5892333984375, -1.2646484375, -0.9400634765625, -0.615478515625, -0.2908935546875, 0.03369140625, 0.3582763671875, 0.682861328125, 1.0074462890625, 1.33203125, 1.6566162109375, 1.981201171875, 2.3057861328125, 2.63037109375, 2.9549560546875, 3.279541015625, 3.6041259765625, 3.9287109375, 4.2532958984375, 4.577880859375, 4.9024658203125, 5.22705078125, 5.5516357421875, 5.876220703125, 6.2008056640625, 6.525390625, 6.8499755859375, 7.174560546875, 7.4991455078125, 7.82373046875, 8.1483154296875, 8.472900390625, 8.7974853515625, 9.1220703125, 9.4466552734375, 9.771240234375, 10.0958251953125, 10.42041015625, 10.7449951171875, 11.069580078125, 11.3941650390625, 11.71875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 13.0, 10.0, 6.0, 15.0, 21.0, 46.0, 80.0, 209.0, 786.0, 7083.0, 4084182.0, 98647.0, 2322.0, 484.0, 176.0, 84.0, 36.0, 24.0, 11.0, 14.0, 7.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.875, -21.986328125, -21.09765625, -20.208984375, -19.3203125, -18.431640625, -17.54296875, -16.654296875, -15.765625, -14.876953125, -13.98828125, -13.099609375, -12.2109375, -11.322265625, -10.43359375, -9.544921875, -8.65625, -7.767578125, -6.87890625, -5.990234375, -5.1015625, -4.212890625, -3.32421875, -2.435546875, -1.546875, -0.658203125, 0.23046875, 1.119140625, 2.0078125, 2.896484375, 3.78515625, 4.673828125, 5.5625, 6.451171875, 7.33984375, 8.228515625, 9.1171875, 10.005859375, 10.89453125, 11.783203125, 12.671875, 13.560546875, 14.44921875, 15.337890625, 16.2265625, 17.115234375, 18.00390625, 18.892578125, 19.78125, 20.669921875, 21.55859375, 22.447265625, 23.3359375, 24.224609375, 25.11328125, 26.001953125, 26.890625, 27.779296875, 28.66796875, 29.556640625, 30.4453125, 31.333984375, 32.22265625, 33.111328125, 34.0]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 2.0, 4.0, 0.0, 5.0, 4.0, 14.0, 17.0, 19.0, 39.0, 87.0, 156.0, 470.0, 1006.0, 1238.0, 610.0, 219.0, 81.0, 33.0, 25.0, 15.0, 6.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.85546875, -5.6978759765625, -5.540283203125, -5.3826904296875, -5.22509765625, -5.0675048828125, -4.909912109375, -4.7523193359375, -4.5947265625, -4.4371337890625, -4.279541015625, -4.1219482421875, -3.96435546875, -3.8067626953125, -3.649169921875, -3.4915771484375, -3.333984375, -3.1763916015625, -3.018798828125, -2.8612060546875, -2.70361328125, -2.5460205078125, -2.388427734375, -2.2308349609375, -2.0732421875, -1.9156494140625, -1.758056640625, -1.6004638671875, -1.44287109375, -1.2852783203125, -1.127685546875, -0.9700927734375, -0.8125, -0.6549072265625, -0.497314453125, -0.3397216796875, -0.18212890625, -0.0245361328125, 0.133056640625, 0.2906494140625, 0.4482421875, 0.6058349609375, 0.763427734375, 0.9210205078125, 1.07861328125, 1.2362060546875, 1.393798828125, 1.5513916015625, 1.708984375, 1.8665771484375, 2.024169921875, 2.1817626953125, 2.33935546875, 2.4969482421875, 2.654541015625, 2.8121337890625, 2.9697265625, 3.1273193359375, 3.284912109375, 3.4425048828125, 3.60009765625, 3.7576904296875, 3.915283203125, 4.0728759765625, 4.23046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 5.0, 15.0, 18.0, 44.0, 101.0, 159.0, 225.0, 183.0, 130.0, 70.0, 29.0, 16.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09865951538086, -18.63007164001465, -18.161483764648438, -17.692893981933594, -17.224306106567383, -16.755718231201172, -16.287128448486328, -15.818540573120117, -15.349952697753906, -14.881364822387695, -14.412775993347168, -13.94418716430664, -13.47559928894043, -13.007011413574219, -12.538422584533691, -12.069833755493164, -11.601245880126953, -11.132658004760742, -10.664069175720215, -10.195480346679688, -9.726892471313477, -9.258304595947266, -8.789715766906738, -8.321126937866211, -7.8525390625, -7.383950710296631, -6.915362358093262, -6.446774005889893, -5.978185653686523, -5.509597301483154, -5.041008949279785, -4.572420597076416, -4.103833198547363, -3.635244846343994, -3.166656494140625, -2.698068141937256, -2.2294797897338867, -1.7608914375305176, -1.2923030853271484, -0.8237147331237793, -0.35512638092041016, 0.11346197128295898, 0.5820503234863281, 1.0506386756896973, 1.5192270278930664, 1.9878153800964355, 2.4564037322998047, 2.924992084503174, 3.393580436706543, 3.862168788909912, 4.330757141113281, 4.79934549331665, 5.2679338455200195, 5.736522197723389, 6.205110549926758, 6.673698902130127, 7.142287254333496, 7.610875606536865, 8.079463958740234, 8.548051834106445, 9.016640663146973, 9.4852294921875, 9.953817367553711, 10.422405242919922, 10.89099407196045]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 7.0, 5.0, 14.0, 17.0, 14.0, 24.0, 31.0, 36.0, 54.0, 43.0, 61.0, 43.0, 74.0, 78.0, 54.0, 76.0, 59.0, 51.0, 50.0, 52.0, 39.0, 29.0, 26.0, 21.0, 14.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.8070878982543945, -7.552324295043945, -7.297560691833496, -7.042797088623047, -6.788033485412598, -6.533269882202148, -6.278506755828857, -6.023743152618408, -5.768979549407959, -5.51421594619751, -5.2594523429870605, -5.004688739776611, -4.74992561340332, -4.495162010192871, -4.240398406982422, -3.9856348037719727, -3.7308712005615234, -3.476107597351074, -3.221343994140625, -2.966580629348755, -2.7118170261383057, -2.4570534229278564, -2.2022900581359863, -1.947526454925537, -1.692762851715088, -1.4379992485046387, -1.183235764503479, -0.9284722208976746, -0.6737086772918701, -0.4189450740814209, -0.16418159008026123, 0.09058189392089844, 0.34534549713134766, 0.6001090407371521, 0.8548725843429565, 1.1096360683441162, 1.3643996715545654, 1.6191632747650146, 1.8739267587661743, 2.128690242767334, 2.383453845977783, 2.6382174491882324, 2.8929810523986816, 3.1477444171905518, 3.402508020401001, 3.65727162361145, 3.9120349884033203, 4.1667985916137695, 4.421562194824219, 4.676325798034668, 4.931089401245117, 5.185853004455566, 5.440616607666016, 5.695380210876465, 5.950143337249756, 6.204906940460205, 6.459670543670654, 6.7144341468811035, 6.969197750091553, 7.223961353302002, 7.478724479675293, 7.733488082885742, 7.988251686096191, 8.24301528930664, 8.49777889251709]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 17.0, 15.0, 23.0, 27.0, 51.0, 75.0, 137.0, 246.0, 515.0, 1152.0, 3197.0, 14292.0, 240112.0, 751734.0, 29112.0, 4797.0, 1626.0, 685.0, 339.0, 138.0, 74.0, 68.0, 39.0, 16.0, 14.0, 8.0, 14.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.466796875, -2.38763427734375, -2.3084716796875, -2.22930908203125, -2.150146484375, -2.07098388671875, -1.9918212890625, -1.91265869140625, -1.83349609375, -1.75433349609375, -1.6751708984375, -1.59600830078125, -1.516845703125, -1.43768310546875, -1.3585205078125, -1.27935791015625, -1.2001953125, -1.12103271484375, -1.0418701171875, -0.96270751953125, -0.883544921875, -0.80438232421875, -0.7252197265625, -0.64605712890625, -0.56689453125, -0.48773193359375, -0.4085693359375, -0.32940673828125, -0.250244140625, -0.17108154296875, -0.0919189453125, -0.01275634765625, 0.06640625, 0.14556884765625, 0.2247314453125, 0.30389404296875, 0.383056640625, 0.46221923828125, 0.5413818359375, 0.62054443359375, 0.69970703125, 0.77886962890625, 0.8580322265625, 0.93719482421875, 1.016357421875, 1.09552001953125, 1.1746826171875, 1.25384521484375, 1.3330078125, 1.41217041015625, 1.4913330078125, 1.57049560546875, 1.649658203125, 1.72882080078125, 1.8079833984375, 1.88714599609375, 1.96630859375, 2.04547119140625, 2.1246337890625, 2.20379638671875, 2.282958984375, 2.36212158203125, 2.4412841796875, 2.52044677734375, 2.599609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 8.0, 9.0, 22.0, 18.0, 25.0, 46.0, 43.0, 60.0, 70.0, 79.0, 88.0, 86.0, 87.0, 65.0, 67.0, 71.0, 32.0, 35.0, 26.0, 22.0, 14.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.875, -5.68603515625, -5.4970703125, -5.30810546875, -5.119140625, -4.93017578125, -4.7412109375, -4.55224609375, -4.36328125, -4.17431640625, -3.9853515625, -3.79638671875, -3.607421875, -3.41845703125, -3.2294921875, -3.04052734375, -2.8515625, -2.66259765625, -2.4736328125, -2.28466796875, -2.095703125, -1.90673828125, -1.7177734375, -1.52880859375, -1.33984375, -1.15087890625, -0.9619140625, -0.77294921875, -0.583984375, -0.39501953125, -0.2060546875, -0.01708984375, 0.171875, 0.36083984375, 0.5498046875, 0.73876953125, 0.927734375, 1.11669921875, 1.3056640625, 1.49462890625, 1.68359375, 1.87255859375, 2.0615234375, 2.25048828125, 2.439453125, 2.62841796875, 2.8173828125, 3.00634765625, 3.1953125, 3.38427734375, 3.5732421875, 3.76220703125, 3.951171875, 4.14013671875, 4.3291015625, 4.51806640625, 4.70703125, 4.89599609375, 5.0849609375, 5.27392578125, 5.462890625, 5.65185546875, 5.8408203125, 6.02978515625, 6.21875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 4.0, 11.0, 10.0, 19.0, 23.0, 34.0, 74.0, 83.0, 118.0, 225.0, 392.0, 686.0, 1232.0, 2475.0, 5291.0, 12451.0, 32437.0, 99151.0, 411658.0, 348260.0, 84621.0, 28633.0, 10955.0, 4788.0, 2278.0, 1159.0, 571.0, 333.0, 219.0, 116.0, 67.0, 49.0, 40.0, 23.0, 18.0, 15.0, 9.0, 8.0, 2.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.5967636108398438, -0.5768280029296875, -0.5568923950195312, -0.536956787109375, -0.5170211791992188, -0.4970855712890625, -0.47714996337890625, -0.45721435546875, -0.43727874755859375, -0.4173431396484375, -0.39740753173828125, -0.377471923828125, -0.35753631591796875, -0.3376007080078125, -0.31766510009765625, -0.2977294921875, -0.27779388427734375, -0.2578582763671875, -0.23792266845703125, -0.217987060546875, -0.19805145263671875, -0.1781158447265625, -0.15818023681640625, -0.13824462890625, -0.11830902099609375, -0.0983734130859375, -0.07843780517578125, -0.058502197265625, -0.03856658935546875, -0.0186309814453125, 0.00130462646484375, 0.021240234375, 0.04117584228515625, 0.0611114501953125, 0.08104705810546875, 0.100982666015625, 0.12091827392578125, 0.1408538818359375, 0.16078948974609375, 0.18072509765625, 0.20066070556640625, 0.2205963134765625, 0.24053192138671875, 0.260467529296875, 0.28040313720703125, 0.3003387451171875, 0.32027435302734375, 0.3402099609375, 0.36014556884765625, 0.3800811767578125, 0.40001678466796875, 0.419952392578125, 0.43988800048828125, 0.4598236083984375, 0.47975921630859375, 0.49969482421875, 0.5196304321289062, 0.5395660400390625, 0.5595016479492188, 0.579437255859375, 0.5993728637695312, 0.6193084716796875, 0.6392440795898438, 0.6591796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 5.0, 2.0, 0.0, 8.0, 6.0, 10.0, 8.0, 18.0, 16.0, 13.0, 31.0, 23.0, 35.0, 32.0, 42.0, 44.0, 53.0, 57.0, 40.0, 45.0, 56.0, 53.0, 41.0, 53.0, 39.0, 32.0, 40.0, 28.0, 27.0, 30.0, 20.0, 20.0, 12.0, 14.0, 12.0, 10.0, 13.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.11328125, -5.91668701171875, -5.7200927734375, -5.52349853515625, -5.326904296875, -5.13031005859375, -4.9337158203125, -4.73712158203125, -4.54052734375, -4.34393310546875, -4.1473388671875, -3.95074462890625, -3.754150390625, -3.55755615234375, -3.3609619140625, -3.16436767578125, -2.9677734375, -2.77117919921875, -2.5745849609375, -2.37799072265625, -2.181396484375, -1.98480224609375, -1.7882080078125, -1.59161376953125, -1.39501953125, -1.19842529296875, -1.0018310546875, -0.80523681640625, -0.608642578125, -0.41204833984375, -0.2154541015625, -0.01885986328125, 0.177734375, 0.37432861328125, 0.5709228515625, 0.76751708984375, 0.964111328125, 1.16070556640625, 1.3572998046875, 1.55389404296875, 1.75048828125, 1.94708251953125, 2.1436767578125, 2.34027099609375, 2.536865234375, 2.73345947265625, 2.9300537109375, 3.12664794921875, 3.3232421875, 3.51983642578125, 3.7164306640625, 3.91302490234375, 4.109619140625, 4.30621337890625, 4.5028076171875, 4.69940185546875, 4.89599609375, 5.09259033203125, 5.2891845703125, 5.48577880859375, 5.682373046875, 5.87896728515625, 6.0755615234375, 6.27215576171875, 6.46875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 4.0, 11.0, 14.0, 26.0, 24.0, 27.0, 54.0, 81.0, 134.0, 227.0, 444.0, 1028.0, 3031.0, 9529.0, 40243.0, 218315.0, 568865.0, 163142.0, 31281.0, 7780.0, 2410.0, 964.0, 392.0, 188.0, 119.0, 73.0, 43.0, 37.0, 12.0, 16.0, 16.0, 4.0, 5.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10565185546875, -0.10266876220703125, -0.0996856689453125, -0.09670257568359375, -0.093719482421875, -0.09073638916015625, -0.0877532958984375, -0.08477020263671875, -0.081787109375, -0.07880401611328125, -0.0758209228515625, -0.07283782958984375, -0.069854736328125, -0.06687164306640625, -0.0638885498046875, -0.06090545654296875, -0.05792236328125, -0.05493927001953125, -0.0519561767578125, -0.04897308349609375, -0.045989990234375, -0.04300689697265625, -0.0400238037109375, -0.03704071044921875, -0.0340576171875, -0.03107452392578125, -0.0280914306640625, -0.02510833740234375, -0.022125244140625, -0.01914215087890625, -0.0161590576171875, -0.01317596435546875, -0.01019287109375, -0.00720977783203125, -0.0042266845703125, -0.00124359130859375, 0.001739501953125, 0.00472259521484375, 0.0077056884765625, 0.01068878173828125, 0.013671875, 0.01665496826171875, 0.0196380615234375, 0.02262115478515625, 0.025604248046875, 0.02858734130859375, 0.0315704345703125, 0.03455352783203125, 0.03753662109375, 0.04051971435546875, 0.0435028076171875, 0.04648590087890625, 0.049468994140625, 0.05245208740234375, 0.0554351806640625, 0.05841827392578125, 0.0614013671875, 0.06438446044921875, 0.0673675537109375, 0.07035064697265625, 0.073333740234375, 0.07631683349609375, 0.0792999267578125, 0.08228302001953125, 0.08526611328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 9.0, 11.0, 11.0, 26.0, 35.0, 43.0, 67.0, 88.0, 123.0, 142.0, 121.0, 95.0, 67.0, 60.0, 34.0, 27.0, 19.0, 12.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.66191291809082e-05, -9.445194154977798e-05, -9.228475391864777e-05, -9.011756628751755e-05, -8.795037865638733e-05, -8.578319102525711e-05, -8.361600339412689e-05, -8.144881576299667e-05, -7.928162813186646e-05, -7.711444050073624e-05, -7.494725286960602e-05, -7.27800652384758e-05, -7.061287760734558e-05, -6.844568997621536e-05, -6.627850234508514e-05, -6.411131471395493e-05, -6.194412708282471e-05, -5.977693945169449e-05, -5.760975182056427e-05, -5.544256418943405e-05, -5.327537655830383e-05, -5.1108188927173615e-05, -4.8941001296043396e-05, -4.677381366491318e-05, -4.460662603378296e-05, -4.243943840265274e-05, -4.027225077152252e-05, -3.8105063140392303e-05, -3.5937875509262085e-05, -3.3770687878131866e-05, -3.160350024700165e-05, -2.943631261587143e-05, -2.726912498474121e-05, -2.5101937353610992e-05, -2.2934749722480774e-05, -2.0767562091350555e-05, -1.8600374460220337e-05, -1.643318682909012e-05, -1.42659991979599e-05, -1.2098811566829681e-05, -9.931623935699463e-06, -7.764436304569244e-06, -5.597248673439026e-06, -3.4300610423088074e-06, -1.2628734111785889e-06, 9.043142199516296e-07, 3.071501851081848e-06, 5.238689482212067e-06, 7.405877113342285e-06, 9.573064744472504e-06, 1.1740252375602722e-05, 1.390744000673294e-05, 1.607462763786316e-05, 1.8241815268993378e-05, 2.0409002900123596e-05, 2.2576190531253815e-05, 2.4743378162384033e-05, 2.6910565793514252e-05, 2.907775342464447e-05, 3.124494105577469e-05, 3.341212868690491e-05, 3.5579316318035126e-05, 3.7746503949165344e-05, 3.991369158029556e-05, 4.208087921142578e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 9.0, 11.0, 12.0, 13.0, 25.0, 42.0, 53.0, 87.0, 186.0, 532.0, 2020.0, 12074.0, 161044.0, 796744.0, 66778.0, 6882.0, 1298.0, 366.0, 147.0, 74.0, 40.0, 28.0, 19.0, 10.0, 13.0, 5.0, 12.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17431640625, -0.1693859100341797, -0.16445541381835938, -0.15952491760253906, -0.15459442138671875, -0.14966392517089844, -0.14473342895507812, -0.1398029327392578, -0.1348724365234375, -0.1299419403076172, -0.12501144409179688, -0.12008094787597656, -0.11515045166015625, -0.11021995544433594, -0.10528945922851562, -0.10035896301269531, -0.095428466796875, -0.09049797058105469, -0.08556747436523438, -0.08063697814941406, -0.07570648193359375, -0.07077598571777344, -0.06584548950195312, -0.06091499328613281, -0.0559844970703125, -0.05105400085449219, -0.046123504638671875, -0.04119300842285156, -0.03626251220703125, -0.03133201599121094, -0.026401519775390625, -0.021471023559570312, -0.01654052734375, -0.011610031127929688, -0.006679534912109375, -0.0017490386962890625, 0.00318145751953125, 0.008111953735351562, 0.013042449951171875, 0.017972946166992188, 0.0229034423828125, 0.027833938598632812, 0.032764434814453125, 0.03769493103027344, 0.04262542724609375, 0.04755592346191406, 0.052486419677734375, 0.05741691589355469, 0.062347412109375, 0.06727790832519531, 0.07220840454101562, 0.07713890075683594, 0.08206939697265625, 0.08699989318847656, 0.09193038940429688, 0.09686088562011719, 0.1017913818359375, 0.10672187805175781, 0.11165237426757812, 0.11658287048339844, 0.12151336669921875, 0.12644386291503906, 0.13137435913085938, 0.1363048553466797, 0.1412353515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 11.0, 4.0, 16.0, 15.0, 27.0, 34.0, 36.0, 57.0, 72.0, 86.0, 82.0, 107.0, 100.0, 89.0, 71.0, 55.0, 29.0, 25.0, 22.0, 19.0, 9.0, 2.0, 9.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.024139404296875, -0.023476839065551758, -0.022814273834228516, -0.022151708602905273, -0.02148914337158203, -0.02082657814025879, -0.020164012908935547, -0.019501447677612305, -0.018838882446289062, -0.01817631721496582, -0.017513751983642578, -0.016851186752319336, -0.016188621520996094, -0.015526056289672852, -0.01486349105834961, -0.014200925827026367, -0.013538360595703125, -0.012875795364379883, -0.01221323013305664, -0.011550664901733398, -0.010888099670410156, -0.010225534439086914, -0.009562969207763672, -0.00890040397644043, -0.008237838745117188, -0.007575273513793945, -0.006912708282470703, -0.006250143051147461, -0.005587577819824219, -0.0049250125885009766, -0.004262447357177734, -0.003599882125854492, -0.00293731689453125, -0.002274751663208008, -0.0016121864318847656, -0.0009496212005615234, -0.00028705596923828125, 0.00037550926208496094, 0.0010380744934082031, 0.0017006397247314453, 0.0023632049560546875, 0.0030257701873779297, 0.003688335418701172, 0.004350900650024414, 0.005013465881347656, 0.0056760311126708984, 0.006338596343994141, 0.007001161575317383, 0.007663726806640625, 0.008326292037963867, 0.00898885726928711, 0.009651422500610352, 0.010313987731933594, 0.010976552963256836, 0.011639118194580078, 0.01230168342590332, 0.012964248657226562, 0.013626813888549805, 0.014289379119873047, 0.014951944351196289, 0.015614509582519531, 0.016277074813842773, 0.016939640045166016, 0.017602205276489258, 0.0182647705078125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 23.0, 333.0, 599.0, 51.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.83651351928711, -45.8217658996582, -44.80701446533203, -43.792266845703125, -42.77751922607422, -41.76277160644531, -40.748023986816406, -39.733272552490234, -38.71852493286133, -37.70377731323242, -36.68902587890625, -35.674278259277344, -34.65953063964844, -33.64478302001953, -32.630035400390625, -31.615283966064453, -30.600536346435547, -29.58578872680664, -28.5710391998291, -27.556289672851562, -26.541542053222656, -25.52679443359375, -24.51204490661621, -23.497295379638672, -22.482547760009766, -21.46780014038086, -20.45305061340332, -19.43830108642578, -18.423553466796875, -17.40880584716797, -16.39405632019043, -15.379307746887207, -14.36456298828125, -13.349814414978027, -12.335065841674805, -11.320317268371582, -10.30556869506836, -9.290820121765137, -8.276071548461914, -7.261322975158691, -6.246574401855469, -5.231825828552246, -4.217077255249023, -3.202328681945801, -2.187580108642578, -1.1728315353393555, -0.1580829620361328, 0.8566656112670898, 1.8714141845703125, 2.886162757873535, 3.900911331176758, 4.9156599044799805, 5.930408477783203, 6.945157051086426, 7.959905624389648, 8.974654197692871, 9.989402770996094, 11.004151344299316, 12.018899917602539, 13.033648490905762, 14.048397064208984, 15.063145637512207, 16.07789421081543, 17.09264373779297, 18.107391357421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 7.0, 14.0, 20.0, 19.0, 36.0, 38.0, 72.0, 73.0, 67.0, 93.0, 93.0, 98.0, 73.0, 71.0, 62.0, 43.0, 42.0, 30.0, 17.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73043155670166, -5.5289998054504395, -5.327568054199219, -5.126136779785156, -4.9247050285339355, -4.723273277282715, -4.521841526031494, -4.320409774780273, -4.118978023529053, -3.917546272277832, -3.7161147594451904, -3.5146830081939697, -3.313251256942749, -3.1118197441101074, -2.9103879928588867, -2.708956241607666, -2.5075247287750244, -2.3060929775238037, -2.104661464691162, -1.9032297134399414, -1.7017979621887207, -1.5003663301467896, -1.2989346981048584, -1.0975029468536377, -0.8960713148117065, -0.6946396231651306, -0.4932079613208771, -0.29177629947662354, -0.09034460783004761, 0.11108708381652832, 0.3125187158584595, 0.5139504671096802, 0.7153820991516113, 0.9168137907981873, 1.1182454824447632, 1.3196771144866943, 1.521108865737915, 1.7225404977798462, 1.9239721298217773, 2.125403881072998, 2.3268356323242188, 2.5282673835754395, 2.729698896408081, 2.9311306476593018, 3.1325623989105225, 3.333993911743164, 3.5354256629943848, 3.7368574142456055, 3.938288927078247, 4.139720439910889, 4.341152191162109, 4.54258394241333, 4.744015693664551, 4.9454474449157715, 5.146879196166992, 5.348310470581055, 5.549742221832275, 5.751173973083496, 5.952605724334717, 6.1540374755859375, 6.35546875, 6.556900501251221, 6.758332252502441, 6.959764003753662, 7.161195755004883]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 9.0, 12.0, 10.0, 30.0, 34.0, 49.0, 71.0, 120.0, 183.0, 308.0, 611.0, 1082.0, 2279.0, 5672.0, 17039.0, 60701.0, 222628.0, 417661.0, 229606.0, 62476.0, 17306.0, 5755.0, 2365.0, 1134.0, 563.0, 286.0, 185.0, 101.0, 102.0, 58.0, 32.0, 21.0, 16.0, 14.0, 4.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.83203125, -3.717681884765625, -3.60333251953125, -3.488983154296875, -3.3746337890625, -3.260284423828125, -3.14593505859375, -3.031585693359375, -2.917236328125, -2.802886962890625, -2.68853759765625, -2.574188232421875, -2.4598388671875, -2.345489501953125, -2.23114013671875, -2.116790771484375, -2.00244140625, -1.888092041015625, -1.77374267578125, -1.659393310546875, -1.5450439453125, -1.430694580078125, -1.31634521484375, -1.201995849609375, -1.087646484375, -0.973297119140625, -0.85894775390625, -0.744598388671875, -0.6302490234375, -0.515899658203125, -0.40155029296875, -0.287200927734375, -0.1728515625, -0.058502197265625, 0.05584716796875, 0.170196533203125, 0.2845458984375, 0.398895263671875, 0.51324462890625, 0.627593994140625, 0.741943359375, 0.856292724609375, 0.97064208984375, 1.084991455078125, 1.1993408203125, 1.313690185546875, 1.42803955078125, 1.542388916015625, 1.65673828125, 1.771087646484375, 1.88543701171875, 1.999786376953125, 2.1141357421875, 2.228485107421875, 2.34283447265625, 2.457183837890625, 2.571533203125, 2.685882568359375, 2.80023193359375, 2.914581298828125, 3.0289306640625, 3.143280029296875, 3.25762939453125, 3.371978759765625, 3.486328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 1.0, 5.0, 8.0, 5.0, 16.0, 5.0, 23.0, 25.0, 30.0, 31.0, 39.0, 50.0, 65.0, 71.0, 60.0, 63.0, 68.0, 81.0, 57.0, 55.0, 37.0, 38.0, 44.0, 40.0, 27.0, 19.0, 10.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.79296875, -7.53204345703125, -7.2711181640625, -7.01019287109375, -6.749267578125, -6.48834228515625, -6.2274169921875, -5.96649169921875, -5.70556640625, -5.44464111328125, -5.1837158203125, -4.92279052734375, -4.661865234375, -4.40093994140625, -4.1400146484375, -3.87908935546875, -3.6181640625, -3.35723876953125, -3.0963134765625, -2.83538818359375, -2.574462890625, -2.31353759765625, -2.0526123046875, -1.79168701171875, -1.53076171875, -1.26983642578125, -1.0089111328125, -0.74798583984375, -0.487060546875, -0.22613525390625, 0.0347900390625, 0.29571533203125, 0.556640625, 0.81756591796875, 1.0784912109375, 1.33941650390625, 1.600341796875, 1.86126708984375, 2.1221923828125, 2.38311767578125, 2.64404296875, 2.90496826171875, 3.1658935546875, 3.42681884765625, 3.687744140625, 3.94866943359375, 4.2095947265625, 4.47052001953125, 4.7314453125, 4.99237060546875, 5.2532958984375, 5.51422119140625, 5.775146484375, 6.03607177734375, 6.2969970703125, 6.55792236328125, 6.81884765625, 7.07977294921875, 7.3406982421875, 7.60162353515625, 7.862548828125, 8.12347412109375, 8.3843994140625, 8.64532470703125, 8.90625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 8.0, 5.0, 11.0, 14.0, 15.0, 20.0, 26.0, 39.0, 43.0, 91.0, 81.0, 140.0, 168.0, 269.0, 427.0, 1608.0, 223278.0, 816904.0, 3811.0, 566.0, 303.0, 213.0, 136.0, 103.0, 74.0, 56.0, 31.0, 35.0, 5.0, 18.0, 14.0, 16.0, 7.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.015625, -19.41162109375, -18.8076171875, -18.20361328125, -17.599609375, -16.99560546875, -16.3916015625, -15.78759765625, -15.18359375, -14.57958984375, -13.9755859375, -13.37158203125, -12.767578125, -12.16357421875, -11.5595703125, -10.95556640625, -10.3515625, -9.74755859375, -9.1435546875, -8.53955078125, -7.935546875, -7.33154296875, -6.7275390625, -6.12353515625, -5.51953125, -4.91552734375, -4.3115234375, -3.70751953125, -3.103515625, -2.49951171875, -1.8955078125, -1.29150390625, -0.6875, -0.08349609375, 0.5205078125, 1.12451171875, 1.728515625, 2.33251953125, 2.9365234375, 3.54052734375, 4.14453125, 4.74853515625, 5.3525390625, 5.95654296875, 6.560546875, 7.16455078125, 7.7685546875, 8.37255859375, 8.9765625, 9.58056640625, 10.1845703125, 10.78857421875, 11.392578125, 11.99658203125, 12.6005859375, 13.20458984375, 13.80859375, 14.41259765625, 15.0166015625, 15.62060546875, 16.224609375, 16.82861328125, 17.4326171875, 18.03662109375, 18.640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 8.0, 10.0, 2.0, 6.0, 16.0, 8.0, 11.0, 12.0, 26.0, 32.0, 30.0, 27.0, 41.0, 32.0, 34.0, 42.0, 48.0, 52.0, 44.0, 53.0, 39.0, 55.0, 45.0, 39.0, 40.0, 40.0, 32.0, 32.0, 19.0, 26.0, 13.0, 21.0, 14.0, 13.0, 9.0, 13.0, 7.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.46875, -6.26861572265625, -6.0684814453125, -5.86834716796875, -5.668212890625, -5.46807861328125, -5.2679443359375, -5.06781005859375, -4.86767578125, -4.66754150390625, -4.4674072265625, -4.26727294921875, -4.067138671875, -3.86700439453125, -3.6668701171875, -3.46673583984375, -3.2666015625, -3.06646728515625, -2.8663330078125, -2.66619873046875, -2.466064453125, -2.26593017578125, -2.0657958984375, -1.86566162109375, -1.66552734375, -1.46539306640625, -1.2652587890625, -1.06512451171875, -0.864990234375, -0.66485595703125, -0.4647216796875, -0.26458740234375, -0.064453125, 0.13568115234375, 0.3358154296875, 0.53594970703125, 0.736083984375, 0.93621826171875, 1.1363525390625, 1.33648681640625, 1.53662109375, 1.73675537109375, 1.9368896484375, 2.13702392578125, 2.337158203125, 2.53729248046875, 2.7374267578125, 2.93756103515625, 3.1376953125, 3.33782958984375, 3.5379638671875, 3.73809814453125, 3.938232421875, 4.13836669921875, 4.3385009765625, 4.53863525390625, 4.73876953125, 4.93890380859375, 5.1390380859375, 5.33917236328125, 5.539306640625, 5.73944091796875, 5.9395751953125, 6.13970947265625, 6.33984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 15.0, 11.0, 25.0, 42.0, 101.0, 275.0, 1198.0, 18352.0, 1002766.0, 23853.0, 1363.0, 308.0, 102.0, 48.0, 31.0, 20.0, 17.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94140625, -4.779541015625, -4.61767578125, -4.455810546875, -4.2939453125, -4.132080078125, -3.97021484375, -3.808349609375, -3.646484375, -3.484619140625, -3.32275390625, -3.160888671875, -2.9990234375, -2.837158203125, -2.67529296875, -2.513427734375, -2.3515625, -2.189697265625, -2.02783203125, -1.865966796875, -1.7041015625, -1.542236328125, -1.38037109375, -1.218505859375, -1.056640625, -0.894775390625, -0.73291015625, -0.571044921875, -0.4091796875, -0.247314453125, -0.08544921875, 0.076416015625, 0.23828125, 0.400146484375, 0.56201171875, 0.723876953125, 0.8857421875, 1.047607421875, 1.20947265625, 1.371337890625, 1.533203125, 1.695068359375, 1.85693359375, 2.018798828125, 2.1806640625, 2.342529296875, 2.50439453125, 2.666259765625, 2.828125, 2.989990234375, 3.15185546875, 3.313720703125, 3.4755859375, 3.637451171875, 3.79931640625, 3.961181640625, 4.123046875, 4.284912109375, 4.44677734375, 4.608642578125, 4.7705078125, 4.932373046875, 5.09423828125, 5.256103515625, 5.41796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 10.0, 8.0, 24.0, 30.0, 58.0, 75.0, 117.0, 161.0, 148.0, 119.0, 94.0, 59.0, 40.0, 23.0, 9.0, 8.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003769397735595703, -0.0003667697310447693, -0.00035659968852996826, -0.00034642964601516724, -0.0003362596035003662, -0.0003260895609855652, -0.00031591951847076416, -0.00030574947595596313, -0.0002955794334411621, -0.0002854093909263611, -0.00027523934841156006, -0.00026506930589675903, -0.000254899263381958, -0.000244729220867157, -0.00023455917835235596, -0.00022438913583755493, -0.0002142190933227539, -0.00020404905080795288, -0.00019387900829315186, -0.00018370896577835083, -0.0001735389232635498, -0.00016336888074874878, -0.00015319883823394775, -0.00014302879571914673, -0.0001328587532043457, -0.00012268871068954468, -0.00011251866817474365, -0.00010234862565994263, -9.21785831451416e-05, -8.200854063034058e-05, -7.183849811553955e-05, -6.166845560073853e-05, -5.14984130859375e-05, -4.1328370571136475e-05, -3.115832805633545e-05, -2.0988285541534424e-05, -1.0818243026733398e-05, -6.48200511932373e-07, 9.521842002868652e-06, 1.9691884517669678e-05, 2.9861927032470703e-05, 4.003196954727173e-05, 5.0202012062072754e-05, 6.037205457687378e-05, 7.05420970916748e-05, 8.071213960647583e-05, 9.088218212127686e-05, 0.00010105222463607788, 0.0001112222671508789, 0.00012139230966567993, 0.00013156235218048096, 0.00014173239469528198, 0.000151902437210083, 0.00016207247972488403, 0.00017224252223968506, 0.00018241256475448608, 0.0001925826072692871, 0.00020275264978408813, 0.00021292269229888916, 0.00022309273481369019, 0.0002332627773284912, 0.00024343281984329224, 0.00025360286235809326, 0.0002637729048728943, 0.0002739429473876953]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 7.0, 7.0, 8.0, 11.0, 22.0, 38.0, 58.0, 101.0, 201.0, 623.0, 5510.0, 734893.0, 302984.0, 3200.0, 501.0, 172.0, 92.0, 51.0, 22.0, 12.0, 14.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.35546875, -5.206298828125, -5.05712890625, -4.907958984375, -4.7587890625, -4.609619140625, -4.46044921875, -4.311279296875, -4.162109375, -4.012939453125, -3.86376953125, -3.714599609375, -3.5654296875, -3.416259765625, -3.26708984375, -3.117919921875, -2.96875, -2.819580078125, -2.67041015625, -2.521240234375, -2.3720703125, -2.222900390625, -2.07373046875, -1.924560546875, -1.775390625, -1.626220703125, -1.47705078125, -1.327880859375, -1.1787109375, -1.029541015625, -0.88037109375, -0.731201171875, -0.58203125, -0.432861328125, -0.28369140625, -0.134521484375, 0.0146484375, 0.163818359375, 0.31298828125, 0.462158203125, 0.611328125, 0.760498046875, 0.90966796875, 1.058837890625, 1.2080078125, 1.357177734375, 1.50634765625, 1.655517578125, 1.8046875, 1.953857421875, 2.10302734375, 2.252197265625, 2.4013671875, 2.550537109375, 2.69970703125, 2.848876953125, 2.998046875, 3.147216796875, 3.29638671875, 3.445556640625, 3.5947265625, 3.743896484375, 3.89306640625, 4.042236328125, 4.19140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 12.0, 22.0, 33.0, 51.0, 79.0, 114.0, 112.0, 122.0, 127.0, 113.0, 68.0, 48.0, 21.0, 23.0, 11.0, 5.0, 7.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2724609375, -1.24017333984375, -1.2078857421875, -1.17559814453125, -1.143310546875, -1.11102294921875, -1.0787353515625, -1.04644775390625, -1.01416015625, -0.98187255859375, -0.9495849609375, -0.91729736328125, -0.885009765625, -0.85272216796875, -0.8204345703125, -0.78814697265625, -0.755859375, -0.72357177734375, -0.6912841796875, -0.65899658203125, -0.626708984375, -0.59442138671875, -0.5621337890625, -0.52984619140625, -0.49755859375, -0.46527099609375, -0.4329833984375, -0.40069580078125, -0.368408203125, -0.33612060546875, -0.3038330078125, -0.27154541015625, -0.2392578125, -0.20697021484375, -0.1746826171875, -0.14239501953125, -0.110107421875, -0.07781982421875, -0.0455322265625, -0.01324462890625, 0.01904296875, 0.05133056640625, 0.0836181640625, 0.11590576171875, 0.148193359375, 0.18048095703125, 0.2127685546875, 0.24505615234375, 0.27734375, 0.30963134765625, 0.3419189453125, 0.37420654296875, 0.406494140625, 0.43878173828125, 0.4710693359375, 0.50335693359375, 0.53564453125, 0.56793212890625, 0.6002197265625, 0.63250732421875, 0.664794921875, 0.69708251953125, 0.7293701171875, 0.76165771484375, 0.7939453125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 87.0, 517.0, 357.0, 35.0, 8.0, 2.0, 3.0], "bins": [-98.89265441894531, -97.21212005615234, -95.53157806396484, -93.85104370117188, -92.1705093383789, -90.4899673461914, -88.80943298339844, -87.12889099121094, -85.44835662841797, -83.767822265625, -82.0872802734375, -80.40674591064453, -78.72621154785156, -77.04566955566406, -75.3651351928711, -73.68460083007812, -72.00405883789062, -70.32352447509766, -68.64298248291016, -66.96244812011719, -65.28191375732422, -63.60137176513672, -61.92083740234375, -60.240299224853516, -58.55976486206055, -56.87922668457031, -55.198692321777344, -53.51815414428711, -51.837615966796875, -50.157081604003906, -48.47654342651367, -46.79600524902344, -45.1154670715332, -43.43492889404297, -41.75439453125, -40.073856353759766, -38.39331817626953, -36.71278381347656, -35.03224563598633, -33.351707458496094, -31.67116928100586, -29.990633010864258, -28.310094833374023, -26.629558563232422, -24.949020385742188, -23.268484115600586, -21.587947845458984, -19.90740966796875, -18.22687339782715, -16.546337127685547, -14.865798950195312, -13.185262680053711, -11.504724502563477, -9.824188232421875, -8.143651008605957, -6.463113784790039, -4.782576560974121, -3.102039337158203, -1.4215023517608643, 0.2590346336364746, 1.9395718574523926, 3.6201086044311523, 5.30064582824707, 6.981183052062988, 8.661720275878906]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 10.0, 8.0, 10.0, 12.0, 11.0, 21.0, 23.0, 17.0, 21.0, 38.0, 34.0, 41.0, 34.0, 36.0, 40.0, 35.0, 43.0, 53.0, 42.0, 44.0, 42.0, 51.0, 36.0, 47.0, 32.0, 32.0, 27.0, 26.0, 27.0, 16.0, 16.0, 7.0, 12.0, 13.0, 9.0, 9.0, 2.0, 5.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-11.829901695251465, -11.503158569335938, -11.17641544342041, -10.849672317504883, -10.522929191589355, -10.196186065673828, -9.8694429397583, -9.542699813842773, -9.215957641601562, -8.889214515686035, -8.562471389770508, -8.23572826385498, -7.908985137939453, -7.582242012023926, -7.255499362945557, -6.928756237030029, -6.602012634277344, -6.275269508361816, -5.948526382446289, -5.621783256530762, -5.295040130615234, -4.968297004699707, -4.641554355621338, -4.3148112297058105, -3.988068103790283, -3.661324977874756, -3.3345818519592285, -3.0078389644622803, -2.681095838546753, -2.3543527126312256, -2.0276098251342773, -1.70086669921875, -1.374124526977539, -1.0473814010620117, -0.7206383943557739, -0.39389532804489136, -0.06715226173400879, 0.25959086418151855, 0.5863338708877563, 0.9130768775939941, 1.2398200035095215, 1.5665631294250488, 1.8933061361312866, 2.2200491428375244, 2.5467922687530518, 2.873535394668579, 3.2002782821655273, 3.5270214080810547, 3.853764533996582, 4.180507659912109, 4.507250785827637, 4.833993911743164, 5.160737037658691, 5.487480163574219, 5.814222812652588, 6.140965938568115, 6.467709064483643, 6.79445219039917, 7.121195316314697, 7.447938442230225, 7.774681091308594, 8.101424217224121, 8.428167343139648, 8.754910469055176, 9.081653594970703]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 9.0, 13.0, 25.0, 29.0, 41.0, 36.0, 62.0, 107.0, 142.0, 250.0, 350.0, 657.0, 1979.0, 9223.0, 95823.0, 1141574.0, 2439627.0, 462160.0, 33158.0, 6129.0, 1803.0, 484.0, 212.0, 127.0, 80.0, 59.0, 32.0, 19.0, 20.0, 12.0, 12.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.95703125, -7.71807861328125, -7.4791259765625, -7.24017333984375, -7.001220703125, -6.76226806640625, -6.5233154296875, -6.28436279296875, -6.04541015625, -5.80645751953125, -5.5675048828125, -5.32855224609375, -5.089599609375, -4.85064697265625, -4.6116943359375, -4.37274169921875, -4.1337890625, -3.89483642578125, -3.6558837890625, -3.41693115234375, -3.177978515625, -2.93902587890625, -2.7000732421875, -2.46112060546875, -2.22216796875, -1.98321533203125, -1.7442626953125, -1.50531005859375, -1.266357421875, -1.02740478515625, -0.7884521484375, -0.54949951171875, -0.310546875, -0.07159423828125, 0.1673583984375, 0.40631103515625, 0.645263671875, 0.88421630859375, 1.1231689453125, 1.36212158203125, 1.60107421875, 1.84002685546875, 2.0789794921875, 2.31793212890625, 2.556884765625, 2.79583740234375, 3.0347900390625, 3.27374267578125, 3.5126953125, 3.75164794921875, 3.9906005859375, 4.22955322265625, 4.468505859375, 4.70745849609375, 4.9464111328125, 5.18536376953125, 5.42431640625, 5.66326904296875, 5.9022216796875, 6.14117431640625, 6.380126953125, 6.61907958984375, 6.8580322265625, 7.09698486328125, 7.3359375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 7.0, 7.0, 12.0, 17.0, 22.0, 25.0, 30.0, 42.0, 49.0, 57.0, 76.0, 77.0, 76.0, 84.0, 77.0, 67.0, 58.0, 51.0, 38.0, 37.0, 27.0, 23.0, 7.0, 12.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.26361083984375, -8.0194091796875, -7.77520751953125, -7.531005859375, -7.28680419921875, -7.0426025390625, -6.79840087890625, -6.55419921875, -6.30999755859375, -6.0657958984375, -5.82159423828125, -5.577392578125, -5.33319091796875, -5.0889892578125, -4.84478759765625, -4.6005859375, -4.35638427734375, -4.1121826171875, -3.86798095703125, -3.623779296875, -3.37957763671875, -3.1353759765625, -2.89117431640625, -2.64697265625, -2.40277099609375, -2.1585693359375, -1.91436767578125, -1.670166015625, -1.42596435546875, -1.1817626953125, -0.93756103515625, -0.693359375, -0.44915771484375, -0.2049560546875, 0.03924560546875, 0.283447265625, 0.52764892578125, 0.7718505859375, 1.01605224609375, 1.26025390625, 1.50445556640625, 1.7486572265625, 1.99285888671875, 2.237060546875, 2.48126220703125, 2.7254638671875, 2.96966552734375, 3.2138671875, 3.45806884765625, 3.7022705078125, 3.94647216796875, 4.190673828125, 4.43487548828125, 4.6790771484375, 4.92327880859375, 5.16748046875, 5.41168212890625, 5.6558837890625, 5.90008544921875, 6.144287109375, 6.38848876953125, 6.6326904296875, 6.87689208984375, 7.12109375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 8.0, 16.0, 34.0, 56.0, 187.0, 653.0, 8856.0, 4175885.0, 7674.0, 627.0, 159.0, 76.0, 31.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.09375, -42.07958984375, -41.0654296875, -40.05126953125, -39.037109375, -38.02294921875, -37.0087890625, -35.99462890625, -34.98046875, -33.96630859375, -32.9521484375, -31.93798828125, -30.923828125, -29.90966796875, -28.8955078125, -27.88134765625, -26.8671875, -25.85302734375, -24.8388671875, -23.82470703125, -22.810546875, -21.79638671875, -20.7822265625, -19.76806640625, -18.75390625, -17.73974609375, -16.7255859375, -15.71142578125, -14.697265625, -13.68310546875, -12.6689453125, -11.65478515625, -10.640625, -9.62646484375, -8.6123046875, -7.59814453125, -6.583984375, -5.56982421875, -4.5556640625, -3.54150390625, -2.52734375, -1.51318359375, -0.4990234375, 0.51513671875, 1.529296875, 2.54345703125, 3.5576171875, 4.57177734375, 5.5859375, 6.60009765625, 7.6142578125, 8.62841796875, 9.642578125, 10.65673828125, 11.6708984375, 12.68505859375, 13.69921875, 14.71337890625, 15.7275390625, 16.74169921875, 17.755859375, 18.77001953125, 19.7841796875, 20.79833984375, 21.8125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 11.0, 14.0, 17.0, 28.0, 52.0, 81.0, 122.0, 188.0, 345.0, 525.0, 601.0, 694.0, 509.0, 341.0, 182.0, 124.0, 87.0, 39.0, 32.0, 25.0, 9.0, 9.0, 7.0, 7.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.392578125, -2.317840576171875, -2.24310302734375, -2.168365478515625, -2.0936279296875, -2.018890380859375, -1.94415283203125, -1.869415283203125, -1.794677734375, -1.719940185546875, -1.64520263671875, -1.570465087890625, -1.4957275390625, -1.420989990234375, -1.34625244140625, -1.271514892578125, -1.19677734375, -1.122039794921875, -1.04730224609375, -0.972564697265625, -0.8978271484375, -0.823089599609375, -0.74835205078125, -0.673614501953125, -0.598876953125, -0.524139404296875, -0.44940185546875, -0.374664306640625, -0.2999267578125, -0.225189208984375, -0.15045166015625, -0.075714111328125, -0.0009765625, 0.073760986328125, 0.14849853515625, 0.223236083984375, 0.2979736328125, 0.372711181640625, 0.44744873046875, 0.522186279296875, 0.596923828125, 0.671661376953125, 0.74639892578125, 0.821136474609375, 0.8958740234375, 0.970611572265625, 1.04534912109375, 1.120086669921875, 1.19482421875, 1.269561767578125, 1.34429931640625, 1.419036865234375, 1.4937744140625, 1.568511962890625, 1.64324951171875, 1.717987060546875, 1.792724609375, 1.867462158203125, 1.94219970703125, 2.016937255859375, 2.0916748046875, 2.166412353515625, 2.24114990234375, 2.315887451171875, 2.390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 11.0, 22.0, 39.0, 105.0, 171.0, 239.0, 192.0, 127.0, 49.0, 27.0, 16.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.330196380615234, -20.882713317871094, -20.435230255126953, -19.987747192382812, -19.540264129638672, -19.09278106689453, -18.64529800415039, -18.19781494140625, -17.75033187866211, -17.30284881591797, -16.855365753173828, -16.407882690429688, -15.960399627685547, -15.512916564941406, -15.06543254852295, -14.617949485778809, -14.170465469360352, -13.722982406616211, -13.27549934387207, -12.82801628112793, -12.380533218383789, -11.933050155639648, -11.485566139221191, -11.03808307647705, -10.59060001373291, -10.14311695098877, -9.695633888244629, -9.248150825500488, -8.800666809082031, -8.35318374633789, -7.90570068359375, -7.458217620849609, -7.010735511779785, -6.5632524490356445, -6.115769386291504, -5.668285846710205, -5.2208027839660645, -4.773319721221924, -4.325836181640625, -3.8783531188964844, -3.4308700561523438, -2.983386993408203, -2.5359036922454834, -2.0884203910827637, -1.640937328338623, -1.1934542655944824, -0.7459709644317627, -0.29848766326904297, 0.14899539947509766, 0.5964785814285278, 1.043961763381958, 1.4914449453353882, 1.9389281272888184, 2.386411190032959, 2.8338944911956787, 3.2813777923583984, 3.728860855102539, 4.17634391784668, 4.62382698059082, 5.071310520172119, 5.51879358291626, 5.9662766456604, 6.413760185241699, 6.86124324798584, 7.3087263107299805]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 10.0, 6.0, 19.0, 16.0, 18.0, 29.0, 42.0, 54.0, 62.0, 58.0, 73.0, 71.0, 89.0, 78.0, 76.0, 76.0, 54.0, 37.0, 34.0, 27.0, 22.0, 23.0, 11.0, 11.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.096182823181152, -9.820223808288574, -9.54426383972168, -9.268304824829102, -8.992345809936523, -8.716386795043945, -8.44042682647705, -8.164467811584473, -7.888508319854736, -7.612548828125, -7.336589813232422, -7.0606303215026855, -6.784670829772949, -6.508711814880371, -6.232752323150635, -5.956792831420898, -5.68083381652832, -5.404874324798584, -5.128915309906006, -4.8529558181762695, -4.576996803283691, -4.301037311553955, -4.025077819824219, -3.7491185665130615, -3.4731593132019043, -3.197200059890747, -2.92124080657959, -2.6452813148498535, -2.3693220615386963, -2.093362808227539, -1.8174034357070923, -1.5414440631866455, -1.2654838562011719, -0.9895245432853699, -0.7135652303695679, -0.43760591745376587, -0.16164660453796387, 0.11431264877319336, 0.39027202129364014, 0.6662313938140869, 0.9421906471252441, 1.2181499004364014, 1.4941092729568481, 1.770068645477295, 2.046027898788452, 2.3219871520996094, 2.5979466438293457, 2.873905897140503, 3.14986515045166, 3.4258244037628174, 3.7017836570739746, 3.977743148803711, 4.253702163696289, 4.529661655426025, 4.805621147155762, 5.08158016204834, 5.357539653778076, 5.6334991455078125, 5.909458160400391, 6.185417652130127, 6.461377143859863, 6.737336158752441, 7.013295650482178, 7.289255142211914, 7.565214157104492]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 8.0, 8.0, 22.0, 20.0, 34.0, 61.0, 110.0, 222.0, 374.0, 795.0, 2373.0, 11296.0, 117754.0, 829663.0, 74040.0, 8340.0, 1952.0, 691.0, 349.0, 181.0, 91.0, 67.0, 35.0, 22.0, 17.0, 6.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.796356201171875, -1.73529052734375, -1.674224853515625, -1.6131591796875, -1.552093505859375, -1.49102783203125, -1.429962158203125, -1.368896484375, -1.307830810546875, -1.24676513671875, -1.185699462890625, -1.1246337890625, -1.063568115234375, -1.00250244140625, -0.941436767578125, -0.88037109375, -0.819305419921875, -0.75823974609375, -0.697174072265625, -0.6361083984375, -0.575042724609375, -0.51397705078125, -0.452911376953125, -0.391845703125, -0.330780029296875, -0.26971435546875, -0.208648681640625, -0.1475830078125, -0.086517333984375, -0.02545166015625, 0.035614013671875, 0.0966796875, 0.157745361328125, 0.21881103515625, 0.279876708984375, 0.3409423828125, 0.402008056640625, 0.46307373046875, 0.524139404296875, 0.585205078125, 0.646270751953125, 0.70733642578125, 0.768402099609375, 0.8294677734375, 0.890533447265625, 0.95159912109375, 1.012664794921875, 1.07373046875, 1.134796142578125, 1.19586181640625, 1.256927490234375, 1.3179931640625, 1.379058837890625, 1.44012451171875, 1.501190185546875, 1.562255859375, 1.623321533203125, 1.68438720703125, 1.745452880859375, 1.8065185546875, 1.867584228515625, 1.92864990234375, 1.989715576171875, 2.05078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 17.0, 18.0, 20.0, 49.0, 61.0, 75.0, 100.0, 100.0, 123.0, 120.0, 106.0, 62.0, 58.0, 36.0, 22.0, 22.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.35101318359375, -8.0926513671875, -7.83428955078125, -7.575927734375, -7.31756591796875, -7.0592041015625, -6.80084228515625, -6.54248046875, -6.28411865234375, -6.0257568359375, -5.76739501953125, -5.509033203125, -5.25067138671875, -4.9923095703125, -4.73394775390625, -4.4755859375, -4.21722412109375, -3.9588623046875, -3.70050048828125, -3.442138671875, -3.18377685546875, -2.9254150390625, -2.66705322265625, -2.40869140625, -2.15032958984375, -1.8919677734375, -1.63360595703125, -1.375244140625, -1.11688232421875, -0.8585205078125, -0.60015869140625, -0.341796875, -0.08343505859375, 0.1749267578125, 0.43328857421875, 0.691650390625, 0.95001220703125, 1.2083740234375, 1.46673583984375, 1.72509765625, 1.98345947265625, 2.2418212890625, 2.50018310546875, 2.758544921875, 3.01690673828125, 3.2752685546875, 3.53363037109375, 3.7919921875, 4.05035400390625, 4.3087158203125, 4.56707763671875, 4.825439453125, 5.08380126953125, 5.3421630859375, 5.60052490234375, 5.85888671875, 6.11724853515625, 6.3756103515625, 6.63397216796875, 6.892333984375, 7.15069580078125, 7.4090576171875, 7.66741943359375, 7.92578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 10.0, 5.0, 10.0, 18.0, 38.0, 49.0, 81.0, 126.0, 190.0, 376.0, 701.0, 1493.0, 3450.0, 8867.0, 26026.0, 88279.0, 439159.0, 366682.0, 76224.0, 22869.0, 7924.0, 3106.0, 1341.0, 671.0, 374.0, 177.0, 107.0, 69.0, 41.0, 34.0, 17.0, 17.0, 9.0, 10.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84716796875, -0.8214492797851562, -0.7957305908203125, -0.7700119018554688, -0.744293212890625, -0.7185745239257812, -0.6928558349609375, -0.6671371459960938, -0.64141845703125, -0.6156997680664062, -0.5899810791015625, -0.5642623901367188, -0.538543701171875, -0.5128250122070312, -0.4871063232421875, -0.46138763427734375, -0.4356689453125, -0.40995025634765625, -0.3842315673828125, -0.35851287841796875, -0.332794189453125, -0.30707550048828125, -0.2813568115234375, -0.25563812255859375, -0.22991943359375, -0.20420074462890625, -0.1784820556640625, -0.15276336669921875, -0.127044677734375, -0.10132598876953125, -0.0756072998046875, -0.04988861083984375, -0.024169921875, 0.00154876708984375, 0.0272674560546875, 0.05298614501953125, 0.078704833984375, 0.10442352294921875, 0.1301422119140625, 0.15586090087890625, 0.18157958984375, 0.20729827880859375, 0.2330169677734375, 0.25873565673828125, 0.284454345703125, 0.31017303466796875, 0.3358917236328125, 0.36161041259765625, 0.3873291015625, 0.41304779052734375, 0.4387664794921875, 0.46448516845703125, 0.490203857421875, 0.5159225463867188, 0.5416412353515625, 0.5673599243164062, 0.59307861328125, 0.6187973022460938, 0.6445159912109375, 0.6702346801757812, 0.695953369140625, 0.7216720581054688, 0.7473907470703125, 0.7731094360351562, 0.798828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 4.0, 4.0, 11.0, 10.0, 13.0, 17.0, 19.0, 19.0, 27.0, 23.0, 27.0, 26.0, 47.0, 46.0, 50.0, 55.0, 55.0, 49.0, 58.0, 52.0, 33.0, 47.0, 35.0, 43.0, 41.0, 36.0, 27.0, 18.0, 26.0, 16.0, 17.0, 16.0, 14.0, 3.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.31640625, -7.09906005859375, -6.8817138671875, -6.66436767578125, -6.447021484375, -6.22967529296875, -6.0123291015625, -5.79498291015625, -5.57763671875, -5.36029052734375, -5.1429443359375, -4.92559814453125, -4.708251953125, -4.49090576171875, -4.2735595703125, -4.05621337890625, -3.8388671875, -3.62152099609375, -3.4041748046875, -3.18682861328125, -2.969482421875, -2.75213623046875, -2.5347900390625, -2.31744384765625, -2.10009765625, -1.88275146484375, -1.6654052734375, -1.44805908203125, -1.230712890625, -1.01336669921875, -0.7960205078125, -0.57867431640625, -0.361328125, -0.14398193359375, 0.0733642578125, 0.29071044921875, 0.508056640625, 0.72540283203125, 0.9427490234375, 1.16009521484375, 1.37744140625, 1.59478759765625, 1.8121337890625, 2.02947998046875, 2.246826171875, 2.46417236328125, 2.6815185546875, 2.89886474609375, 3.1162109375, 3.33355712890625, 3.5509033203125, 3.76824951171875, 3.985595703125, 4.20294189453125, 4.4202880859375, 4.63763427734375, 4.85498046875, 5.07232666015625, 5.2896728515625, 5.50701904296875, 5.724365234375, 5.94171142578125, 6.1590576171875, 6.37640380859375, 6.59375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 15.0, 15.0, 27.0, 32.0, 65.0, 86.0, 119.0, 175.0, 273.0, 476.0, 719.0, 1375.0, 3187.0, 9412.0, 42808.0, 313744.0, 561226.0, 89061.0, 16444.0, 4806.0, 1999.0, 953.0, 525.0, 311.0, 223.0, 138.0, 97.0, 82.0, 57.0, 26.0, 18.0, 12.0, 8.0, 10.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10784912109375, -0.10402393341064453, -0.10019874572753906, -0.0963735580444336, -0.09254837036132812, -0.08872318267822266, -0.08489799499511719, -0.08107280731201172, -0.07724761962890625, -0.07342243194580078, -0.06959724426269531, -0.06577205657958984, -0.061946868896484375, -0.058121681213378906, -0.05429649353027344, -0.05047130584716797, -0.0466461181640625, -0.04282093048095703, -0.03899574279785156, -0.035170555114746094, -0.031345367431640625, -0.027520179748535156, -0.023694992065429688, -0.01986980438232422, -0.01604461669921875, -0.012219429016113281, -0.008394241333007812, -0.004569053649902344, -0.000743865966796875, 0.0030813217163085938, 0.0069065093994140625, 0.010731697082519531, 0.014556884765625, 0.01838207244873047, 0.022207260131835938, 0.026032447814941406, 0.029857635498046875, 0.033682823181152344, 0.03750801086425781, 0.04133319854736328, 0.04515838623046875, 0.04898357391357422, 0.05280876159667969, 0.056633949279785156, 0.060459136962890625, 0.0642843246459961, 0.06810951232910156, 0.07193470001220703, 0.0757598876953125, 0.07958507537841797, 0.08341026306152344, 0.0872354507446289, 0.09106063842773438, 0.09488582611083984, 0.09871101379394531, 0.10253620147705078, 0.10636138916015625, 0.11018657684326172, 0.11401176452636719, 0.11783695220947266, 0.12166213989257812, 0.1254873275756836, 0.12931251525878906, 0.13313770294189453, 0.136962890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 8.0, 14.0, 10.0, 16.0, 17.0, 33.0, 46.0, 51.0, 63.0, 79.0, 86.0, 75.0, 79.0, 78.0, 59.0, 68.0, 41.0, 42.0, 21.0, 26.0, 21.0, 10.0, 14.0, 8.0, 11.0, 5.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.594160079956055e-05, -3.427267074584961e-05, -3.260374069213867e-05, -3.0934810638427734e-05, -2.9265880584716797e-05, -2.759695053100586e-05, -2.5928020477294922e-05, -2.4259090423583984e-05, -2.2590160369873047e-05, -2.092123031616211e-05, -1.9252300262451172e-05, -1.7583370208740234e-05, -1.5914440155029297e-05, -1.424551010131836e-05, -1.2576580047607422e-05, -1.0907649993896484e-05, -9.238719940185547e-06, -7.569789886474609e-06, -5.900859832763672e-06, -4.231929779052734e-06, -2.562999725341797e-06, -8.940696716308594e-07, 7.748603820800781e-07, 2.4437904357910156e-06, 4.112720489501953e-06, 5.781650543212891e-06, 7.450580596923828e-06, 9.119510650634766e-06, 1.0788440704345703e-05, 1.245737075805664e-05, 1.4126300811767578e-05, 1.5795230865478516e-05, 1.7464160919189453e-05, 1.913309097290039e-05, 2.0802021026611328e-05, 2.2470951080322266e-05, 2.4139881134033203e-05, 2.580881118774414e-05, 2.7477741241455078e-05, 2.9146671295166016e-05, 3.081560134887695e-05, 3.248453140258789e-05, 3.415346145629883e-05, 3.5822391510009766e-05, 3.74913215637207e-05, 3.916025161743164e-05, 4.082918167114258e-05, 4.2498111724853516e-05, 4.416704177856445e-05, 4.583597183227539e-05, 4.750490188598633e-05, 4.9173831939697266e-05, 5.08427619934082e-05, 5.251169204711914e-05, 5.418062210083008e-05, 5.5849552154541016e-05, 5.751848220825195e-05, 5.918741226196289e-05, 6.085634231567383e-05, 6.252527236938477e-05, 6.41942024230957e-05, 6.586313247680664e-05, 6.753206253051758e-05, 6.920099258422852e-05, 7.086992263793945e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 9.0, 17.0, 26.0, 33.0, 75.0, 129.0, 372.0, 1481.0, 13645.0, 585146.0, 434548.0, 11055.0, 1335.0, 358.0, 114.0, 70.0, 46.0, 26.0, 15.0, 7.0, 6.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2081298828125, -0.2006855010986328, -0.19324111938476562, -0.18579673767089844, -0.17835235595703125, -0.17090797424316406, -0.16346359252929688, -0.1560192108154297, -0.1485748291015625, -0.1411304473876953, -0.13368606567382812, -0.12624168395996094, -0.11879730224609375, -0.11135292053222656, -0.10390853881835938, -0.09646415710449219, -0.089019775390625, -0.08157539367675781, -0.07413101196289062, -0.06668663024902344, -0.05924224853515625, -0.05179786682128906, -0.044353485107421875, -0.03690910339355469, -0.0294647216796875, -0.022020339965820312, -0.014575958251953125, -0.0071315765380859375, 0.00031280517578125, 0.0077571868896484375, 0.015201568603515625, 0.022645950317382812, 0.03009033203125, 0.03753471374511719, 0.044979095458984375, 0.05242347717285156, 0.05986785888671875, 0.06731224060058594, 0.07475662231445312, 0.08220100402832031, 0.0896453857421875, 0.09708976745605469, 0.10453414916992188, 0.11197853088378906, 0.11942291259765625, 0.12686729431152344, 0.13431167602539062, 0.1417560577392578, 0.149200439453125, 0.1566448211669922, 0.16408920288085938, 0.17153358459472656, 0.17897796630859375, 0.18642234802246094, 0.19386672973632812, 0.2013111114501953, 0.2087554931640625, 0.2161998748779297, 0.22364425659179688, 0.23108863830566406, 0.23853302001953125, 0.24597740173339844, 0.2534217834472656, 0.2608661651611328, 0.268310546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 13.0, 13.0, 10.0, 20.0, 29.0, 28.0, 46.0, 74.0, 91.0, 100.0, 128.0, 105.0, 71.0, 76.0, 36.0, 30.0, 35.0, 20.0, 21.0, 13.0, 12.0, 5.0, 5.0, 4.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0287933349609375, -0.027785539627075195, -0.02677774429321289, -0.025769948959350586, -0.02476215362548828, -0.023754358291625977, -0.022746562957763672, -0.021738767623901367, -0.020730972290039062, -0.019723176956176758, -0.018715381622314453, -0.01770758628845215, -0.016699790954589844, -0.01569199562072754, -0.014684200286865234, -0.01367640495300293, -0.012668609619140625, -0.01166081428527832, -0.010653018951416016, -0.009645223617553711, -0.008637428283691406, -0.0076296329498291016, -0.006621837615966797, -0.005614042282104492, -0.0046062469482421875, -0.003598451614379883, -0.002590656280517578, -0.0015828609466552734, -0.0005750656127929688, 0.00043272972106933594, 0.0014405250549316406, 0.0024483203887939453, 0.00345611572265625, 0.004463911056518555, 0.005471706390380859, 0.006479501724243164, 0.007487297058105469, 0.008495092391967773, 0.009502887725830078, 0.010510683059692383, 0.011518478393554688, 0.012526273727416992, 0.013534069061279297, 0.014541864395141602, 0.015549659729003906, 0.01655745506286621, 0.017565250396728516, 0.01857304573059082, 0.019580841064453125, 0.02058863639831543, 0.021596431732177734, 0.02260422706604004, 0.023612022399902344, 0.02461981773376465, 0.025627613067626953, 0.026635408401489258, 0.027643203735351562, 0.028650999069213867, 0.029658794403076172, 0.030666589736938477, 0.03167438507080078, 0.032682180404663086, 0.03368997573852539, 0.034697771072387695, 0.03570556640625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 35.0, 578.0, 379.0, 21.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.52688217163086, -56.41836166381836, -55.309837341308594, -54.201316833496094, -53.092796325683594, -51.984275817871094, -50.875755310058594, -49.76723098754883, -48.65871047973633, -47.55018997192383, -46.44166564941406, -45.33314514160156, -44.22462463378906, -43.11610412597656, -42.00758361816406, -40.8990592956543, -39.7905387878418, -38.6820182800293, -37.57349395751953, -36.46497344970703, -35.35645294189453, -34.24793243408203, -33.13941192626953, -32.030887603759766, -30.922367095947266, -29.813846588134766, -28.705324172973633, -27.5968017578125, -26.48828125, -25.3797607421875, -24.271238327026367, -23.162715911865234, -22.05419921875, -20.9456787109375, -19.837156295776367, -18.728633880615234, -17.620113372802734, -16.511592864990234, -15.403070449829102, -14.294548988342285, -13.186027526855469, -12.077506065368652, -10.968984603881836, -9.86046314239502, -8.751941680908203, -7.643420219421387, -6.53489875793457, -5.426377296447754, -4.3178558349609375, -3.209334373474121, -2.1008129119873047, -0.9922914505004883, 0.11623001098632812, 1.2247514724731445, 2.333272933959961, 3.4417943954467773, 4.550315856933594, 5.65883731842041, 6.767358779907227, 7.875880241394043, 8.98440170288086, 10.092923164367676, 11.201444625854492, 12.309966087341309, 13.418487548828125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 8.0, 15.0, 22.0, 18.0, 44.0, 61.0, 81.0, 84.0, 105.0, 110.0, 108.0, 103.0, 72.0, 49.0, 43.0, 27.0, 24.0, 16.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.098264694213867, -7.863068103790283, -7.627871990203857, -7.392675399780273, -7.157479286193848, -6.922282695770264, -6.68708610534668, -6.451889991760254, -6.216693878173828, -5.981497287750244, -5.746301174163818, -5.511104583740234, -5.275908470153809, -5.040711879730225, -4.805515289306641, -4.570319175720215, -4.335122585296631, -4.099925994873047, -3.864729881286621, -3.629533290863037, -3.3943371772766113, -3.1591405868530273, -2.9239442348480225, -2.6887478828430176, -2.4535515308380127, -2.218355178833008, -1.983158826828003, -1.7479623556137085, -1.5127660036087036, -1.2775696516036987, -1.0423731803894043, -0.8071768283843994, -0.5719809532165527, -0.33678457140922546, -0.1015881896018982, 0.13360822200775146, 0.36880457401275635, 0.6040009260177612, 0.8391973972320557, 1.0743937492370605, 1.3095901012420654, 1.5447864532470703, 1.7799828052520752, 2.01517915725708, 2.250375747680664, 2.48557186126709, 2.720768451690674, 2.9559648036956787, 3.1911611557006836, 3.4263575077056885, 3.6615538597106934, 3.8967504501342773, 4.131946563720703, 4.367143154144287, 4.602339744567871, 4.837535858154297, 5.072731971740723, 5.307928562164307, 5.543124675750732, 5.778321266174316, 6.013517379760742, 6.248713970184326, 6.48391056060791, 6.719106674194336, 6.95430326461792]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 6.0, 9.0, 8.0, 16.0, 8.0, 9.0, 27.0, 26.0, 49.0, 50.0, 73.0, 138.0, 240.0, 409.0, 848.0, 2138.0, 6371.0, 25745.0, 114904.0, 364347.0, 374304.0, 120636.0, 27254.0, 6804.0, 2139.0, 883.0, 445.0, 277.0, 112.0, 90.0, 59.0, 40.0, 24.0, 11.0, 8.0, 8.0, 10.0, 6.0, 7.0, 3.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.857421875, -3.733062744140625, -3.60870361328125, -3.484344482421875, -3.3599853515625, -3.235626220703125, -3.11126708984375, -2.986907958984375, -2.862548828125, -2.738189697265625, -2.61383056640625, -2.489471435546875, -2.3651123046875, -2.240753173828125, -2.11639404296875, -1.992034912109375, -1.86767578125, -1.743316650390625, -1.61895751953125, -1.494598388671875, -1.3702392578125, -1.245880126953125, -1.12152099609375, -0.997161865234375, -0.872802734375, -0.748443603515625, -0.62408447265625, -0.499725341796875, -0.3753662109375, -0.251007080078125, -0.12664794921875, -0.002288818359375, 0.1220703125, 0.246429443359375, 0.37078857421875, 0.495147705078125, 0.6195068359375, 0.743865966796875, 0.86822509765625, 0.992584228515625, 1.116943359375, 1.241302490234375, 1.36566162109375, 1.490020751953125, 1.6143798828125, 1.738739013671875, 1.86309814453125, 1.987457275390625, 2.11181640625, 2.236175537109375, 2.36053466796875, 2.484893798828125, 2.6092529296875, 2.733612060546875, 2.85797119140625, 2.982330322265625, 3.106689453125, 3.231048583984375, 3.35540771484375, 3.479766845703125, 3.6041259765625, 3.728485107421875, 3.85284423828125, 3.977203369140625, 4.1015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 17.0, 10.0, 15.0, 22.0, 20.0, 45.0, 47.0, 49.0, 65.0, 65.0, 79.0, 86.0, 102.0, 82.0, 63.0, 52.0, 40.0, 42.0, 22.0, 20.0, 20.0, 15.0, 13.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1875, -10.88934326171875, -10.5911865234375, -10.29302978515625, -9.994873046875, -9.69671630859375, -9.3985595703125, -9.10040283203125, -8.80224609375, -8.50408935546875, -8.2059326171875, -7.90777587890625, -7.609619140625, -7.31146240234375, -7.0133056640625, -6.71514892578125, -6.4169921875, -6.11883544921875, -5.8206787109375, -5.52252197265625, -5.224365234375, -4.92620849609375, -4.6280517578125, -4.32989501953125, -4.03173828125, -3.73358154296875, -3.4354248046875, -3.13726806640625, -2.839111328125, -2.54095458984375, -2.2427978515625, -1.94464111328125, -1.646484375, -1.34832763671875, -1.0501708984375, -0.75201416015625, -0.453857421875, -0.15570068359375, 0.1424560546875, 0.44061279296875, 0.73876953125, 1.03692626953125, 1.3350830078125, 1.63323974609375, 1.931396484375, 2.22955322265625, 2.5277099609375, 2.82586669921875, 3.1240234375, 3.42218017578125, 3.7203369140625, 4.01849365234375, 4.316650390625, 4.61480712890625, 4.9129638671875, 5.21112060546875, 5.50927734375, 5.80743408203125, 6.1055908203125, 6.40374755859375, 6.701904296875, 7.00006103515625, 7.2982177734375, 7.59637451171875, 7.89453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 12.0, 11.0, 27.0, 28.0, 29.0, 62.0, 79.0, 128.0, 146.0, 187.0, 257.0, 302.0, 433.0, 1559.0, 98512.0, 924716.0, 19546.0, 924.0, 367.0, 295.0, 218.0, 200.0, 152.0, 106.0, 71.0, 69.0, 31.0, 24.0, 19.0, 7.0, 8.0, 5.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1484375, -12.72900390625, -12.3095703125, -11.89013671875, -11.470703125, -11.05126953125, -10.6318359375, -10.21240234375, -9.79296875, -9.37353515625, -8.9541015625, -8.53466796875, -8.115234375, -7.69580078125, -7.2763671875, -6.85693359375, -6.4375, -6.01806640625, -5.5986328125, -5.17919921875, -4.759765625, -4.34033203125, -3.9208984375, -3.50146484375, -3.08203125, -2.66259765625, -2.2431640625, -1.82373046875, -1.404296875, -0.98486328125, -0.5654296875, -0.14599609375, 0.2734375, 0.69287109375, 1.1123046875, 1.53173828125, 1.951171875, 2.37060546875, 2.7900390625, 3.20947265625, 3.62890625, 4.04833984375, 4.4677734375, 4.88720703125, 5.306640625, 5.72607421875, 6.1455078125, 6.56494140625, 6.984375, 7.40380859375, 7.8232421875, 8.24267578125, 8.662109375, 9.08154296875, 9.5009765625, 9.92041015625, 10.33984375, 10.75927734375, 11.1787109375, 11.59814453125, 12.017578125, 12.43701171875, 12.8564453125, 13.27587890625, 13.6953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 4.0, 13.0, 8.0, 10.0, 15.0, 18.0, 20.0, 27.0, 37.0, 32.0, 27.0, 46.0, 56.0, 36.0, 43.0, 40.0, 49.0, 57.0, 49.0, 52.0, 42.0, 41.0, 39.0, 34.0, 34.0, 29.0, 27.0, 14.0, 27.0, 11.0, 16.0, 11.0, 5.0, 3.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.57421875, -6.3720703125, -6.169921875, -5.9677734375, -5.765625, -5.5634765625, -5.361328125, -5.1591796875, -4.95703125, -4.7548828125, -4.552734375, -4.3505859375, -4.1484375, -3.9462890625, -3.744140625, -3.5419921875, -3.33984375, -3.1376953125, -2.935546875, -2.7333984375, -2.53125, -2.3291015625, -2.126953125, -1.9248046875, -1.72265625, -1.5205078125, -1.318359375, -1.1162109375, -0.9140625, -0.7119140625, -0.509765625, -0.3076171875, -0.10546875, 0.0966796875, 0.298828125, 0.5009765625, 0.703125, 0.9052734375, 1.107421875, 1.3095703125, 1.51171875, 1.7138671875, 1.916015625, 2.1181640625, 2.3203125, 2.5224609375, 2.724609375, 2.9267578125, 3.12890625, 3.3310546875, 3.533203125, 3.7353515625, 3.9375, 4.1396484375, 4.341796875, 4.5439453125, 4.74609375, 4.9482421875, 5.150390625, 5.3525390625, 5.5546875, 5.7568359375, 5.958984375, 6.1611328125, 6.36328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 20.0, 30.0, 53.0, 99.0, 247.0, 1224.0, 20601.0, 1011802.0, 13100.0, 947.0, 189.0, 85.0, 43.0, 24.0, 14.0, 14.0, 9.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.84765625, -6.64886474609375, -6.4500732421875, -6.25128173828125, -6.052490234375, -5.85369873046875, -5.6549072265625, -5.45611572265625, -5.25732421875, -5.05853271484375, -4.8597412109375, -4.66094970703125, -4.462158203125, -4.26336669921875, -4.0645751953125, -3.86578369140625, -3.6669921875, -3.46820068359375, -3.2694091796875, -3.07061767578125, -2.871826171875, -2.67303466796875, -2.4742431640625, -2.27545166015625, -2.07666015625, -1.87786865234375, -1.6790771484375, -1.48028564453125, -1.281494140625, -1.08270263671875, -0.8839111328125, -0.68511962890625, -0.486328125, -0.28753662109375, -0.0887451171875, 0.11004638671875, 0.308837890625, 0.50762939453125, 0.7064208984375, 0.90521240234375, 1.10400390625, 1.30279541015625, 1.5015869140625, 1.70037841796875, 1.899169921875, 2.09796142578125, 2.2967529296875, 2.49554443359375, 2.6943359375, 2.89312744140625, 3.0919189453125, 3.29071044921875, 3.489501953125, 3.68829345703125, 3.8870849609375, 4.08587646484375, 4.28466796875, 4.48345947265625, 4.6822509765625, 4.88104248046875, 5.079833984375, 5.27862548828125, 5.4774169921875, 5.67620849609375, 5.875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 9.0, 22.0, 22.0, 31.0, 65.0, 74.0, 113.0, 105.0, 154.0, 117.0, 100.0, 63.0, 46.0, 30.0, 11.0, 10.0, 9.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00035071372985839844, -0.0003405176103115082, -0.0003303214907646179, -0.00032012537121772766, -0.0003099292516708374, -0.00029973313212394714, -0.0002895370125770569, -0.0002793408930301666, -0.00026914477348327637, -0.0002589486539363861, -0.00024875253438949585, -0.0002385564148426056, -0.00022836029529571533, -0.00021816417574882507, -0.00020796805620193481, -0.00019777193665504456, -0.0001875758171081543, -0.00017737969756126404, -0.00016718357801437378, -0.00015698745846748352, -0.00014679133892059326, -0.000136595219373703, -0.00012639909982681274, -0.00011620298027992249, -0.00010600686073303223, -9.581074118614197e-05, -8.561462163925171e-05, -7.541850209236145e-05, -6.522238254547119e-05, -5.502626299858093e-05, -4.4830143451690674e-05, -3.4634023904800415e-05, -2.4437904357910156e-05, -1.4241784811019897e-05, -4.045665264129639e-06, 6.15045428276062e-06, 1.634657382965088e-05, 2.6542693376541138e-05, 3.6738812923431396e-05, 4.6934932470321655e-05, 5.7131052017211914e-05, 6.732717156410217e-05, 7.752329111099243e-05, 8.771941065788269e-05, 9.791553020477295e-05, 0.00010811164975166321, 0.00011830776929855347, 0.00012850388884544373, 0.00013870000839233398, 0.00014889612793922424, 0.0001590922474861145, 0.00016928836703300476, 0.00017948448657989502, 0.00018968060612678528, 0.00019987672567367554, 0.0002100728452205658, 0.00022026896476745605, 0.0002304650843143463, 0.00024066120386123657, 0.00025085732340812683, 0.0002610534429550171, 0.00027124956250190735, 0.0002814456820487976, 0.00029164180159568787, 0.0003018379211425781]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 7.0, 12.0, 22.0, 25.0, 59.0, 122.0, 327.0, 1423.0, 54790.0, 985097.0, 5671.0, 593.0, 189.0, 80.0, 47.0, 24.0, 15.0, 9.0, 10.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.9193115234375, -6.697998046875, -6.4766845703125, -6.25537109375, -6.0340576171875, -5.812744140625, -5.5914306640625, -5.3701171875, -5.1488037109375, -4.927490234375, -4.7061767578125, -4.48486328125, -4.2635498046875, -4.042236328125, -3.8209228515625, -3.599609375, -3.3782958984375, -3.156982421875, -2.9356689453125, -2.71435546875, -2.4930419921875, -2.271728515625, -2.0504150390625, -1.8291015625, -1.6077880859375, -1.386474609375, -1.1651611328125, -0.94384765625, -0.7225341796875, -0.501220703125, -0.2799072265625, -0.05859375, 0.1627197265625, 0.384033203125, 0.6053466796875, 0.82666015625, 1.0479736328125, 1.269287109375, 1.4906005859375, 1.7119140625, 1.9332275390625, 2.154541015625, 2.3758544921875, 2.59716796875, 2.8184814453125, 3.039794921875, 3.2611083984375, 3.482421875, 3.7037353515625, 3.925048828125, 4.1463623046875, 4.36767578125, 4.5889892578125, 4.810302734375, 5.0316162109375, 5.2529296875, 5.4742431640625, 5.695556640625, 5.9168701171875, 6.13818359375, 6.3594970703125, 6.580810546875, 6.8021240234375, 7.0234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 9.0, 15.0, 15.0, 33.0, 58.0, 91.0, 142.0, 143.0, 149.0, 133.0, 80.0, 46.0, 29.0, 16.0, 10.0, 10.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.216796875, -1.1760406494140625, -1.135284423828125, -1.0945281982421875, -1.05377197265625, -1.0130157470703125, -0.972259521484375, -0.9315032958984375, -0.8907470703125, -0.8499908447265625, -0.809234619140625, -0.7684783935546875, -0.72772216796875, -0.6869659423828125, -0.646209716796875, -0.6054534912109375, -0.564697265625, -0.5239410400390625, -0.483184814453125, -0.4424285888671875, -0.40167236328125, -0.3609161376953125, -0.320159912109375, -0.2794036865234375, -0.2386474609375, -0.1978912353515625, -0.157135009765625, -0.1163787841796875, -0.07562255859375, -0.0348663330078125, 0.005889892578125, 0.0466461181640625, 0.08740234375, 0.1281585693359375, 0.168914794921875, 0.2096710205078125, 0.25042724609375, 0.2911834716796875, 0.331939697265625, 0.3726959228515625, 0.4134521484375, 0.4542083740234375, 0.494964599609375, 0.5357208251953125, 0.57647705078125, 0.6172332763671875, 0.657989501953125, 0.6987457275390625, 0.739501953125, 0.7802581787109375, 0.821014404296875, 0.8617706298828125, 0.90252685546875, 0.9432830810546875, 0.984039306640625, 1.0247955322265625, 1.0655517578125, 1.1063079833984375, 1.147064208984375, 1.1878204345703125, 1.22857666015625, 1.2693328857421875, 1.310089111328125, 1.3508453369140625, 1.3916015625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 10.0, 23.0, 51.0, 133.0, 183.0, 261.0, 187.0, 99.0, 25.0, 21.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.183883666992188, -25.61830711364746, -25.0527286529541, -24.487152099609375, -23.92157554626465, -23.355998992919922, -22.790420532226562, -22.224843978881836, -21.65926742553711, -21.093690872192383, -20.528112411499023, -19.962535858154297, -19.39695930480957, -18.831382751464844, -18.265804290771484, -17.700227737426758, -17.1346492767334, -16.569072723388672, -16.003494262695312, -15.437917709350586, -14.87234115600586, -14.306763648986816, -13.741186141967773, -13.175609588623047, -12.610032081604004, -12.044454574584961, -11.478878021240234, -10.913300514221191, -10.347723007202148, -9.782146453857422, -9.216568946838379, -8.650991439819336, -8.08541488647461, -7.519837856292725, -6.95426082611084, -6.388683319091797, -5.823106288909912, -5.257529258728027, -4.691951751708984, -4.1263747215271, -3.560797691345215, -2.99522066116333, -2.429643392562866, -1.864066243171692, -1.2984890937805176, -0.7329120635986328, -0.16733479499816895, 0.3982424736022949, 0.9638195037841797, 1.529396653175354, 2.0949738025665283, 2.660551071166992, 3.226128101348877, 3.7917051315307617, 4.357282638549805, 4.9228596687316895, 5.488436698913574, 6.054013729095459, 6.619590759277344, 7.185168266296387, 7.7507452964782715, 8.316322326660156, 8.8818998336792, 9.447477340698242, 10.013053894042969]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 11.0, 15.0, 13.0, 16.0, 23.0, 18.0, 29.0, 40.0, 44.0, 49.0, 54.0, 56.0, 57.0, 56.0, 55.0, 55.0, 54.0, 64.0, 35.0, 46.0, 32.0, 27.0, 29.0, 22.0, 28.0, 17.0, 12.0, 13.0, 13.0, 9.0, 3.0, 6.0, 0.0, 6.0], "bins": [-18.969295501708984, -18.548797607421875, -18.128299713134766, -17.707801818847656, -17.28730583190918, -16.86680793762207, -16.44631004333496, -16.02581214904785, -15.605314254760742, -15.184816360473633, -14.76431941986084, -14.34382152557373, -13.923323631286621, -13.502826690673828, -13.082328796386719, -12.66183090209961, -12.241333961486816, -11.820836067199707, -11.400339126586914, -10.979841232299805, -10.559343338012695, -10.138845443725586, -9.718348503112793, -9.297850608825684, -8.87735366821289, -8.456855773925781, -8.036358833312988, -7.615860939025879, -7.1953630447387695, -6.774865627288818, -6.354368209838867, -5.933870315551758, -5.51337194442749, -5.092874526977539, -4.67237663269043, -4.2518792152404785, -3.8313815593719482, -3.410883903503418, -2.990386486053467, -2.5698888301849365, -2.1493911743164062, -1.728893518447876, -1.3083959817886353, -0.8878984451293945, -0.46740078926086426, -0.046903133392333984, 0.3735942840576172, 0.7940919399261475, 1.2145895957946777, 1.635087251663208, 2.0555849075317383, 2.4760823249816895, 2.8965799808502197, 3.31707763671875, 3.737575054168701, 4.158072471618652, 4.578570365905762, 4.999067783355713, 5.419565677642822, 5.840063095092773, 6.260560989379883, 6.681058406829834, 7.101555824279785, 7.5220537185668945, 7.942551136016846]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 3.0, 7.0, 18.0, 19.0, 26.0, 38.0, 52.0, 65.0, 93.0, 103.0, 205.0, 280.0, 416.0, 785.0, 2596.0, 16843.0, 306680.0, 2339616.0, 1402925.0, 108149.0, 9755.0, 3046.0, 1355.0, 574.0, 231.0, 132.0, 82.0, 46.0, 33.0, 18.0, 19.0, 14.0, 12.0, 10.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.8828125, -7.65643310546875, -7.4300537109375, -7.20367431640625, -6.977294921875, -6.75091552734375, -6.5245361328125, -6.29815673828125, -6.07177734375, -5.84539794921875, -5.6190185546875, -5.39263916015625, -5.166259765625, -4.93988037109375, -4.7135009765625, -4.48712158203125, -4.2607421875, -4.03436279296875, -3.8079833984375, -3.58160400390625, -3.355224609375, -3.12884521484375, -2.9024658203125, -2.67608642578125, -2.44970703125, -2.22332763671875, -1.9969482421875, -1.77056884765625, -1.544189453125, -1.31781005859375, -1.0914306640625, -0.86505126953125, -0.638671875, -0.41229248046875, -0.1859130859375, 0.04046630859375, 0.266845703125, 0.49322509765625, 0.7196044921875, 0.94598388671875, 1.17236328125, 1.39874267578125, 1.6251220703125, 1.85150146484375, 2.077880859375, 2.30426025390625, 2.5306396484375, 2.75701904296875, 2.9833984375, 3.20977783203125, 3.4361572265625, 3.66253662109375, 3.888916015625, 4.11529541015625, 4.3416748046875, 4.56805419921875, 4.79443359375, 5.02081298828125, 5.2471923828125, 5.47357177734375, 5.699951171875, 5.92633056640625, 6.1527099609375, 6.37908935546875, 6.60546875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 20.0, 32.0, 26.0, 39.0, 56.0, 60.0, 88.0, 93.0, 88.0, 95.0, 78.0, 55.0, 74.0, 42.0, 40.0, 33.0, 31.0, 11.0, 13.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.34375, -11.06585693359375, -10.7879638671875, -10.51007080078125, -10.232177734375, -9.95428466796875, -9.6763916015625, -9.39849853515625, -9.12060546875, -8.84271240234375, -8.5648193359375, -8.28692626953125, -8.009033203125, -7.73114013671875, -7.4532470703125, -7.17535400390625, -6.8974609375, -6.61956787109375, -6.3416748046875, -6.06378173828125, -5.785888671875, -5.50799560546875, -5.2301025390625, -4.95220947265625, -4.67431640625, -4.39642333984375, -4.1185302734375, -3.84063720703125, -3.562744140625, -3.28485107421875, -3.0069580078125, -2.72906494140625, -2.451171875, -2.17327880859375, -1.8953857421875, -1.61749267578125, -1.339599609375, -1.06170654296875, -0.7838134765625, -0.50592041015625, -0.22802734375, 0.04986572265625, 0.3277587890625, 0.60565185546875, 0.883544921875, 1.16143798828125, 1.4393310546875, 1.71722412109375, 1.9951171875, 2.27301025390625, 2.5509033203125, 2.82879638671875, 3.106689453125, 3.38458251953125, 3.6624755859375, 3.94036865234375, 4.21826171875, 4.49615478515625, 4.7740478515625, 5.05194091796875, 5.329833984375, 5.60772705078125, 5.8856201171875, 6.16351318359375, 6.44140625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 13.0, 12.0, 26.0, 53.0, 143.0, 420.0, 2351.0, 1973641.0, 2214233.0, 2648.0, 460.0, 151.0, 68.0, 27.0, 17.0, 9.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.828125, -30.968017578125, -30.10791015625, -29.247802734375, -28.3876953125, -27.527587890625, -26.66748046875, -25.807373046875, -24.947265625, -24.087158203125, -23.22705078125, -22.366943359375, -21.5068359375, -20.646728515625, -19.78662109375, -18.926513671875, -18.06640625, -17.206298828125, -16.34619140625, -15.486083984375, -14.6259765625, -13.765869140625, -12.90576171875, -12.045654296875, -11.185546875, -10.325439453125, -9.46533203125, -8.605224609375, -7.7451171875, -6.885009765625, -6.02490234375, -5.164794921875, -4.3046875, -3.444580078125, -2.58447265625, -1.724365234375, -0.8642578125, -0.004150390625, 0.85595703125, 1.716064453125, 2.576171875, 3.436279296875, 4.29638671875, 5.156494140625, 6.0166015625, 6.876708984375, 7.73681640625, 8.596923828125, 9.45703125, 10.317138671875, 11.17724609375, 12.037353515625, 12.8974609375, 13.757568359375, 14.61767578125, 15.477783203125, 16.337890625, 17.197998046875, 18.05810546875, 18.918212890625, 19.7783203125, 20.638427734375, 21.49853515625, 22.358642578125, 23.21875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 18.0, 12.0, 23.0, 42.0, 78.0, 171.0, 291.0, 578.0, 849.0, 860.0, 554.0, 279.0, 142.0, 64.0, 37.0, 19.0, 19.0, 11.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.109375, -4.015899658203125, -3.92242431640625, -3.828948974609375, -3.7354736328125, -3.641998291015625, -3.54852294921875, -3.455047607421875, -3.361572265625, -3.268096923828125, -3.17462158203125, -3.081146240234375, -2.9876708984375, -2.894195556640625, -2.80072021484375, -2.707244873046875, -2.61376953125, -2.520294189453125, -2.42681884765625, -2.333343505859375, -2.2398681640625, -2.146392822265625, -2.05291748046875, -1.959442138671875, -1.865966796875, -1.772491455078125, -1.67901611328125, -1.585540771484375, -1.4920654296875, -1.398590087890625, -1.30511474609375, -1.211639404296875, -1.1181640625, -1.024688720703125, -0.93121337890625, -0.837738037109375, -0.7442626953125, -0.650787353515625, -0.55731201171875, -0.463836669921875, -0.370361328125, -0.276885986328125, -0.18341064453125, -0.089935302734375, 0.0035400390625, 0.097015380859375, 0.19049072265625, 0.283966064453125, 0.37744140625, 0.470916748046875, 0.56439208984375, 0.657867431640625, 0.7513427734375, 0.844818115234375, 0.93829345703125, 1.031768798828125, 1.125244140625, 1.218719482421875, 1.31219482421875, 1.405670166015625, 1.4991455078125, 1.592620849609375, 1.68609619140625, 1.779571533203125, 1.873046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 20.0, 58.0, 121.0, 275.0, 273.0, 165.0, 67.0, 11.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-27.53299331665039, -26.97225570678711, -26.411518096923828, -25.85078239440918, -25.2900447845459, -24.729307174682617, -24.16857147216797, -23.607833862304688, -23.047096252441406, -22.486358642578125, -21.925621032714844, -21.364885330200195, -20.804147720336914, -20.243410110473633, -19.682674407958984, -19.121936798095703, -18.561199188232422, -18.00046157836914, -17.43972396850586, -16.87898826599121, -16.31825065612793, -15.757513046264648, -15.196776390075684, -14.636039733886719, -14.075302124023438, -13.514564514160156, -12.953827857971191, -12.393091201782227, -11.832353591918945, -11.271615982055664, -10.7108793258667, -10.150142669677734, -9.589405059814453, -9.028667449951172, -8.467930793762207, -7.907193660736084, -7.346456527709961, -6.785719394683838, -6.224982261657715, -5.664245128631592, -5.103507995605469, -4.542770862579346, -3.9820337295532227, -3.4212965965270996, -2.8605594635009766, -2.2998223304748535, -1.7390851974487305, -1.1783480644226074, -0.6176109313964844, -0.05687379837036133, 0.5038633346557617, 1.0646004676818848, 1.6253376007080078, 2.186074733734131, 2.746811866760254, 3.307548999786377, 3.8682861328125, 4.429023265838623, 4.989760398864746, 5.550497531890869, 6.111234664916992, 6.671971797943115, 7.232708930969238, 7.793446063995361, 8.354183197021484]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 10.0, 19.0, 18.0, 26.0, 30.0, 52.0, 60.0, 50.0, 64.0, 71.0, 66.0, 68.0, 67.0, 64.0, 84.0, 41.0, 39.0, 37.0, 35.0, 27.0, 25.0, 12.0, 4.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.445375442504883, -9.201064109802246, -8.956751823425293, -8.712440490722656, -8.468128204345703, -8.223816871643066, -7.97950553894043, -7.735193729400635, -7.49088191986084, -7.246570110321045, -7.00225830078125, -6.757946968078613, -6.513635158538818, -6.269323348999023, -6.025012016296387, -5.780700206756592, -5.536388397216797, -5.292076587677002, -5.047764778137207, -4.80345344543457, -4.559141635894775, -4.3148298263549805, -4.070518493652344, -3.826206684112549, -3.581894874572754, -3.337583065032959, -3.093271493911743, -2.8489599227905273, -2.6046481132507324, -2.3603363037109375, -2.1160247325897217, -1.8717130422592163, -1.6274008750915527, -1.3830891847610474, -1.138777494430542, -0.8944658041000366, -0.6501541137695312, -0.4058424234390259, -0.1615307331085205, 0.08278095722198486, 0.32709264755249023, 0.5714043378829956, 0.815716028213501, 1.0600277185440063, 1.3043394088745117, 1.548651099205017, 1.7929627895355225, 2.0372743606567383, 2.281586170196533, 2.525897979736328, 2.770209550857544, 3.0145211219787598, 3.2588329315185547, 3.5031447410583496, 3.7474563121795654, 3.9917678833007812, 4.236079692840576, 4.480391502380371, 4.724702835083008, 4.969014644622803, 5.213326454162598, 5.457638263702393, 5.7019500732421875, 5.946261405944824, 6.190573215484619]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 9.0, 15.0, 17.0, 11.0, 17.0, 31.0, 40.0, 67.0, 88.0, 170.0, 328.0, 815.0, 2178.0, 7268.0, 30527.0, 206711.0, 685156.0, 90529.0, 17335.0, 4547.0, 1443.0, 587.0, 243.0, 140.0, 94.0, 51.0, 31.0, 26.0, 20.0, 14.0, 11.0, 12.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5498046875, -1.5032806396484375, -1.456756591796875, -1.4102325439453125, -1.36370849609375, -1.3171844482421875, -1.270660400390625, -1.2241363525390625, -1.1776123046875, -1.1310882568359375, -1.084564208984375, -1.0380401611328125, -0.99151611328125, -0.9449920654296875, -0.898468017578125, -0.8519439697265625, -0.805419921875, -0.7588958740234375, -0.712371826171875, -0.6658477783203125, -0.61932373046875, -0.5727996826171875, -0.526275634765625, -0.4797515869140625, -0.4332275390625, -0.3867034912109375, -0.340179443359375, -0.2936553955078125, -0.24713134765625, -0.2006072998046875, -0.154083251953125, -0.1075592041015625, -0.06103515625, -0.0145111083984375, 0.032012939453125, 0.0785369873046875, 0.12506103515625, 0.1715850830078125, 0.218109130859375, 0.2646331787109375, 0.3111572265625, 0.3576812744140625, 0.404205322265625, 0.4507293701171875, 0.49725341796875, 0.5437774658203125, 0.590301513671875, 0.6368255615234375, 0.683349609375, 0.7298736572265625, 0.776397705078125, 0.8229217529296875, 0.86944580078125, 0.9159698486328125, 0.962493896484375, 1.0090179443359375, 1.0555419921875, 1.1020660400390625, 1.148590087890625, 1.1951141357421875, 1.24163818359375, 1.2881622314453125, 1.334686279296875, 1.3812103271484375, 1.427734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 15.0, 15.0, 27.0, 49.0, 71.0, 78.0, 110.0, 131.0, 98.0, 91.0, 113.0, 67.0, 42.0, 41.0, 26.0, 10.0, 5.0, 9.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.3416748046875, -8.073974609375, -7.8062744140625, -7.53857421875, -7.2708740234375, -7.003173828125, -6.7354736328125, -6.4677734375, -6.2000732421875, -5.932373046875, -5.6646728515625, -5.39697265625, -5.1292724609375, -4.861572265625, -4.5938720703125, -4.326171875, -4.0584716796875, -3.790771484375, -3.5230712890625, -3.25537109375, -2.9876708984375, -2.719970703125, -2.4522705078125, -2.1845703125, -1.9168701171875, -1.649169921875, -1.3814697265625, -1.11376953125, -0.8460693359375, -0.578369140625, -0.3106689453125, -0.04296875, 0.2247314453125, 0.492431640625, 0.7601318359375, 1.02783203125, 1.2955322265625, 1.563232421875, 1.8309326171875, 2.0986328125, 2.3663330078125, 2.634033203125, 2.9017333984375, 3.16943359375, 3.4371337890625, 3.704833984375, 3.9725341796875, 4.240234375, 4.5079345703125, 4.775634765625, 5.0433349609375, 5.31103515625, 5.5787353515625, 5.846435546875, 6.1141357421875, 6.3818359375, 6.6495361328125, 6.917236328125, 7.1849365234375, 7.45263671875, 7.7203369140625, 7.988037109375, 8.2557373046875, 8.5234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 6.0, 5.0, 17.0, 21.0, 35.0, 43.0, 45.0, 93.0, 119.0, 219.0, 402.0, 649.0, 1236.0, 2488.0, 5031.0, 11778.0, 29562.0, 89312.0, 351454.0, 398787.0, 101053.0, 32583.0, 12727.0, 5359.0, 2566.0, 1249.0, 700.0, 373.0, 225.0, 148.0, 82.0, 47.0, 33.0, 24.0, 30.0, 18.0, 6.0, 3.0, 7.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.83544921875, -0.8109130859375, -0.786376953125, -0.7618408203125, -0.7373046875, -0.7127685546875, -0.688232421875, -0.6636962890625, -0.63916015625, -0.6146240234375, -0.590087890625, -0.5655517578125, -0.541015625, -0.5164794921875, -0.491943359375, -0.4674072265625, -0.44287109375, -0.4183349609375, -0.393798828125, -0.3692626953125, -0.3447265625, -0.3201904296875, -0.295654296875, -0.2711181640625, -0.24658203125, -0.2220458984375, -0.197509765625, -0.1729736328125, -0.1484375, -0.1239013671875, -0.099365234375, -0.0748291015625, -0.05029296875, -0.0257568359375, -0.001220703125, 0.0233154296875, 0.0478515625, 0.0723876953125, 0.096923828125, 0.1214599609375, 0.14599609375, 0.1705322265625, 0.195068359375, 0.2196044921875, 0.244140625, 0.2686767578125, 0.293212890625, 0.3177490234375, 0.34228515625, 0.3668212890625, 0.391357421875, 0.4158935546875, 0.4404296875, 0.4649658203125, 0.489501953125, 0.5140380859375, 0.53857421875, 0.5631103515625, 0.587646484375, 0.6121826171875, 0.63671875, 0.6612548828125, 0.685791015625, 0.7103271484375, 0.73486328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 11.0, 7.0, 5.0, 12.0, 16.0, 15.0, 15.0, 8.0, 27.0, 29.0, 23.0, 42.0, 33.0, 41.0, 41.0, 37.0, 43.0, 39.0, 48.0, 52.0, 45.0, 44.0, 49.0, 37.0, 40.0, 30.0, 49.0, 34.0, 24.0, 20.0, 12.0, 11.0, 8.0, 12.0, 11.0, 7.0, 3.0, 7.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-8.296875, -8.06439208984375, -7.8319091796875, -7.59942626953125, -7.366943359375, -7.13446044921875, -6.9019775390625, -6.66949462890625, -6.43701171875, -6.20452880859375, -5.9720458984375, -5.73956298828125, -5.507080078125, -5.27459716796875, -5.0421142578125, -4.80963134765625, -4.5771484375, -4.34466552734375, -4.1121826171875, -3.87969970703125, -3.647216796875, -3.41473388671875, -3.1822509765625, -2.94976806640625, -2.71728515625, -2.48480224609375, -2.2523193359375, -2.01983642578125, -1.787353515625, -1.55487060546875, -1.3223876953125, -1.08990478515625, -0.857421875, -0.62493896484375, -0.3924560546875, -0.15997314453125, 0.072509765625, 0.30499267578125, 0.5374755859375, 0.76995849609375, 1.00244140625, 1.23492431640625, 1.4674072265625, 1.69989013671875, 1.932373046875, 2.16485595703125, 2.3973388671875, 2.62982177734375, 2.8623046875, 3.09478759765625, 3.3272705078125, 3.55975341796875, 3.792236328125, 4.02471923828125, 4.2572021484375, 4.48968505859375, 4.72216796875, 4.95465087890625, 5.1871337890625, 5.41961669921875, 5.652099609375, 5.88458251953125, 6.1170654296875, 6.34954833984375, 6.58203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 13.0, 15.0, 30.0, 43.0, 59.0, 74.0, 110.0, 167.0, 271.0, 422.0, 679.0, 1375.0, 2817.0, 7321.0, 24373.0, 158426.0, 703990.0, 116150.0, 20123.0, 6443.0, 2625.0, 1252.0, 628.0, 382.0, 229.0, 169.0, 98.0, 73.0, 73.0, 33.0, 33.0, 15.0, 14.0, 9.0, 1.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2108154296875, -0.204315185546875, -0.19781494140625, -0.191314697265625, -0.184814453125, -0.178314208984375, -0.17181396484375, -0.165313720703125, -0.1588134765625, -0.152313232421875, -0.14581298828125, -0.139312744140625, -0.1328125, -0.126312255859375, -0.11981201171875, -0.113311767578125, -0.1068115234375, -0.100311279296875, -0.09381103515625, -0.087310791015625, -0.080810546875, -0.074310302734375, -0.06781005859375, -0.061309814453125, -0.0548095703125, -0.048309326171875, -0.04180908203125, -0.035308837890625, -0.02880859375, -0.022308349609375, -0.01580810546875, -0.009307861328125, -0.0028076171875, 0.003692626953125, 0.01019287109375, 0.016693115234375, 0.023193359375, 0.029693603515625, 0.03619384765625, 0.042694091796875, 0.0491943359375, 0.055694580078125, 0.06219482421875, 0.068695068359375, 0.0751953125, 0.081695556640625, 0.08819580078125, 0.094696044921875, 0.1011962890625, 0.107696533203125, 0.11419677734375, 0.120697021484375, 0.127197265625, 0.133697509765625, 0.14019775390625, 0.146697998046875, 0.1531982421875, 0.159698486328125, 0.16619873046875, 0.172698974609375, 0.17919921875, 0.185699462890625, 0.19219970703125, 0.198699951171875, 0.2052001953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 8.0, 8.0, 10.0, 14.0, 17.0, 17.0, 20.0, 45.0, 51.0, 60.0, 71.0, 79.0, 95.0, 115.0, 72.0, 78.0, 69.0, 41.0, 31.0, 30.0, 16.0, 7.0, 11.0, 5.0, 3.0, 4.0, 3.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12275505065918e-05, -6.884988397359848e-05, -6.647221744060516e-05, -6.409455090761185e-05, -6.171688437461853e-05, -5.9339217841625214e-05, -5.69615513086319e-05, -5.458388477563858e-05, -5.2206218242645264e-05, -4.982855170965195e-05, -4.745088517665863e-05, -4.5073218643665314e-05, -4.2695552110672e-05, -4.031788557767868e-05, -3.7940219044685364e-05, -3.556255251169205e-05, -3.318488597869873e-05, -3.0807219445705414e-05, -2.8429552912712097e-05, -2.605188637971878e-05, -2.3674219846725464e-05, -2.1296553313732147e-05, -1.891888678073883e-05, -1.6541220247745514e-05, -1.4163553714752197e-05, -1.178588718175888e-05, -9.408220648765564e-06, -7.030554115772247e-06, -4.652887582778931e-06, -2.275221049785614e-06, 1.0244548320770264e-07, 2.4801120162010193e-06, 4.857778549194336e-06, 7.235445082187653e-06, 9.61311161518097e-06, 1.1990778148174286e-05, 1.4368444681167603e-05, 1.674611121416092e-05, 1.9123777747154236e-05, 2.1501444280147552e-05, 2.387911081314087e-05, 2.6256777346134186e-05, 2.8634443879127502e-05, 3.101211041212082e-05, 3.3389776945114136e-05, 3.576744347810745e-05, 3.814511001110077e-05, 4.0522776544094086e-05, 4.29004430770874e-05, 4.527810961008072e-05, 4.7655776143074036e-05, 5.003344267606735e-05, 5.241110920906067e-05, 5.4788775742053986e-05, 5.71664422750473e-05, 5.954410880804062e-05, 6.192177534103394e-05, 6.429944187402725e-05, 6.667710840702057e-05, 6.905477494001389e-05, 7.14324414730072e-05, 7.381010800600052e-05, 7.618777453899384e-05, 7.856544107198715e-05, 8.094310760498047e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 1.0, 8.0, 5.0, 8.0, 14.0, 22.0, 17.0, 28.0, 30.0, 59.0, 82.0, 147.0, 367.0, 1204.0, 6815.0, 79033.0, 893106.0, 59886.0, 5812.0, 1133.0, 320.0, 172.0, 90.0, 50.0, 41.0, 27.0, 21.0, 10.0, 11.0, 11.0, 4.0, 5.0, 6.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30126953125, -0.2910423278808594, -0.28081512451171875, -0.2705879211425781, -0.2603607177734375, -0.2501335144042969, -0.23990631103515625, -0.22967910766601562, -0.219451904296875, -0.20922470092773438, -0.19899749755859375, -0.18877029418945312, -0.1785430908203125, -0.16831588745117188, -0.15808868408203125, -0.14786148071289062, -0.13763427734375, -0.12740707397460938, -0.11717987060546875, -0.10695266723632812, -0.0967254638671875, -0.08649826049804688, -0.07627105712890625, -0.06604385375976562, -0.055816650390625, -0.045589447021484375, -0.03536224365234375, -0.025135040283203125, -0.0149078369140625, -0.004680633544921875, 0.00554656982421875, 0.015773773193359375, 0.0260009765625, 0.036228179931640625, 0.04645538330078125, 0.056682586669921875, 0.0669097900390625, 0.07713699340820312, 0.08736419677734375, 0.09759140014648438, 0.107818603515625, 0.11804580688476562, 0.12827301025390625, 0.13850021362304688, 0.1487274169921875, 0.15895462036132812, 0.16918182373046875, 0.17940902709960938, 0.18963623046875, 0.19986343383789062, 0.21009063720703125, 0.22031784057617188, 0.2305450439453125, 0.24077224731445312, 0.25099945068359375, 0.2612266540527344, 0.271453857421875, 0.2816810607910156, 0.29190826416015625, 0.3021354675292969, 0.3123626708984375, 0.3225898742675781, 0.33281707763671875, 0.3430442810058594, 0.353271484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 11.0, 7.0, 8.0, 16.0, 16.0, 19.0, 30.0, 38.0, 59.0, 99.0, 156.0, 153.0, 111.0, 72.0, 29.0, 30.0, 26.0, 19.0, 12.0, 14.0, 6.0, 9.0, 9.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.056304931640625, -0.05443239212036133, -0.052559852600097656, -0.050687313079833984, -0.04881477355957031, -0.04694223403930664, -0.04506969451904297, -0.0431971549987793, -0.041324615478515625, -0.03945207595825195, -0.03757953643798828, -0.03570699691772461, -0.03383445739746094, -0.031961917877197266, -0.030089378356933594, -0.028216838836669922, -0.02634429931640625, -0.024471759796142578, -0.022599220275878906, -0.020726680755615234, -0.018854141235351562, -0.01698160171508789, -0.015109062194824219, -0.013236522674560547, -0.011363983154296875, -0.009491443634033203, -0.007618904113769531, -0.005746364593505859, -0.0038738250732421875, -0.0020012855529785156, -0.00012874603271484375, 0.0017437934875488281, 0.0036163330078125, 0.005488872528076172, 0.007361412048339844, 0.009233951568603516, 0.011106491088867188, 0.01297903060913086, 0.014851570129394531, 0.016724109649658203, 0.018596649169921875, 0.020469188690185547, 0.02234172821044922, 0.02421426773071289, 0.026086807250976562, 0.027959346771240234, 0.029831886291503906, 0.03170442581176758, 0.03357696533203125, 0.03544950485229492, 0.037322044372558594, 0.039194583892822266, 0.04106712341308594, 0.04293966293334961, 0.04481220245361328, 0.04668474197387695, 0.048557281494140625, 0.0504298210144043, 0.05230236053466797, 0.05417490005493164, 0.05604743957519531, 0.057919979095458984, 0.059792518615722656, 0.06166505813598633, 0.06353759765625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 91.0, 835.0, 83.0, 3.0, 0.0, 2.0, 3.0], "bins": [-78.94815063476562, -77.5982666015625, -76.2483901977539, -74.89850616455078, -73.54862976074219, -72.19874572753906, -70.84886932373047, -69.49898529052734, -68.14910888671875, -66.79922485351562, -65.44934844970703, -64.0994644165039, -62.74958801269531, -61.39970397949219, -60.04982376098633, -58.69994354248047, -57.350059509277344, -56.000179290771484, -54.650299072265625, -53.300418853759766, -51.950538635253906, -50.60065460205078, -49.25077438354492, -47.90089416503906, -46.5510139465332, -45.201133728027344, -43.851253509521484, -42.501373291015625, -41.1514892578125, -39.80160903930664, -38.45172882080078, -37.10184860229492, -35.75196838378906, -34.4020881652832, -33.052207946777344, -31.70232582092285, -30.352445602416992, -29.002565383911133, -27.65268325805664, -26.30280303955078, -24.952922821044922, -23.603042602539062, -22.253162384033203, -20.90328025817871, -19.55340003967285, -18.203519821166992, -16.8536376953125, -15.50375747680664, -14.153877258300781, -12.803997039794922, -11.454115867614746, -10.10423469543457, -8.754354476928711, -7.404473781585693, -6.054593086242676, -4.7047119140625, -3.354832172393799, -2.0049514770507812, -0.6550707817077637, 0.6948099136352539, 2.0446906089782715, 3.394571304321289, 4.744451999664307, 6.094333171844482, 7.444213390350342]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 12.0, 16.0, 27.0, 37.0, 64.0, 68.0, 80.0, 90.0, 99.0, 79.0, 84.0, 99.0, 65.0, 45.0, 42.0, 32.0, 24.0, 9.0, 7.0, 10.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.058536529541016, -7.840708255767822, -7.622880458831787, -7.405052185058594, -7.187224388122559, -6.969396114349365, -6.75156831741333, -6.533740043640137, -6.315912246704102, -6.098083972930908, -5.880256175994873, -5.66242790222168, -5.4446001052856445, -5.226771831512451, -5.008944034576416, -4.791115760803223, -4.5732879638671875, -4.355459690093994, -4.137631893157959, -3.9198038578033447, -3.7019758224487305, -3.484147548675537, -3.266319751739502, -3.0484914779663086, -2.8306632041931152, -2.612835168838501, -2.3950071334838867, -2.1771790981292725, -1.9593510627746582, -1.7415229082107544, -1.5236948728561401, -1.3058668375015259, -1.0880389213562012, -0.8702108860015869, -0.6523828506469727, -0.4345547556877136, -0.21672672033309937, 0.001101374626159668, 0.21892940998077393, 0.4367574453353882, 0.6545854806900024, 0.8724135160446167, 1.090241551399231, 1.3080697059631348, 1.525897741317749, 1.7437257766723633, 1.9615538120269775, 2.179381847381592, 2.397209882736206, 2.6150379180908203, 2.8328659534454346, 3.050693988800049, 3.268522024154663, 3.4863500595092773, 3.7041783332824707, 3.922006130218506, 4.139834403991699, 4.357662677764893, 4.575490474700928, 4.793318748474121, 5.011146545410156, 5.22897481918335, 5.446802616119385, 5.664630889892578, 5.882458686828613]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 8.0, 19.0, 37.0, 54.0, 93.0, 156.0, 275.0, 525.0, 1183.0, 3905.0, 19086.0, 123178.0, 488675.0, 336438.0, 60642.0, 9866.0, 2498.0, 897.0, 438.0, 225.0, 123.0, 64.0, 51.0, 40.0, 22.0, 19.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.754058837890625, -4.61749267578125, -4.480926513671875, -4.3443603515625, -4.207794189453125, -4.07122802734375, -3.934661865234375, -3.798095703125, -3.661529541015625, -3.52496337890625, -3.388397216796875, -3.2518310546875, -3.115264892578125, -2.97869873046875, -2.842132568359375, -2.70556640625, -2.569000244140625, -2.43243408203125, -2.295867919921875, -2.1593017578125, -2.022735595703125, -1.88616943359375, -1.749603271484375, -1.613037109375, -1.476470947265625, -1.33990478515625, -1.203338623046875, -1.0667724609375, -0.930206298828125, -0.79364013671875, -0.657073974609375, -0.5205078125, -0.383941650390625, -0.24737548828125, -0.110809326171875, 0.0257568359375, 0.162322998046875, 0.29888916015625, 0.435455322265625, 0.572021484375, 0.708587646484375, 0.84515380859375, 0.981719970703125, 1.1182861328125, 1.254852294921875, 1.39141845703125, 1.527984619140625, 1.66455078125, 1.801116943359375, 1.93768310546875, 2.074249267578125, 2.2108154296875, 2.347381591796875, 2.48394775390625, 2.620513916015625, 2.757080078125, 2.893646240234375, 3.03021240234375, 3.166778564453125, 3.3033447265625, 3.439910888671875, 3.57647705078125, 3.713043212890625, 3.849609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 9.0, 5.0, 13.0, 23.0, 23.0, 26.0, 37.0, 41.0, 57.0, 66.0, 72.0, 64.0, 57.0, 66.0, 65.0, 78.0, 67.0, 52.0, 30.0, 32.0, 25.0, 35.0, 14.0, 14.0, 9.0, 5.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.6328125, -10.344970703125, -10.05712890625, -9.769287109375, -9.4814453125, -9.193603515625, -8.90576171875, -8.617919921875, -8.330078125, -8.042236328125, -7.75439453125, -7.466552734375, -7.1787109375, -6.890869140625, -6.60302734375, -6.315185546875, -6.02734375, -5.739501953125, -5.45166015625, -5.163818359375, -4.8759765625, -4.588134765625, -4.30029296875, -4.012451171875, -3.724609375, -3.436767578125, -3.14892578125, -2.861083984375, -2.5732421875, -2.285400390625, -1.99755859375, -1.709716796875, -1.421875, -1.134033203125, -0.84619140625, -0.558349609375, -0.2705078125, 0.017333984375, 0.30517578125, 0.593017578125, 0.880859375, 1.168701171875, 1.45654296875, 1.744384765625, 2.0322265625, 2.320068359375, 2.60791015625, 2.895751953125, 3.18359375, 3.471435546875, 3.75927734375, 4.047119140625, 4.3349609375, 4.622802734375, 4.91064453125, 5.198486328125, 5.486328125, 5.774169921875, 6.06201171875, 6.349853515625, 6.6376953125, 6.925537109375, 7.21337890625, 7.501220703125, 7.7890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 5.0, 4.0, 6.0, 14.0, 10.0, 24.0, 26.0, 23.0, 51.0, 60.0, 70.0, 103.0, 118.0, 166.0, 221.0, 417.0, 859.0, 7322.0, 663473.0, 369365.0, 4264.0, 709.0, 363.0, 234.0, 166.0, 116.0, 83.0, 85.0, 51.0, 30.0, 23.0, 28.0, 20.0, 6.0, 8.0, 11.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.079833984375, -9.69091796875, -9.302001953125, -8.9130859375, -8.524169921875, -8.13525390625, -7.746337890625, -7.357421875, -6.968505859375, -6.57958984375, -6.190673828125, -5.8017578125, -5.412841796875, -5.02392578125, -4.635009765625, -4.24609375, -3.857177734375, -3.46826171875, -3.079345703125, -2.6904296875, -2.301513671875, -1.91259765625, -1.523681640625, -1.134765625, -0.745849609375, -0.35693359375, 0.031982421875, 0.4208984375, 0.809814453125, 1.19873046875, 1.587646484375, 1.9765625, 2.365478515625, 2.75439453125, 3.143310546875, 3.5322265625, 3.921142578125, 4.31005859375, 4.698974609375, 5.087890625, 5.476806640625, 5.86572265625, 6.254638671875, 6.6435546875, 7.032470703125, 7.42138671875, 7.810302734375, 8.19921875, 8.588134765625, 8.97705078125, 9.365966796875, 9.7548828125, 10.143798828125, 10.53271484375, 10.921630859375, 11.310546875, 11.699462890625, 12.08837890625, 12.477294921875, 12.8662109375, 13.255126953125, 13.64404296875, 14.032958984375, 14.421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 7.0, 3.0, 8.0, 11.0, 8.0, 10.0, 24.0, 20.0, 25.0, 23.0, 31.0, 42.0, 48.0, 38.0, 49.0, 47.0, 52.0, 48.0, 52.0, 59.0, 50.0, 31.0, 46.0, 39.0, 34.0, 26.0, 35.0, 25.0, 11.0, 9.0, 10.0, 16.0, 10.0, 10.0, 13.0, 6.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.015625, -7.761962890625, -7.50830078125, -7.254638671875, -7.0009765625, -6.747314453125, -6.49365234375, -6.239990234375, -5.986328125, -5.732666015625, -5.47900390625, -5.225341796875, -4.9716796875, -4.718017578125, -4.46435546875, -4.210693359375, -3.95703125, -3.703369140625, -3.44970703125, -3.196044921875, -2.9423828125, -2.688720703125, -2.43505859375, -2.181396484375, -1.927734375, -1.674072265625, -1.42041015625, -1.166748046875, -0.9130859375, -0.659423828125, -0.40576171875, -0.152099609375, 0.1015625, 0.355224609375, 0.60888671875, 0.862548828125, 1.1162109375, 1.369873046875, 1.62353515625, 1.877197265625, 2.130859375, 2.384521484375, 2.63818359375, 2.891845703125, 3.1455078125, 3.399169921875, 3.65283203125, 3.906494140625, 4.16015625, 4.413818359375, 4.66748046875, 4.921142578125, 5.1748046875, 5.428466796875, 5.68212890625, 5.935791015625, 6.189453125, 6.443115234375, 6.69677734375, 6.950439453125, 7.2041015625, 7.457763671875, 7.71142578125, 7.965087890625, 8.21875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 8.0, 4.0, 6.0, 2.0, 14.0, 21.0, 52.0, 108.0, 439.0, 3531.0, 970222.0, 72326.0, 1422.0, 230.0, 91.0, 35.0, 13.0, 7.0, 7.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.26165771484375, -6.9803466796875, -6.69903564453125, -6.417724609375, -6.13641357421875, -5.8551025390625, -5.57379150390625, -5.29248046875, -5.01116943359375, -4.7298583984375, -4.44854736328125, -4.167236328125, -3.88592529296875, -3.6046142578125, -3.32330322265625, -3.0419921875, -2.76068115234375, -2.4793701171875, -2.19805908203125, -1.916748046875, -1.63543701171875, -1.3541259765625, -1.07281494140625, -0.79150390625, -0.51019287109375, -0.2288818359375, 0.05242919921875, 0.333740234375, 0.61505126953125, 0.8963623046875, 1.17767333984375, 1.458984375, 1.74029541015625, 2.0216064453125, 2.30291748046875, 2.584228515625, 2.86553955078125, 3.1468505859375, 3.42816162109375, 3.70947265625, 3.99078369140625, 4.2720947265625, 4.55340576171875, 4.834716796875, 5.11602783203125, 5.3973388671875, 5.67864990234375, 5.9599609375, 6.24127197265625, 6.5225830078125, 6.80389404296875, 7.085205078125, 7.36651611328125, 7.6478271484375, 7.92913818359375, 8.21044921875, 8.49176025390625, 8.7730712890625, 9.05438232421875, 9.335693359375, 9.61700439453125, 9.8983154296875, 10.17962646484375, 10.4609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 10.0, 20.0, 45.0, 66.0, 74.0, 111.0, 143.0, 124.0, 114.0, 100.0, 55.0, 46.0, 26.0, 20.0, 8.0, 6.0, 3.0, 2.0, 8.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026106834411621094, -0.00025036558508872986, -0.00023966282606124878, -0.0002289600670337677, -0.00021825730800628662, -0.00020755454897880554, -0.00019685178995132446, -0.00018614903092384338, -0.0001754462718963623, -0.00016474351286888123, -0.00015404075384140015, -0.00014333799481391907, -0.000132635235786438, -0.00012193247675895691, -0.00011122971773147583, -0.00010052695870399475, -8.982419967651367e-05, -7.912144064903259e-05, -6.841868162155151e-05, -5.7715922594070435e-05, -4.7013163566589355e-05, -3.6310404539108276e-05, -2.5607645511627197e-05, -1.4904886484146118e-05, -4.202127456665039e-06, 6.50063157081604e-06, 1.720339059829712e-05, 2.7906149625778198e-05, 3.860890865325928e-05, 4.9311667680740356e-05, 6.0014426708221436e-05, 7.071718573570251e-05, 8.14199447631836e-05, 9.212270379066467e-05, 0.00010282546281814575, 0.00011352822184562683, 0.0001242309808731079, 0.000134933739900589, 0.00014563649892807007, 0.00015633925795555115, 0.00016704201698303223, 0.0001777447760105133, 0.00018844753503799438, 0.00019915029406547546, 0.00020985305309295654, 0.00022055581212043762, 0.0002312585711479187, 0.00024196133017539978, 0.00025266408920288086, 0.00026336684823036194, 0.000274069607257843, 0.0002847723662853241, 0.0002954751253128052, 0.00030617788434028625, 0.00031688064336776733, 0.0003275834023952484, 0.0003382861614227295, 0.00034898892045021057, 0.00035969167947769165, 0.00037039443850517273, 0.0003810971975326538, 0.0003917999565601349, 0.00040250271558761597, 0.00041320547461509705, 0.0004239082336425781]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 3.0, 10.0, 10.0, 15.0, 28.0, 53.0, 124.0, 389.0, 2129.0, 183755.0, 857548.0, 3657.0, 520.0, 135.0, 72.0, 30.0, 20.0, 9.0, 3.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.890625, -6.636474609375, -6.38232421875, -6.128173828125, -5.8740234375, -5.619873046875, -5.36572265625, -5.111572265625, -4.857421875, -4.603271484375, -4.34912109375, -4.094970703125, -3.8408203125, -3.586669921875, -3.33251953125, -3.078369140625, -2.82421875, -2.570068359375, -2.31591796875, -2.061767578125, -1.8076171875, -1.553466796875, -1.29931640625, -1.045166015625, -0.791015625, -0.536865234375, -0.28271484375, -0.028564453125, 0.2255859375, 0.479736328125, 0.73388671875, 0.988037109375, 1.2421875, 1.496337890625, 1.75048828125, 2.004638671875, 2.2587890625, 2.512939453125, 2.76708984375, 3.021240234375, 3.275390625, 3.529541015625, 3.78369140625, 4.037841796875, 4.2919921875, 4.546142578125, 4.80029296875, 5.054443359375, 5.30859375, 5.562744140625, 5.81689453125, 6.071044921875, 6.3251953125, 6.579345703125, 6.83349609375, 7.087646484375, 7.341796875, 7.595947265625, 7.85009765625, 8.104248046875, 8.3583984375, 8.612548828125, 8.86669921875, 9.120849609375, 9.375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 11.0, 17.0, 39.0, 54.0, 107.0, 134.0, 199.0, 154.0, 103.0, 73.0, 50.0, 13.0, 10.0, 6.0, 3.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.666015625, -1.620574951171875, -1.57513427734375, -1.529693603515625, -1.4842529296875, -1.438812255859375, -1.39337158203125, -1.347930908203125, -1.302490234375, -1.257049560546875, -1.21160888671875, -1.166168212890625, -1.1207275390625, -1.075286865234375, -1.02984619140625, -0.984405517578125, -0.93896484375, -0.893524169921875, -0.84808349609375, -0.802642822265625, -0.7572021484375, -0.711761474609375, -0.66632080078125, -0.620880126953125, -0.575439453125, -0.529998779296875, -0.48455810546875, -0.439117431640625, -0.3936767578125, -0.348236083984375, -0.30279541015625, -0.257354736328125, -0.2119140625, -0.166473388671875, -0.12103271484375, -0.075592041015625, -0.0301513671875, 0.015289306640625, 0.06072998046875, 0.106170654296875, 0.151611328125, 0.197052001953125, 0.24249267578125, 0.287933349609375, 0.3333740234375, 0.378814697265625, 0.42425537109375, 0.469696044921875, 0.51513671875, 0.560577392578125, 0.60601806640625, 0.651458740234375, 0.6968994140625, 0.742340087890625, 0.78778076171875, 0.833221435546875, 0.878662109375, 0.924102783203125, 0.96954345703125, 1.014984130859375, 1.0604248046875, 1.105865478515625, 1.15130615234375, 1.196746826171875, 1.2421875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 28.0, 73.0, 241.0, 359.0, 206.0, 68.0, 21.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.40581130981445, -39.5704231262207, -38.73503112792969, -37.89964294433594, -37.06425476074219, -36.22886276245117, -35.39347457885742, -34.55808639526367, -33.722694396972656, -32.887306213378906, -32.05191421508789, -31.21652603149414, -30.381135940551758, -29.545745849609375, -28.710357666015625, -27.874967575073242, -27.039579391479492, -26.20418930053711, -25.36880111694336, -24.533411026000977, -23.698020935058594, -22.862632751464844, -22.02724266052246, -21.191852569580078, -20.356464385986328, -19.521074295043945, -18.685686111450195, -17.850296020507812, -17.01490592956543, -16.179515838623047, -15.344127655029297, -14.508737564086914, -13.673347473144531, -12.837958335876465, -12.002568244934082, -11.167179107666016, -10.331789016723633, -9.496399879455566, -8.6610107421875, -7.825621128082275, -6.990231513977051, -6.154841899871826, -5.319452285766602, -4.484063148498535, -3.6486735343933105, -2.813283920288086, -1.9778947830200195, -1.142505168914795, -0.3071155548095703, 0.5282739400863647, 1.3636634349822998, 2.1990528106689453, 3.03444242477417, 3.8698320388793945, 4.705221176147461, 5.5406107902526855, 6.37600040435791, 7.211390018463135, 8.04677963256836, 8.882168769836426, 9.717557907104492, 10.552947998046875, 11.388337135314941, 12.223726272583008, 13.05911636352539]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 11.0, 7.0, 5.0, 11.0, 21.0, 26.0, 25.0, 25.0, 27.0, 41.0, 44.0, 41.0, 43.0, 42.0, 46.0, 48.0, 58.0, 39.0, 53.0, 32.0, 34.0, 39.0, 30.0, 39.0, 26.0, 33.0, 28.0, 24.0, 18.0, 12.0, 11.0, 13.0, 6.0, 10.0, 10.0, 2.0, 2.0, 5.0, 3.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.744174003601074, -14.337994575500488, -13.931814193725586, -13.525634765625, -13.119455337524414, -12.713275909423828, -12.307096481323242, -11.90091609954834, -11.494736671447754, -11.088557243347168, -10.682376861572266, -10.27619743347168, -9.870018005371094, -9.463838577270508, -9.057659149169922, -8.65147876739502, -8.245299339294434, -7.839119911193848, -7.4329400062561035, -7.026760101318359, -6.620580673217773, -6.2144012451171875, -5.808221340179443, -5.402041435241699, -4.995862007141113, -4.589682579040527, -4.183502674102783, -3.777323007583618, -3.371143341064453, -2.964963674545288, -2.558784008026123, -2.152604341506958, -1.7464256286621094, -1.3402459621429443, -0.9340662956237793, -0.5278866291046143, -0.12170696258544922, 0.2844727039337158, 0.6906523704528809, 1.096832036972046, 1.503011703491211, 1.909191370010376, 2.315371036529541, 2.721550703048706, 3.127730369567871, 3.533910036087036, 3.940089702606201, 4.346269607543945, 4.752449035644531, 5.158628463745117, 5.564808368682861, 5.9709882736206055, 6.377167701721191, 6.783347129821777, 7.1895270347595215, 7.595706939697266, 8.001886367797852, 8.408065795898438, 8.814245223999023, 9.220425605773926, 9.626605033874512, 10.032784461975098, 10.43896484375, 10.845144271850586, 11.251323699951172]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 11.0, 17.0, 9.0, 22.0, 21.0, 56.0, 80.0, 107.0, 186.0, 339.0, 594.0, 994.0, 2643.0, 70942.0, 2725357.0, 1365135.0, 22649.0, 3370.0, 1117.0, 291.0, 145.0, 71.0, 48.0, 29.0, 21.0, 3.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.546875, -8.203125, -7.859375, -7.515625, -7.171875, -6.828125, -6.484375, -6.140625, -5.796875, -5.453125, -5.109375, -4.765625, -4.421875, -4.078125, -3.734375, -3.390625, -3.046875, -2.703125, -2.359375, -2.015625, -1.671875, -1.328125, -0.984375, -0.640625, -0.296875, 0.046875, 0.390625, 0.734375, 1.078125, 1.421875, 1.765625, 2.109375, 2.453125, 2.796875, 3.140625, 3.484375, 3.828125, 4.171875, 4.515625, 4.859375, 5.203125, 5.546875, 5.890625, 6.234375, 6.578125, 6.921875, 7.265625, 7.609375, 7.953125, 8.296875, 8.640625, 8.984375, 9.328125, 9.671875, 10.015625, 10.359375, 10.703125, 11.046875, 11.390625, 11.734375, 12.078125, 12.421875, 12.765625, 13.109375, 13.453125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 15.0, 21.0, 35.0, 47.0, 80.0, 102.0, 100.0, 110.0, 110.0, 93.0, 65.0, 76.0, 54.0, 34.0, 19.0, 12.0, 12.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.25, -9.9287109375, -9.607421875, -9.2861328125, -8.96484375, -8.6435546875, -8.322265625, -8.0009765625, -7.6796875, -7.3583984375, -7.037109375, -6.7158203125, -6.39453125, -6.0732421875, -5.751953125, -5.4306640625, -5.109375, -4.7880859375, -4.466796875, -4.1455078125, -3.82421875, -3.5029296875, -3.181640625, -2.8603515625, -2.5390625, -2.2177734375, -1.896484375, -1.5751953125, -1.25390625, -0.9326171875, -0.611328125, -0.2900390625, 0.03125, 0.3525390625, 0.673828125, 0.9951171875, 1.31640625, 1.6376953125, 1.958984375, 2.2802734375, 2.6015625, 2.9228515625, 3.244140625, 3.5654296875, 3.88671875, 4.2080078125, 4.529296875, 4.8505859375, 5.171875, 5.4931640625, 5.814453125, 6.1357421875, 6.45703125, 6.7783203125, 7.099609375, 7.4208984375, 7.7421875, 8.0634765625, 8.384765625, 8.7060546875, 9.02734375, 9.3486328125, 9.669921875, 9.9912109375, 10.3125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 13.0, 17.0, 23.0, 36.0, 56.0, 134.0, 230.0, 535.0, 1515.0, 8166.0, 734603.0, 3426284.0, 19011.0, 2307.0, 684.0, 267.0, 123.0, 71.0, 65.0, 40.0, 21.0, 16.0, 16.0, 14.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.9453125, -14.54296875, -14.140625, -13.73828125, -13.3359375, -12.93359375, -12.53125, -12.12890625, -11.7265625, -11.32421875, -10.921875, -10.51953125, -10.1171875, -9.71484375, -9.3125, -8.91015625, -8.5078125, -8.10546875, -7.703125, -7.30078125, -6.8984375, -6.49609375, -6.09375, -5.69140625, -5.2890625, -4.88671875, -4.484375, -4.08203125, -3.6796875, -3.27734375, -2.875, -2.47265625, -2.0703125, -1.66796875, -1.265625, -0.86328125, -0.4609375, -0.05859375, 0.34375, 0.74609375, 1.1484375, 1.55078125, 1.953125, 2.35546875, 2.7578125, 3.16015625, 3.5625, 3.96484375, 4.3671875, 4.76953125, 5.171875, 5.57421875, 5.9765625, 6.37890625, 6.78125, 7.18359375, 7.5859375, 7.98828125, 8.390625, 8.79296875, 9.1953125, 9.59765625, 10.0, 10.40234375, 10.8046875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 13.0, 8.0, 9.0, 7.0, 17.0, 30.0, 52.0, 89.0, 173.0, 290.0, 460.0, 630.0, 719.0, 636.0, 361.0, 239.0, 129.0, 69.0, 40.0, 33.0, 16.0, 10.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7900390625, -1.7192840576171875, -1.648529052734375, -1.5777740478515625, -1.50701904296875, -1.4362640380859375, -1.365509033203125, -1.2947540283203125, -1.2239990234375, -1.1532440185546875, -1.082489013671875, -1.0117340087890625, -0.94097900390625, -0.8702239990234375, -0.799468994140625, -0.7287139892578125, -0.657958984375, -0.5872039794921875, -0.516448974609375, -0.4456939697265625, -0.37493896484375, -0.3041839599609375, -0.233428955078125, -0.1626739501953125, -0.0919189453125, -0.0211639404296875, 0.049591064453125, 0.1203460693359375, 0.19110107421875, 0.2618560791015625, 0.332611083984375, 0.4033660888671875, 0.47412109375, 0.5448760986328125, 0.615631103515625, 0.6863861083984375, 0.75714111328125, 0.8278961181640625, 0.898651123046875, 0.9694061279296875, 1.0401611328125, 1.1109161376953125, 1.181671142578125, 1.2524261474609375, 1.32318115234375, 1.3939361572265625, 1.464691162109375, 1.5354461669921875, 1.606201171875, 1.6769561767578125, 1.747711181640625, 1.8184661865234375, 1.88922119140625, 1.9599761962890625, 2.030731201171875, 2.1014862060546875, 2.1722412109375, 2.2429962158203125, 2.313751220703125, 2.3845062255859375, 2.45526123046875, 2.5260162353515625, 2.596771240234375, 2.6675262451171875, 2.73828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 15.0, 46.0, 141.0, 266.0, 291.0, 169.0, 51.0, 19.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.991241455078125, -26.41790771484375, -25.844573974609375, -25.271238327026367, -24.697904586791992, -24.124570846557617, -23.551237106323242, -22.977903366088867, -22.40456771850586, -21.831233978271484, -21.25790023803711, -20.6845645904541, -20.111230850219727, -19.53789710998535, -18.964563369750977, -18.3912296295166, -17.817895889282227, -17.24456214904785, -16.671228408813477, -16.09789276123047, -15.524559020996094, -14.951225280761719, -14.377891540527344, -13.804557800292969, -13.231223106384277, -12.657889366149902, -12.084554672241211, -11.511220932006836, -10.937887191772461, -10.36455249786377, -9.791218757629395, -9.217884063720703, -8.644550323486328, -8.071216583251953, -7.497881889343262, -6.924548149108887, -6.3512139320373535, -5.77787971496582, -5.204545974731445, -4.631211757659912, -4.057877540588379, -3.4845433235168457, -2.9112093448638916, -2.3378753662109375, -1.7645411491394043, -1.191206932067871, -0.617872953414917, -0.04453897476196289, 0.5287952423095703, 1.102129340171814, 1.6754634380340576, 2.2487974166870117, 2.822131633758545, 3.395465850830078, 3.9687998294830322, 4.542133808135986, 5.1154680252075195, 5.688802242279053, 6.262136459350586, 6.835470199584961, 7.408804416656494, 7.982138633728027, 8.555472373962402, 9.128807067871094, 9.702140808105469]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 11.0, 16.0, 15.0, 22.0, 19.0, 38.0, 42.0, 56.0, 54.0, 66.0, 91.0, 61.0, 79.0, 65.0, 68.0, 63.0, 40.0, 46.0, 37.0, 26.0, 29.0, 18.0, 18.0, 12.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.690203666687012, -8.46125316619873, -8.232301712036133, -8.003351211547852, -7.77440071105957, -7.545450210571289, -7.31649923324585, -7.08754825592041, -6.858597755432129, -6.629647254943848, -6.400696277618408, -6.171745300292969, -5.9427947998046875, -5.713844299316406, -5.484893321990967, -5.255942344665527, -5.026991844177246, -4.798041343688965, -4.569090366363525, -4.340139389038086, -4.111188888549805, -3.8822381496429443, -3.653287410736084, -3.4243366718292236, -3.1953859329223633, -2.966435194015503, -2.7374844551086426, -2.5085337162017822, -2.279582977294922, -2.0506322383880615, -1.8216814994812012, -1.5927307605743408, -1.3637804985046387, -1.1348297595977783, -0.905879020690918, -0.6769282817840576, -0.44797754287719727, -0.21902680397033691, 0.009923934936523438, 0.2388746738433838, 0.46782541275024414, 0.6967761516571045, 0.9257268905639648, 1.1546776294708252, 1.3836283683776855, 1.612579107284546, 1.8415298461914062, 2.0704805850982666, 2.299431324005127, 2.5283820629119873, 2.7573328018188477, 2.986283540725708, 3.2152342796325684, 3.4441850185394287, 3.673135757446289, 3.9020864963531494, 4.13103723526001, 4.359988212585449, 4.5889387130737305, 4.817889213562012, 5.046840190887451, 5.275791168212891, 5.504741668701172, 5.733692169189453, 5.962643146514893]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 11.0, 14.0, 13.0, 27.0, 20.0, 46.0, 64.0, 98.0, 173.0, 279.0, 506.0, 929.0, 2279.0, 5979.0, 18535.0, 73112.0, 449466.0, 404181.0, 65617.0, 17270.0, 5630.0, 2099.0, 963.0, 476.0, 277.0, 147.0, 94.0, 59.0, 51.0, 35.0, 24.0, 19.0, 9.0, 12.0, 6.0, 8.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9140625, -0.8835601806640625, -0.853057861328125, -0.8225555419921875, -0.79205322265625, -0.7615509033203125, -0.731048583984375, -0.7005462646484375, -0.6700439453125, -0.6395416259765625, -0.609039306640625, -0.5785369873046875, -0.54803466796875, -0.5175323486328125, -0.487030029296875, -0.4565277099609375, -0.426025390625, -0.3955230712890625, -0.365020751953125, -0.3345184326171875, -0.30401611328125, -0.2735137939453125, -0.243011474609375, -0.2125091552734375, -0.1820068359375, -0.1515045166015625, -0.121002197265625, -0.0904998779296875, -0.05999755859375, -0.0294952392578125, 0.001007080078125, 0.0315093994140625, 0.06201171875, 0.0925140380859375, 0.123016357421875, 0.1535186767578125, 0.18402099609375, 0.2145233154296875, 0.245025634765625, 0.2755279541015625, 0.3060302734375, 0.3365325927734375, 0.367034912109375, 0.3975372314453125, 0.42803955078125, 0.4585418701171875, 0.489044189453125, 0.5195465087890625, 0.550048828125, 0.5805511474609375, 0.611053466796875, 0.6415557861328125, 0.67205810546875, 0.7025604248046875, 0.733062744140625, 0.7635650634765625, 0.7940673828125, 0.8245697021484375, 0.855072021484375, 0.8855743408203125, 0.91607666015625, 0.9465789794921875, 0.977081298828125, 1.0075836181640625, 1.0380859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 9.0, 14.0, 24.0, 26.0, 48.0, 48.0, 76.0, 79.0, 114.0, 82.0, 100.0, 94.0, 55.0, 58.0, 61.0, 38.0, 23.0, 23.0, 13.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.46484375, -7.26702880859375, -7.0692138671875, -6.87139892578125, -6.673583984375, -6.47576904296875, -6.2779541015625, -6.08013916015625, -5.88232421875, -5.68450927734375, -5.4866943359375, -5.28887939453125, -5.091064453125, -4.89324951171875, -4.6954345703125, -4.49761962890625, -4.2998046875, -4.10198974609375, -3.9041748046875, -3.70635986328125, -3.508544921875, -3.31072998046875, -3.1129150390625, -2.91510009765625, -2.71728515625, -2.51947021484375, -2.3216552734375, -2.12384033203125, -1.926025390625, -1.72821044921875, -1.5303955078125, -1.33258056640625, -1.134765625, -0.93695068359375, -0.7391357421875, -0.54132080078125, -0.343505859375, -0.14569091796875, 0.0521240234375, 0.24993896484375, 0.44775390625, 0.64556884765625, 0.8433837890625, 1.04119873046875, 1.239013671875, 1.43682861328125, 1.6346435546875, 1.83245849609375, 2.0302734375, 2.22808837890625, 2.4259033203125, 2.62371826171875, 2.821533203125, 3.01934814453125, 3.2171630859375, 3.41497802734375, 3.61279296875, 3.81060791015625, 4.0084228515625, 4.20623779296875, 4.404052734375, 4.60186767578125, 4.7996826171875, 4.99749755859375, 5.1953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 8.0, 3.0, 11.0, 20.0, 20.0, 28.0, 42.0, 79.0, 114.0, 173.0, 344.0, 656.0, 1299.0, 2693.0, 6564.0, 17148.0, 52724.0, 211198.0, 541290.0, 150046.0, 40496.0, 13667.0, 5303.0, 2283.0, 1037.0, 574.0, 288.0, 153.0, 114.0, 65.0, 34.0, 29.0, 13.0, 11.0, 9.0, 7.0, 11.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.70379638671875, -0.6781005859375, -0.65240478515625, -0.626708984375, -0.60101318359375, -0.5753173828125, -0.54962158203125, -0.52392578125, -0.49822998046875, -0.4725341796875, -0.44683837890625, -0.421142578125, -0.39544677734375, -0.3697509765625, -0.34405517578125, -0.318359375, -0.29266357421875, -0.2669677734375, -0.24127197265625, -0.215576171875, -0.18988037109375, -0.1641845703125, -0.13848876953125, -0.11279296875, -0.08709716796875, -0.0614013671875, -0.03570556640625, -0.010009765625, 0.01568603515625, 0.0413818359375, 0.06707763671875, 0.0927734375, 0.11846923828125, 0.1441650390625, 0.16986083984375, 0.195556640625, 0.22125244140625, 0.2469482421875, 0.27264404296875, 0.29833984375, 0.32403564453125, 0.3497314453125, 0.37542724609375, 0.401123046875, 0.42681884765625, 0.4525146484375, 0.47821044921875, 0.50390625, 0.52960205078125, 0.5552978515625, 0.58099365234375, 0.606689453125, 0.63238525390625, 0.6580810546875, 0.68377685546875, 0.70947265625, 0.73516845703125, 0.7608642578125, 0.78656005859375, 0.812255859375, 0.83795166015625, 0.8636474609375, 0.88934326171875, 0.9150390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 4.0, 6.0, 7.0, 10.0, 24.0, 17.0, 21.0, 14.0, 31.0, 33.0, 34.0, 42.0, 45.0, 42.0, 63.0, 54.0, 56.0, 48.0, 49.0, 47.0, 36.0, 52.0, 37.0, 37.0, 42.0, 27.0, 24.0, 13.0, 13.0, 15.0, 13.0, 12.0, 3.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.71636962890625, -6.4757080078125, -6.23504638671875, -5.994384765625, -5.75372314453125, -5.5130615234375, -5.27239990234375, -5.03173828125, -4.79107666015625, -4.5504150390625, -4.30975341796875, -4.069091796875, -3.82843017578125, -3.5877685546875, -3.34710693359375, -3.1064453125, -2.86578369140625, -2.6251220703125, -2.38446044921875, -2.143798828125, -1.90313720703125, -1.6624755859375, -1.42181396484375, -1.18115234375, -0.94049072265625, -0.6998291015625, -0.45916748046875, -0.218505859375, 0.02215576171875, 0.2628173828125, 0.50347900390625, 0.744140625, 0.98480224609375, 1.2254638671875, 1.46612548828125, 1.706787109375, 1.94744873046875, 2.1881103515625, 2.42877197265625, 2.66943359375, 2.91009521484375, 3.1507568359375, 3.39141845703125, 3.632080078125, 3.87274169921875, 4.1134033203125, 4.35406494140625, 4.5947265625, 4.83538818359375, 5.0760498046875, 5.31671142578125, 5.557373046875, 5.79803466796875, 6.0386962890625, 6.27935791015625, 6.52001953125, 6.76068115234375, 7.0013427734375, 7.24200439453125, 7.482666015625, 7.72332763671875, 7.9639892578125, 8.20465087890625, 8.4453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 13.0, 20.0, 46.0, 42.0, 63.0, 94.0, 165.0, 283.0, 405.0, 726.0, 1279.0, 2478.0, 5805.0, 17589.0, 78159.0, 531938.0, 337510.0, 49956.0, 12577.0, 4523.0, 2073.0, 1102.0, 643.0, 376.0, 223.0, 155.0, 106.0, 73.0, 42.0, 35.0, 18.0, 16.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1611328125, -0.1559123992919922, -0.15069198608398438, -0.14547157287597656, -0.14025115966796875, -0.13503074645996094, -0.12981033325195312, -0.12458992004394531, -0.1193695068359375, -0.11414909362792969, -0.10892868041992188, -0.10370826721191406, -0.09848785400390625, -0.09326744079589844, -0.08804702758789062, -0.08282661437988281, -0.077606201171875, -0.07238578796386719, -0.06716537475585938, -0.06194496154785156, -0.05672454833984375, -0.05150413513183594, -0.046283721923828125, -0.04106330871582031, -0.0358428955078125, -0.030622482299804688, -0.025402069091796875, -0.020181655883789062, -0.01496124267578125, -0.009740829467773438, -0.004520416259765625, 0.0006999969482421875, 0.00592041015625, 0.011140823364257812, 0.016361236572265625, 0.021581649780273438, 0.02680206298828125, 0.03202247619628906, 0.037242889404296875, 0.04246330261230469, 0.0476837158203125, 0.05290412902832031, 0.058124542236328125, 0.06334495544433594, 0.06856536865234375, 0.07378578186035156, 0.07900619506835938, 0.08422660827636719, 0.089447021484375, 0.09466743469238281, 0.09988784790039062, 0.10510826110839844, 0.11032867431640625, 0.11554908752441406, 0.12076950073242188, 0.1259899139404297, 0.1312103271484375, 0.1364307403564453, 0.14165115356445312, 0.14687156677246094, 0.15209197998046875, 0.15731239318847656, 0.16253280639648438, 0.1677532196044922, 0.1729736328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 11.0, 5.0, 15.0, 15.0, 25.0, 22.0, 41.0, 48.0, 78.0, 81.0, 107.0, 123.0, 94.0, 102.0, 45.0, 41.0, 30.0, 34.0, 16.0, 13.0, 17.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.49826431274414e-05, -7.280055433511734e-05, -7.061846554279327e-05, -6.843637675046921e-05, -6.625428795814514e-05, -6.407219916582108e-05, -6.189011037349701e-05, -5.970802158117294e-05, -5.752593278884888e-05, -5.534384399652481e-05, -5.3161755204200745e-05, -5.097966641187668e-05, -4.879757761955261e-05, -4.6615488827228546e-05, -4.443340003490448e-05, -4.2251311242580414e-05, -4.006922245025635e-05, -3.788713365793228e-05, -3.5705044865608215e-05, -3.352295607328415e-05, -3.134086728096008e-05, -2.9158778488636017e-05, -2.697668969631195e-05, -2.4794600903987885e-05, -2.261251211166382e-05, -2.0430423319339752e-05, -1.8248334527015686e-05, -1.606624573469162e-05, -1.3884156942367554e-05, -1.1702068150043488e-05, -9.519979357719421e-06, -7.337890565395355e-06, -5.155801773071289e-06, -2.973712980747223e-06, -7.916241884231567e-07, 1.3904646039009094e-06, 3.5725533962249756e-06, 5.754642188549042e-06, 7.936730980873108e-06, 1.0118819773197174e-05, 1.230090856552124e-05, 1.4482997357845306e-05, 1.6665086150169373e-05, 1.884717494249344e-05, 2.1029263734817505e-05, 2.321135252714157e-05, 2.5393441319465637e-05, 2.7575530111789703e-05, 2.975761890411377e-05, 3.1939707696437836e-05, 3.41217964887619e-05, 3.630388528108597e-05, 3.8485974073410034e-05, 4.06680628657341e-05, 4.2850151658058167e-05, 4.503224045038223e-05, 4.72143292427063e-05, 4.9396418035030365e-05, 5.157850682735443e-05, 5.37605956196785e-05, 5.5942684412002563e-05, 5.812477320432663e-05, 6.0306861996650696e-05, 6.248895078897476e-05, 6.467103958129883e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 0.0, 7.0, 6.0, 13.0, 16.0, 21.0, 9.0, 36.0, 37.0, 57.0, 86.0, 124.0, 172.0, 312.0, 547.0, 1112.0, 2559.0, 8413.0, 37155.0, 304203.0, 598338.0, 74701.0, 13599.0, 3851.0, 1442.0, 687.0, 331.0, 223.0, 119.0, 93.0, 65.0, 56.0, 38.0, 31.0, 21.0, 18.0, 11.0, 10.0, 4.0, 5.0, 9.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1534423828125, -0.1483592987060547, -0.14327621459960938, -0.13819313049316406, -0.13311004638671875, -0.12802696228027344, -0.12294387817382812, -0.11786079406738281, -0.1127777099609375, -0.10769462585449219, -0.10261154174804688, -0.09752845764160156, -0.09244537353515625, -0.08736228942871094, -0.08227920532226562, -0.07719612121582031, -0.072113037109375, -0.06702995300292969, -0.061946868896484375, -0.05686378479003906, -0.05178070068359375, -0.04669761657714844, -0.041614532470703125, -0.03653144836425781, -0.0314483642578125, -0.026365280151367188, -0.021282196044921875, -0.016199111938476562, -0.01111602783203125, -0.0060329437255859375, -0.000949859619140625, 0.0041332244873046875, 0.00921630859375, 0.014299392700195312, 0.019382476806640625, 0.024465560913085938, 0.02954864501953125, 0.03463172912597656, 0.039714813232421875, 0.04479789733886719, 0.0498809814453125, 0.05496406555175781, 0.060047149658203125, 0.06513023376464844, 0.07021331787109375, 0.07529640197753906, 0.08037948608398438, 0.08546257019042969, 0.090545654296875, 0.09562873840332031, 0.10071182250976562, 0.10579490661621094, 0.11087799072265625, 0.11596107482910156, 0.12104415893554688, 0.1261272430419922, 0.1312103271484375, 0.1362934112548828, 0.14137649536132812, 0.14645957946777344, 0.15154266357421875, 0.15662574768066406, 0.16170883178710938, 0.1667919158935547, 0.171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 2.0, 9.0, 9.0, 10.0, 8.0, 23.0, 13.0, 17.0, 34.0, 36.0, 52.0, 51.0, 53.0, 75.0, 67.0, 78.0, 76.0, 59.0, 49.0, 45.0, 40.0, 35.0, 36.0, 23.0, 24.0, 13.0, 19.0, 9.0, 9.0, 5.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.047454833984375, -0.046109676361083984, -0.04476451873779297, -0.04341936111450195, -0.04207420349121094, -0.04072904586791992, -0.039383888244628906, -0.03803873062133789, -0.036693572998046875, -0.03534841537475586, -0.034003257751464844, -0.03265810012817383, -0.03131294250488281, -0.029967784881591797, -0.02862262725830078, -0.027277469635009766, -0.02593231201171875, -0.024587154388427734, -0.02324199676513672, -0.021896839141845703, -0.020551681518554688, -0.019206523895263672, -0.017861366271972656, -0.01651620864868164, -0.015171051025390625, -0.01382589340209961, -0.012480735778808594, -0.011135578155517578, -0.009790420532226562, -0.008445262908935547, -0.007100105285644531, -0.005754947662353516, -0.0044097900390625, -0.0030646324157714844, -0.0017194747924804688, -0.0003743171691894531, 0.0009708404541015625, 0.002315998077392578, 0.0036611557006835938, 0.005006313323974609, 0.006351470947265625, 0.007696628570556641, 0.009041786193847656, 0.010386943817138672, 0.011732101440429688, 0.013077259063720703, 0.014422416687011719, 0.015767574310302734, 0.01711273193359375, 0.018457889556884766, 0.01980304718017578, 0.021148204803466797, 0.022493362426757812, 0.023838520050048828, 0.025183677673339844, 0.02652883529663086, 0.027873992919921875, 0.02921915054321289, 0.030564308166503906, 0.03190946578979492, 0.03325462341308594, 0.03459978103637695, 0.03594493865966797, 0.037290096282958984, 0.03863525390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 28.0, 688.0, 288.0, 10.0, 1.0, 1.0, 1.0, 3.0], "bins": [-70.49104309082031, -69.27152252197266, -68.05200958251953, -66.83248901367188, -65.61297607421875, -64.3934555053711, -63.1739387512207, -61.95442199707031, -60.734901428222656, -59.515384674072266, -58.295867919921875, -57.07634735107422, -55.85683059692383, -54.63731384277344, -53.41779708862305, -52.198280334472656, -50.978759765625, -49.75924301147461, -48.53972625732422, -47.32020568847656, -46.10068893432617, -44.88117218017578, -43.66165542602539, -42.442138671875, -41.22262191772461, -40.00310516357422, -38.78358840942383, -37.56406784057617, -36.34455108642578, -35.12503433227539, -33.905517578125, -32.685997009277344, -31.466482162475586, -30.246965408325195, -29.027446746826172, -27.80792999267578, -26.588411331176758, -25.368894577026367, -24.149375915527344, -22.929859161376953, -21.710342407226562, -20.490825653076172, -19.27130699157715, -18.051790237426758, -16.832271575927734, -15.612754821777344, -14.393237113952637, -13.17371940612793, -11.954200744628906, -10.7346830368042, -9.515165328979492, -8.295648574829102, -7.076130390167236, -5.856612682342529, -4.6370954513549805, -3.4175777435302734, -2.1980605125427246, -0.9785429239273071, 0.24097466468811035, 1.4604921340942383, 2.6800098419189453, 3.8995275497436523, 5.119044780731201, 6.338562488555908, 7.558080196380615]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 17.0, 21.0, 21.0, 33.0, 47.0, 63.0, 81.0, 104.0, 108.0, 102.0, 89.0, 83.0, 65.0, 56.0, 39.0, 30.0, 17.0, 17.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.420414447784424, -7.215081214904785, -7.009747505187988, -6.80441427230835, -6.599081039428711, -6.393747329711914, -6.188414096832275, -5.983080863952637, -5.77774715423584, -5.572413921356201, -5.367080211639404, -5.161746978759766, -4.956413269042969, -4.75108003616333, -4.545746803283691, -4.3404130935668945, -4.135079860687256, -3.929746389389038, -3.7244129180908203, -3.5190796852111816, -3.313746213912964, -3.108412742614746, -2.9030795097351074, -2.6977460384368896, -2.492412567138672, -2.287079095840454, -2.0817456245422363, -1.8764123916625977, -1.6710789203643799, -1.465745449066162, -1.2604120969772339, -1.0550787448883057, -0.8497457504272461, -0.6444123387336731, -0.4390789270401001, -0.2337455153465271, -0.0284121036529541, 0.17692136764526367, 0.3822547197341919, 0.5875880718231201, 0.7929215431213379, 0.9982549548149109, 1.2035883665084839, 1.408921718597412, 1.6142551898956299, 1.8195886611938477, 2.0249218940734863, 2.230255365371704, 2.435588836669922, 2.6409223079681396, 2.8462557792663574, 3.051589012145996, 3.256922483444214, 3.4622559547424316, 3.6675891876220703, 3.872922658920288, 4.078256130218506, 4.2835893630981445, 4.488923072814941, 4.69425630569458, 4.899589538574219, 5.104923248291016, 5.310256481170654, 5.515589714050293, 5.72092342376709]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 10.0, 17.0, 29.0, 52.0, 79.0, 113.0, 291.0, 626.0, 1631.0, 6622.0, 45820.0, 330118.0, 533789.0, 110727.0, 14226.0, 2680.0, 889.0, 370.0, 197.0, 105.0, 60.0, 32.0, 24.0, 10.0, 13.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6171875, -3.4677734375, -3.318359375, -3.1689453125, -3.01953125, -2.8701171875, -2.720703125, -2.5712890625, -2.421875, -2.2724609375, -2.123046875, -1.9736328125, -1.82421875, -1.6748046875, -1.525390625, -1.3759765625, -1.2265625, -1.0771484375, -0.927734375, -0.7783203125, -0.62890625, -0.4794921875, -0.330078125, -0.1806640625, -0.03125, 0.1181640625, 0.267578125, 0.4169921875, 0.56640625, 0.7158203125, 0.865234375, 1.0146484375, 1.1640625, 1.3134765625, 1.462890625, 1.6123046875, 1.76171875, 1.9111328125, 2.060546875, 2.2099609375, 2.359375, 2.5087890625, 2.658203125, 2.8076171875, 2.95703125, 3.1064453125, 3.255859375, 3.4052734375, 3.5546875, 3.7041015625, 3.853515625, 4.0029296875, 4.15234375, 4.3017578125, 4.451171875, 4.6005859375, 4.75, 4.8994140625, 5.048828125, 5.1982421875, 5.34765625, 5.4970703125, 5.646484375, 5.7958984375, 5.9453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 13.0, 10.0, 12.0, 16.0, 22.0, 35.0, 35.0, 48.0, 55.0, 63.0, 73.0, 77.0, 67.0, 78.0, 68.0, 60.0, 52.0, 41.0, 46.0, 43.0, 25.0, 16.0, 19.0, 5.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.78125, -10.49432373046875, -10.2073974609375, -9.92047119140625, -9.633544921875, -9.34661865234375, -9.0596923828125, -8.77276611328125, -8.48583984375, -8.19891357421875, -7.9119873046875, -7.62506103515625, -7.338134765625, -7.05120849609375, -6.7642822265625, -6.47735595703125, -6.1904296875, -5.90350341796875, -5.6165771484375, -5.32965087890625, -5.042724609375, -4.75579833984375, -4.4688720703125, -4.18194580078125, -3.89501953125, -3.60809326171875, -3.3211669921875, -3.03424072265625, -2.747314453125, -2.46038818359375, -2.1734619140625, -1.88653564453125, -1.599609375, -1.31268310546875, -1.0257568359375, -0.73883056640625, -0.451904296875, -0.16497802734375, 0.1219482421875, 0.40887451171875, 0.69580078125, 0.98272705078125, 1.2696533203125, 1.55657958984375, 1.843505859375, 2.13043212890625, 2.4173583984375, 2.70428466796875, 2.9912109375, 3.27813720703125, 3.5650634765625, 3.85198974609375, 4.138916015625, 4.42584228515625, 4.7127685546875, 4.99969482421875, 5.28662109375, 5.57354736328125, 5.8604736328125, 6.14739990234375, 6.434326171875, 6.72125244140625, 7.0081787109375, 7.29510498046875, 7.58203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 9.0, 8.0, 15.0, 10.0, 12.0, 23.0, 32.0, 49.0, 59.0, 81.0, 108.0, 157.0, 233.0, 356.0, 737.0, 4632.0, 445285.0, 588338.0, 6252.0, 835.0, 405.0, 260.0, 161.0, 113.0, 87.0, 67.0, 56.0, 34.0, 19.0, 26.0, 20.0, 14.0, 8.0, 16.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.6640625, -10.30908203125, -9.9541015625, -9.59912109375, -9.244140625, -8.88916015625, -8.5341796875, -8.17919921875, -7.82421875, -7.46923828125, -7.1142578125, -6.75927734375, -6.404296875, -6.04931640625, -5.6943359375, -5.33935546875, -4.984375, -4.62939453125, -4.2744140625, -3.91943359375, -3.564453125, -3.20947265625, -2.8544921875, -2.49951171875, -2.14453125, -1.78955078125, -1.4345703125, -1.07958984375, -0.724609375, -0.36962890625, -0.0146484375, 0.34033203125, 0.6953125, 1.05029296875, 1.4052734375, 1.76025390625, 2.115234375, 2.47021484375, 2.8251953125, 3.18017578125, 3.53515625, 3.89013671875, 4.2451171875, 4.60009765625, 4.955078125, 5.31005859375, 5.6650390625, 6.02001953125, 6.375, 6.72998046875, 7.0849609375, 7.43994140625, 7.794921875, 8.14990234375, 8.5048828125, 8.85986328125, 9.21484375, 9.56982421875, 9.9248046875, 10.27978515625, 10.634765625, 10.98974609375, 11.3447265625, 11.69970703125, 12.0546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 4.0, 5.0, 6.0, 17.0, 13.0, 14.0, 15.0, 17.0, 24.0, 28.0, 41.0, 34.0, 39.0, 47.0, 46.0, 54.0, 49.0, 41.0, 60.0, 42.0, 57.0, 47.0, 40.0, 44.0, 34.0, 33.0, 22.0, 23.0, 13.0, 10.0, 15.0, 9.0, 12.0, 5.0, 10.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.091796875, -7.83203125, -7.572265625, -7.3125, -7.052734375, -6.79296875, -6.533203125, -6.2734375, -6.013671875, -5.75390625, -5.494140625, -5.234375, -4.974609375, -4.71484375, -4.455078125, -4.1953125, -3.935546875, -3.67578125, -3.416015625, -3.15625, -2.896484375, -2.63671875, -2.376953125, -2.1171875, -1.857421875, -1.59765625, -1.337890625, -1.078125, -0.818359375, -0.55859375, -0.298828125, -0.0390625, 0.220703125, 0.48046875, 0.740234375, 1.0, 1.259765625, 1.51953125, 1.779296875, 2.0390625, 2.298828125, 2.55859375, 2.818359375, 3.078125, 3.337890625, 3.59765625, 3.857421875, 4.1171875, 4.376953125, 4.63671875, 4.896484375, 5.15625, 5.416015625, 5.67578125, 5.935546875, 6.1953125, 6.455078125, 6.71484375, 6.974609375, 7.234375, 7.494140625, 7.75390625, 8.013671875, 8.2734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 6.0, 8.0, 18.0, 19.0, 35.0, 72.0, 165.0, 591.0, 2726.0, 89368.0, 947143.0, 6821.0, 1013.0, 268.0, 116.0, 57.0, 36.0, 13.0, 18.0, 5.0, 3.0, 6.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.2578125, -6.06353759765625, -5.8692626953125, -5.67498779296875, -5.480712890625, -5.28643798828125, -5.0921630859375, -4.89788818359375, -4.70361328125, -4.50933837890625, -4.3150634765625, -4.12078857421875, -3.926513671875, -3.73223876953125, -3.5379638671875, -3.34368896484375, -3.1494140625, -2.95513916015625, -2.7608642578125, -2.56658935546875, -2.372314453125, -2.17803955078125, -1.9837646484375, -1.78948974609375, -1.59521484375, -1.40093994140625, -1.2066650390625, -1.01239013671875, -0.818115234375, -0.62384033203125, -0.4295654296875, -0.23529052734375, -0.041015625, 0.15325927734375, 0.3475341796875, 0.54180908203125, 0.736083984375, 0.93035888671875, 1.1246337890625, 1.31890869140625, 1.51318359375, 1.70745849609375, 1.9017333984375, 2.09600830078125, 2.290283203125, 2.48455810546875, 2.6788330078125, 2.87310791015625, 3.0673828125, 3.26165771484375, 3.4559326171875, 3.65020751953125, 3.844482421875, 4.03875732421875, 4.2330322265625, 4.42730712890625, 4.62158203125, 4.81585693359375, 5.0101318359375, 5.20440673828125, 5.398681640625, 5.59295654296875, 5.7872314453125, 5.98150634765625, 6.17578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 14.0, 19.0, 37.0, 76.0, 134.0, 173.0, 174.0, 136.0, 106.0, 54.0, 28.0, 15.0, 16.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0005311965942382812, -0.0005176737904548645, -0.0005041509866714478, -0.000490628182888031, -0.00047710537910461426, -0.0004635825753211975, -0.00045005977153778076, -0.000436536967754364, -0.00042301416397094727, -0.0004094913601875305, -0.00039596855640411377, -0.000382445752620697, -0.0003689229488372803, -0.0003554001450538635, -0.0003418773412704468, -0.00032835453748703003, -0.0003148317337036133, -0.00030130892992019653, -0.0002877861261367798, -0.00027426332235336304, -0.0002607405185699463, -0.00024721771478652954, -0.0002336949110031128, -0.00022017210721969604, -0.0002066493034362793, -0.00019312649965286255, -0.0001796036958694458, -0.00016608089208602905, -0.0001525580883026123, -0.00013903528451919556, -0.0001255124807357788, -0.00011198967695236206, -9.846687316894531e-05, -8.494406938552856e-05, -7.142126560211182e-05, -5.789846181869507e-05, -4.437565803527832e-05, -3.085285425186157e-05, -1.7330050468444824e-05, -3.807246685028076e-06, 9.715557098388672e-06, 2.323836088180542e-05, 3.676116466522217e-05, 5.0283968448638916e-05, 6.380677223205566e-05, 7.732957601547241e-05, 9.085237979888916e-05, 0.00010437518358230591, 0.00011789798736572266, 0.0001314207911491394, 0.00014494359493255615, 0.0001584663987159729, 0.00017198920249938965, 0.0001855120062828064, 0.00019903481006622314, 0.0002125576138496399, 0.00022608041763305664, 0.0002396032214164734, 0.00025312602519989014, 0.0002666488289833069, 0.00028017163276672363, 0.0002936944365501404, 0.00030721724033355713, 0.0003207400441169739, 0.0003342628479003906]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 8.0, 7.0, 10.0, 9.0, 20.0, 23.0, 50.0, 75.0, 183.0, 496.0, 1179.0, 4546.0, 189270.0, 841490.0, 8371.0, 1646.0, 627.0, 263.0, 114.0, 43.0, 30.0, 18.0, 7.0, 14.0, 6.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.5546875, -5.38189697265625, -5.2091064453125, -5.03631591796875, -4.863525390625, -4.69073486328125, -4.5179443359375, -4.34515380859375, -4.17236328125, -3.99957275390625, -3.8267822265625, -3.65399169921875, -3.481201171875, -3.30841064453125, -3.1356201171875, -2.96282958984375, -2.7900390625, -2.61724853515625, -2.4444580078125, -2.27166748046875, -2.098876953125, -1.92608642578125, -1.7532958984375, -1.58050537109375, -1.40771484375, -1.23492431640625, -1.0621337890625, -0.88934326171875, -0.716552734375, -0.54376220703125, -0.3709716796875, -0.19818115234375, -0.025390625, 0.14739990234375, 0.3201904296875, 0.49298095703125, 0.665771484375, 0.83856201171875, 1.0113525390625, 1.18414306640625, 1.35693359375, 1.52972412109375, 1.7025146484375, 1.87530517578125, 2.048095703125, 2.22088623046875, 2.3936767578125, 2.56646728515625, 2.7392578125, 2.91204833984375, 3.0848388671875, 3.25762939453125, 3.430419921875, 3.60321044921875, 3.7760009765625, 3.94879150390625, 4.12158203125, 4.29437255859375, 4.4671630859375, 4.63995361328125, 4.812744140625, 4.98553466796875, 5.1583251953125, 5.33111572265625, 5.50390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 6.0, 11.0, 30.0, 38.0, 63.0, 105.0, 110.0, 147.0, 107.0, 103.0, 81.0, 55.0, 40.0, 25.0, 15.0, 18.0, 6.0, 2.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.052734375, -1.0197601318359375, -0.986785888671875, -0.9538116455078125, -0.92083740234375, -0.8878631591796875, -0.854888916015625, -0.8219146728515625, -0.7889404296875, -0.7559661865234375, -0.722991943359375, -0.6900177001953125, -0.65704345703125, -0.6240692138671875, -0.591094970703125, -0.5581207275390625, -0.525146484375, -0.4921722412109375, -0.459197998046875, -0.4262237548828125, -0.39324951171875, -0.3602752685546875, -0.327301025390625, -0.2943267822265625, -0.2613525390625, -0.2283782958984375, -0.195404052734375, -0.1624298095703125, -0.12945556640625, -0.0964813232421875, -0.063507080078125, -0.0305328369140625, 0.00244140625, 0.0354156494140625, 0.068389892578125, 0.1013641357421875, 0.13433837890625, 0.1673126220703125, 0.200286865234375, 0.2332611083984375, 0.2662353515625, 0.2992095947265625, 0.332183837890625, 0.3651580810546875, 0.39813232421875, 0.4311065673828125, 0.464080810546875, 0.4970550537109375, 0.530029296875, 0.5630035400390625, 0.595977783203125, 0.6289520263671875, 0.66192626953125, 0.6949005126953125, 0.727874755859375, 0.7608489990234375, 0.7938232421875, 0.8267974853515625, 0.859771728515625, 0.8927459716796875, 0.92572021484375, 0.9586944580078125, 0.991668701171875, 1.0246429443359375, 1.0576171875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 44.0, 316.0, 488.0, 140.0, 13.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-72.83810424804688, -71.51814270019531, -70.19818878173828, -68.87822723388672, -67.55827331542969, -66.23831176757812, -64.91835021972656, -63.59839630126953, -62.27843475341797, -60.95847702026367, -59.638519287109375, -58.31855773925781, -56.998600006103516, -55.67864227294922, -54.35868453979492, -53.038726806640625, -51.71876907348633, -50.39881134033203, -49.078853607177734, -47.75889205932617, -46.438934326171875, -45.11897659301758, -43.79901885986328, -42.479061126708984, -41.15910339355469, -39.83914566040039, -38.519187927246094, -37.19922637939453, -35.879268646240234, -34.55931091308594, -33.23935317993164, -31.919395446777344, -30.599435806274414, -29.279478073120117, -27.959518432617188, -26.63956069946289, -25.319602966308594, -23.999643325805664, -22.679685592651367, -21.359725952148438, -20.03976821899414, -18.719810485839844, -17.399850845336914, -16.079893112182617, -14.759934425354004, -13.43997573852539, -12.120018005371094, -10.80005931854248, -9.480100631713867, -8.160141944885254, -6.840183734893799, -5.520225524902344, -4.2002668380737305, -2.880308151245117, -1.560349941253662, -0.24039173126220703, 1.0795669555664062, 2.3995254039764404, 3.7194838523864746, 5.03944206237793, 6.359400749206543, 7.679359436035156, 8.999317169189453, 10.319275856018066, 11.63923454284668]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 14.0, 14.0, 17.0, 24.0, 29.0, 21.0, 20.0, 29.0, 35.0, 38.0, 43.0, 50.0, 46.0, 45.0, 41.0, 49.0, 43.0, 50.0, 48.0, 44.0, 47.0, 24.0, 28.0, 33.0, 27.0, 21.0, 24.0, 16.0, 10.0, 9.0, 14.0, 6.0, 7.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-17.439943313598633, -16.99299430847168, -16.546045303344727, -16.099096298217773, -15.65214729309082, -15.205198287963867, -14.758249282836914, -14.311301231384277, -13.864352226257324, -13.417403221130371, -12.970454216003418, -12.523505210876465, -12.076556205749512, -11.629608154296875, -11.182659149169922, -10.735710144042969, -10.288761138916016, -9.841812133789062, -9.39486312866211, -8.947914123535156, -8.500965118408203, -8.05401611328125, -7.607067584991455, -7.16011905670166, -6.713169097900391, -6.2662200927734375, -5.819271087646484, -5.372322082519531, -4.925373554229736, -4.478424549102783, -4.03147554397583, -3.584526777267456, -3.137578010559082, -2.690629005432129, -2.243680238723755, -1.7967312335968018, -1.3497823476791382, -0.9028334617614746, -0.4558844566345215, -0.008935689926147461, 0.43801331520080566, 0.8849622011184692, 1.3319110870361328, 1.778860092163086, 2.225809097290039, 2.672757863998413, 3.119706869125366, 3.5666556358337402, 4.013604640960693, 4.4605536460876465, 4.9075026512146, 5.3544511795043945, 5.801400184631348, 6.248349189758301, 6.695298194885254, 7.142247200012207, 7.58919620513916, 8.036145210266113, 8.483094215393066, 8.93004322052002, 9.376992225646973, 9.82394027709961, 10.270889282226562, 10.717838287353516, 11.164787292480469]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 10.0, 11.0, 16.0, 18.0, 22.0, 27.0, 49.0, 88.0, 158.0, 294.0, 552.0, 1033.0, 2317.0, 15154.0, 347111.0, 3044398.0, 746422.0, 29957.0, 4477.0, 1316.0, 411.0, 182.0, 81.0, 58.0, 45.0, 24.0, 9.0, 11.0, 4.0, 10.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.31640625, -6.05987548828125, -5.8033447265625, -5.54681396484375, -5.290283203125, -5.03375244140625, -4.7772216796875, -4.52069091796875, -4.26416015625, -4.00762939453125, -3.7510986328125, -3.49456787109375, -3.238037109375, -2.98150634765625, -2.7249755859375, -2.46844482421875, -2.2119140625, -1.95538330078125, -1.6988525390625, -1.44232177734375, -1.185791015625, -0.92926025390625, -0.6727294921875, -0.41619873046875, -0.15966796875, 0.09686279296875, 0.3533935546875, 0.60992431640625, 0.866455078125, 1.12298583984375, 1.3795166015625, 1.63604736328125, 1.892578125, 2.14910888671875, 2.4056396484375, 2.66217041015625, 2.918701171875, 3.17523193359375, 3.4317626953125, 3.68829345703125, 3.94482421875, 4.20135498046875, 4.4578857421875, 4.71441650390625, 4.970947265625, 5.22747802734375, 5.4840087890625, 5.74053955078125, 5.9970703125, 6.25360107421875, 6.5101318359375, 6.76666259765625, 7.023193359375, 7.27972412109375, 7.5362548828125, 7.79278564453125, 8.04931640625, 8.30584716796875, 8.5623779296875, 8.81890869140625, 9.075439453125, 9.33197021484375, 9.5885009765625, 9.84503173828125, 10.1015625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 11.0, 25.0, 33.0, 41.0, 79.0, 66.0, 82.0, 96.0, 115.0, 101.0, 97.0, 62.0, 59.0, 52.0, 29.0, 15.0, 19.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.9337158203125, -8.648681640625, -8.3636474609375, -8.07861328125, -7.7935791015625, -7.508544921875, -7.2235107421875, -6.9384765625, -6.6534423828125, -6.368408203125, -6.0833740234375, -5.79833984375, -5.5133056640625, -5.228271484375, -4.9432373046875, -4.658203125, -4.3731689453125, -4.088134765625, -3.8031005859375, -3.51806640625, -3.2330322265625, -2.947998046875, -2.6629638671875, -2.3779296875, -2.0928955078125, -1.807861328125, -1.5228271484375, -1.23779296875, -0.9527587890625, -0.667724609375, -0.3826904296875, -0.09765625, 0.1873779296875, 0.472412109375, 0.7574462890625, 1.04248046875, 1.3275146484375, 1.612548828125, 1.8975830078125, 2.1826171875, 2.4676513671875, 2.752685546875, 3.0377197265625, 3.32275390625, 3.6077880859375, 3.892822265625, 4.1778564453125, 4.462890625, 4.7479248046875, 5.032958984375, 5.3179931640625, 5.60302734375, 5.8880615234375, 6.173095703125, 6.4581298828125, 6.7431640625, 7.0281982421875, 7.313232421875, 7.5982666015625, 7.88330078125, 8.1683349609375, 8.453369140625, 8.7384033203125, 9.0234375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 5.0, 12.0, 20.0, 39.0, 49.0, 105.0, 256.0, 666.0, 2998.0, 87775.0, 4073152.0, 26022.0, 2052.0, 575.0, 252.0, 120.0, 66.0, 30.0, 27.0, 14.0, 13.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.375, -11.867431640625, -11.35986328125, -10.852294921875, -10.3447265625, -9.837158203125, -9.32958984375, -8.822021484375, -8.314453125, -7.806884765625, -7.29931640625, -6.791748046875, -6.2841796875, -5.776611328125, -5.26904296875, -4.761474609375, -4.25390625, -3.746337890625, -3.23876953125, -2.731201171875, -2.2236328125, -1.716064453125, -1.20849609375, -0.700927734375, -0.193359375, 0.314208984375, 0.82177734375, 1.329345703125, 1.8369140625, 2.344482421875, 2.85205078125, 3.359619140625, 3.8671875, 4.374755859375, 4.88232421875, 5.389892578125, 5.8974609375, 6.405029296875, 6.91259765625, 7.420166015625, 7.927734375, 8.435302734375, 8.94287109375, 9.450439453125, 9.9580078125, 10.465576171875, 10.97314453125, 11.480712890625, 11.98828125, 12.495849609375, 13.00341796875, 13.510986328125, 14.0185546875, 14.526123046875, 15.03369140625, 15.541259765625, 16.048828125, 16.556396484375, 17.06396484375, 17.571533203125, 18.0791015625, 18.586669921875, 19.09423828125, 19.601806640625, 20.109375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 7.0, 6.0, 13.0, 19.0, 27.0, 47.0, 70.0, 139.0, 322.0, 672.0, 994.0, 855.0, 485.0, 215.0, 97.0, 33.0, 27.0, 20.0, 6.0, 10.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5703125, -3.473052978515625, -3.37579345703125, -3.278533935546875, -3.1812744140625, -3.084014892578125, -2.98675537109375, -2.889495849609375, -2.792236328125, -2.694976806640625, -2.59771728515625, -2.500457763671875, -2.4031982421875, -2.305938720703125, -2.20867919921875, -2.111419677734375, -2.01416015625, -1.916900634765625, -1.81964111328125, -1.722381591796875, -1.6251220703125, -1.527862548828125, -1.43060302734375, -1.333343505859375, -1.236083984375, -1.138824462890625, -1.04156494140625, -0.944305419921875, -0.8470458984375, -0.749786376953125, -0.65252685546875, -0.555267333984375, -0.4580078125, -0.360748291015625, -0.26348876953125, -0.166229248046875, -0.0689697265625, 0.028289794921875, 0.12554931640625, 0.222808837890625, 0.320068359375, 0.417327880859375, 0.51458740234375, 0.611846923828125, 0.7091064453125, 0.806365966796875, 0.90362548828125, 1.000885009765625, 1.09814453125, 1.195404052734375, 1.29266357421875, 1.389923095703125, 1.4871826171875, 1.584442138671875, 1.68170166015625, 1.778961181640625, 1.876220703125, 1.973480224609375, 2.07073974609375, 2.167999267578125, 2.2652587890625, 2.362518310546875, 2.45977783203125, 2.557037353515625, 2.654296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 20.0, 55.0, 171.0, 291.0, 263.0, 139.0, 47.0, 16.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.139326095581055, -27.538997650146484, -26.938671112060547, -26.338342666625977, -25.738014221191406, -25.137685775756836, -24.5373592376709, -23.937030792236328, -23.336702346801758, -22.736373901367188, -22.13604736328125, -21.53571891784668, -20.93539047241211, -20.33506202697754, -19.7347354888916, -19.13440704345703, -18.534080505371094, -17.933752059936523, -17.333425521850586, -16.733097076416016, -16.132768630981445, -15.532441139221191, -14.932113647460938, -14.331785202026367, -13.731456756591797, -13.131129264831543, -12.530800819396973, -11.930473327636719, -11.330144882202148, -10.729817390441895, -10.12948989868164, -9.52916145324707, -8.928832054138184, -8.32850456237793, -7.728176116943359, -7.1278486251831055, -6.527520179748535, -5.927192687988281, -5.326864719390869, -4.726536750793457, -4.126208782196045, -3.525880813598633, -2.9255528450012207, -2.3252251148223877, -1.7248971462249756, -1.1245691776275635, -0.5242414474487305, 0.07608652114868164, 0.6764144897460938, 1.2767424583435059, 1.8770703077316284, 2.477398157119751, 3.077726125717163, 3.678054094314575, 4.278381824493408, 4.87870979309082, 5.479037761688232, 6.0793657302856445, 6.679693698883057, 7.280021667480469, 7.880349159240723, 8.480677604675293, 9.081005096435547, 9.681333541870117, 10.281661033630371]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 5.0, 8.0, 8.0, 14.0, 28.0, 32.0, 25.0, 43.0, 44.0, 60.0, 56.0, 48.0, 57.0, 71.0, 56.0, 68.0, 66.0, 68.0, 43.0, 44.0, 40.0, 26.0, 22.0, 23.0, 16.0, 14.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.72708797454834, -7.524438858032227, -7.321789741516113, -7.119141101837158, -6.916491985321045, -6.713842868804932, -6.511194229125977, -6.308545112609863, -6.10589599609375, -5.903246879577637, -5.700597763061523, -5.497949123382568, -5.295300006866455, -5.092650890350342, -4.890002250671387, -4.687353134155273, -4.48470401763916, -4.282054901123047, -4.079405784606934, -3.8767571449279785, -3.6741080284118652, -3.471458911895752, -3.2688100337982178, -3.0661611557006836, -2.8635120391845703, -2.660862922668457, -2.458214044570923, -2.2555651664733887, -2.0529160499572754, -1.8502670526504517, -1.647618055343628, -1.4449690580368042, -1.2423205375671387, -1.039671540260315, -0.8370225429534912, -0.6343735456466675, -0.43172454833984375, -0.22907555103302002, -0.02642655372619629, 0.17622244358062744, 0.37887144088745117, 0.5815204381942749, 0.7841694355010986, 0.9868184328079224, 1.189467430114746, 1.3921164274215698, 1.5947654247283936, 1.7974144220352173, 2.000063419342041, 2.2027125358581543, 2.4053614139556885, 2.6080102920532227, 2.810659408569336, 3.013308525085449, 3.2159574031829834, 3.4186062812805176, 3.621255397796631, 3.823904514312744, 4.026553153991699, 4.2292022705078125, 4.431851387023926, 4.634500503540039, 4.837149620056152, 5.039798259735107, 5.242447376251221]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 2.0, 4.0, 5.0, 14.0, 14.0, 28.0, 36.0, 59.0, 91.0, 158.0, 355.0, 691.0, 1743.0, 4890.0, 18606.0, 98570.0, 659562.0, 218016.0, 33580.0, 7708.0, 2490.0, 957.0, 429.0, 220.0, 106.0, 86.0, 49.0, 37.0, 18.0, 10.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.646484375, -1.6039276123046875, -1.561370849609375, -1.5188140869140625, -1.47625732421875, -1.4337005615234375, -1.391143798828125, -1.3485870361328125, -1.3060302734375, -1.2634735107421875, -1.220916748046875, -1.1783599853515625, -1.13580322265625, -1.0932464599609375, -1.050689697265625, -1.0081329345703125, -0.965576171875, -0.9230194091796875, -0.880462646484375, -0.8379058837890625, -0.79534912109375, -0.7527923583984375, -0.710235595703125, -0.6676788330078125, -0.6251220703125, -0.5825653076171875, -0.540008544921875, -0.4974517822265625, -0.45489501953125, -0.4123382568359375, -0.369781494140625, -0.3272247314453125, -0.28466796875, -0.2421112060546875, -0.199554443359375, -0.1569976806640625, -0.11444091796875, -0.0718841552734375, -0.029327392578125, 0.0132293701171875, 0.0557861328125, 0.0983428955078125, 0.140899658203125, 0.1834564208984375, 0.22601318359375, 0.2685699462890625, 0.311126708984375, 0.3536834716796875, 0.396240234375, 0.4387969970703125, 0.481353759765625, 0.5239105224609375, 0.56646728515625, 0.6090240478515625, 0.651580810546875, 0.6941375732421875, 0.7366943359375, 0.7792510986328125, 0.821807861328125, 0.8643646240234375, 0.90692138671875, 0.9494781494140625, 0.992034912109375, 1.0345916748046875, 1.0771484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 21.0, 21.0, 43.0, 44.0, 46.0, 56.0, 76.0, 79.0, 71.0, 87.0, 72.0, 65.0, 81.0, 56.0, 45.0, 33.0, 27.0, 22.0, 19.0, 12.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.15234375, -6.9786376953125, -6.804931640625, -6.6312255859375, -6.45751953125, -6.2838134765625, -6.110107421875, -5.9364013671875, -5.7626953125, -5.5889892578125, -5.415283203125, -5.2415771484375, -5.06787109375, -4.8941650390625, -4.720458984375, -4.5467529296875, -4.373046875, -4.1993408203125, -4.025634765625, -3.8519287109375, -3.67822265625, -3.5045166015625, -3.330810546875, -3.1571044921875, -2.9833984375, -2.8096923828125, -2.635986328125, -2.4622802734375, -2.28857421875, -2.1148681640625, -1.941162109375, -1.7674560546875, -1.59375, -1.4200439453125, -1.246337890625, -1.0726318359375, -0.89892578125, -0.7252197265625, -0.551513671875, -0.3778076171875, -0.2041015625, -0.0303955078125, 0.143310546875, 0.3170166015625, 0.49072265625, 0.6644287109375, 0.838134765625, 1.0118408203125, 1.185546875, 1.3592529296875, 1.532958984375, 1.7066650390625, 1.88037109375, 2.0540771484375, 2.227783203125, 2.4014892578125, 2.5751953125, 2.7489013671875, 2.922607421875, 3.0963134765625, 3.27001953125, 3.4437255859375, 3.617431640625, 3.7911376953125, 3.96484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 6.0, 6.0, 12.0, 22.0, 29.0, 35.0, 49.0, 69.0, 114.0, 149.0, 228.0, 383.0, 597.0, 983.0, 1790.0, 3180.0, 6111.0, 12276.0, 25913.0, 59058.0, 153682.0, 404176.0, 231637.0, 80652.0, 34364.0, 15827.0, 7831.0, 4019.0, 2123.0, 1214.0, 709.0, 434.0, 260.0, 200.0, 128.0, 71.0, 59.0, 32.0, 23.0, 20.0, 20.0, 14.0, 14.0, 4.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.53759765625, -0.5200729370117188, -0.5025482177734375, -0.48502349853515625, -0.467498779296875, -0.44997406005859375, -0.4324493408203125, -0.41492462158203125, -0.39739990234375, -0.37987518310546875, -0.3623504638671875, -0.34482574462890625, -0.327301025390625, -0.30977630615234375, -0.2922515869140625, -0.27472686767578125, -0.2572021484375, -0.23967742919921875, -0.2221527099609375, -0.20462799072265625, -0.187103271484375, -0.16957855224609375, -0.1520538330078125, -0.13452911376953125, -0.11700439453125, -0.09947967529296875, -0.0819549560546875, -0.06443023681640625, -0.046905517578125, -0.02938079833984375, -0.0118560791015625, 0.00566864013671875, 0.023193359375, 0.04071807861328125, 0.0582427978515625, 0.07576751708984375, 0.093292236328125, 0.11081695556640625, 0.1283416748046875, 0.14586639404296875, 0.16339111328125, 0.18091583251953125, 0.1984405517578125, 0.21596527099609375, 0.233489990234375, 0.25101470947265625, 0.2685394287109375, 0.28606414794921875, 0.3035888671875, 0.32111358642578125, 0.3386383056640625, 0.35616302490234375, 0.373687744140625, 0.39121246337890625, 0.4087371826171875, 0.42626190185546875, 0.44378662109375, 0.46131134033203125, 0.4788360595703125, 0.49636077880859375, 0.513885498046875, 0.5314102172851562, 0.5489349365234375, 0.5664596557617188, 0.583984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 6.0, 8.0, 4.0, 5.0, 9.0, 11.0, 17.0, 14.0, 13.0, 24.0, 24.0, 20.0, 27.0, 30.0, 36.0, 33.0, 26.0, 36.0, 43.0, 44.0, 50.0, 43.0, 34.0, 43.0, 33.0, 43.0, 35.0, 36.0, 26.0, 31.0, 28.0, 32.0, 20.0, 23.0, 20.0, 15.0, 10.0, 9.0, 4.0, 10.0, 3.0, 9.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.25, -6.0579833984375, -5.865966796875, -5.6739501953125, -5.48193359375, -5.2899169921875, -5.097900390625, -4.9058837890625, -4.7138671875, -4.5218505859375, -4.329833984375, -4.1378173828125, -3.94580078125, -3.7537841796875, -3.561767578125, -3.3697509765625, -3.177734375, -2.9857177734375, -2.793701171875, -2.6016845703125, -2.40966796875, -2.2176513671875, -2.025634765625, -1.8336181640625, -1.6416015625, -1.4495849609375, -1.257568359375, -1.0655517578125, -0.87353515625, -0.6815185546875, -0.489501953125, -0.2974853515625, -0.10546875, 0.0865478515625, 0.278564453125, 0.4705810546875, 0.66259765625, 0.8546142578125, 1.046630859375, 1.2386474609375, 1.4306640625, 1.6226806640625, 1.814697265625, 2.0067138671875, 2.19873046875, 2.3907470703125, 2.582763671875, 2.7747802734375, 2.966796875, 3.1588134765625, 3.350830078125, 3.5428466796875, 3.73486328125, 3.9268798828125, 4.118896484375, 4.3109130859375, 4.5029296875, 4.6949462890625, 4.886962890625, 5.0789794921875, 5.27099609375, 5.4630126953125, 5.655029296875, 5.8470458984375, 6.0390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 7.0, 6.0, 20.0, 23.0, 35.0, 58.0, 91.0, 120.0, 194.0, 287.0, 501.0, 705.0, 1213.0, 2237.0, 4834.0, 10786.0, 28838.0, 93334.0, 313742.0, 391434.0, 133418.0, 39993.0, 14294.0, 5936.0, 2759.0, 1437.0, 795.0, 502.0, 331.0, 200.0, 115.0, 100.0, 68.0, 39.0, 25.0, 24.0, 17.0, 13.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.084228515625, -0.08152389526367188, -0.07881927490234375, -0.07611465454101562, -0.0734100341796875, -0.07070541381835938, -0.06800079345703125, -0.06529617309570312, -0.062591552734375, -0.059886932373046875, -0.05718231201171875, -0.054477691650390625, -0.0517730712890625, -0.049068450927734375, -0.04636383056640625, -0.043659210205078125, -0.04095458984375, -0.038249969482421875, -0.03554534912109375, -0.032840728759765625, -0.0301361083984375, -0.027431488037109375, -0.02472686767578125, -0.022022247314453125, -0.019317626953125, -0.016613006591796875, -0.01390838623046875, -0.011203765869140625, -0.0084991455078125, -0.005794525146484375, -0.00308990478515625, -0.000385284423828125, 0.0023193359375, 0.005023956298828125, 0.00772857666015625, 0.010433197021484375, 0.0131378173828125, 0.015842437744140625, 0.01854705810546875, 0.021251678466796875, 0.023956298828125, 0.026660919189453125, 0.02936553955078125, 0.032070159912109375, 0.0347747802734375, 0.037479400634765625, 0.04018402099609375, 0.042888641357421875, 0.04559326171875, 0.048297882080078125, 0.05100250244140625, 0.053707122802734375, 0.0564117431640625, 0.059116363525390625, 0.06182098388671875, 0.06452560424804688, 0.067230224609375, 0.06993484497070312, 0.07263946533203125, 0.07534408569335938, 0.0780487060546875, 0.08075332641601562, 0.08345794677734375, 0.08616256713867188, 0.0888671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 3.0, 8.0, 6.0, 15.0, 16.0, 18.0, 32.0, 32.0, 46.0, 55.0, 88.0, 113.0, 96.0, 76.0, 83.0, 80.0, 70.0, 50.0, 34.0, 14.0, 20.0, 12.0, 7.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.866455078125e-05, -6.6426582634449e-05, -6.418861448764801e-05, -6.195064634084702e-05, -5.971267819404602e-05, -5.7474710047245026e-05, -5.523674190044403e-05, -5.2998773753643036e-05, -5.076080560684204e-05, -4.8522837460041046e-05, -4.628486931324005e-05, -4.4046901166439056e-05, -4.180893301963806e-05, -3.957096487283707e-05, -3.733299672603607e-05, -3.509502857923508e-05, -3.285706043243408e-05, -3.061909228563309e-05, -2.8381124138832092e-05, -2.6143155992031097e-05, -2.3905187845230103e-05, -2.1667219698429108e-05, -1.9429251551628113e-05, -1.7191283404827118e-05, -1.4953315258026123e-05, -1.2715347111225128e-05, -1.0477378964424133e-05, -8.239410817623138e-06, -6.0014426708221436e-06, -3.7634745240211487e-06, -1.5255063772201538e-06, 7.124617695808411e-07, 2.950429916381836e-06, 5.188398063182831e-06, 7.426366209983826e-06, 9.66433435678482e-06, 1.1902302503585815e-05, 1.414027065038681e-05, 1.6378238797187805e-05, 1.86162069439888e-05, 2.0854175090789795e-05, 2.309214323759079e-05, 2.5330111384391785e-05, 2.756807953119278e-05, 2.9806047677993774e-05, 3.204401582479477e-05, 3.4281983971595764e-05, 3.651995211839676e-05, 3.8757920265197754e-05, 4.099588841199875e-05, 4.3233856558799744e-05, 4.547182470560074e-05, 4.7709792852401733e-05, 4.994776099920273e-05, 5.218572914600372e-05, 5.442369729280472e-05, 5.666166543960571e-05, 5.889963358640671e-05, 6.11376017332077e-05, 6.33755698800087e-05, 6.561353802680969e-05, 6.785150617361069e-05, 7.008947432041168e-05, 7.232744246721268e-05, 7.456541061401367e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 8.0, 6.0, 10.0, 12.0, 17.0, 26.0, 57.0, 71.0, 111.0, 159.0, 222.0, 401.0, 756.0, 1654.0, 4315.0, 13497.0, 48488.0, 215786.0, 520568.0, 182507.0, 41085.0, 11661.0, 3905.0, 1497.0, 676.0, 346.0, 212.0, 146.0, 103.0, 64.0, 52.0, 34.0, 29.0, 15.0, 16.0, 14.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.11627197265625, -0.11316680908203125, -0.1100616455078125, -0.10695648193359375, -0.103851318359375, -0.10074615478515625, -0.0976409912109375, -0.09453582763671875, -0.0914306640625, -0.08832550048828125, -0.0852203369140625, -0.08211517333984375, -0.079010009765625, -0.07590484619140625, -0.0727996826171875, -0.06969451904296875, -0.06658935546875, -0.06348419189453125, -0.0603790283203125, -0.05727386474609375, -0.054168701171875, -0.05106353759765625, -0.0479583740234375, -0.04485321044921875, -0.041748046875, -0.03864288330078125, -0.0355377197265625, -0.03243255615234375, -0.029327392578125, -0.02622222900390625, -0.0231170654296875, -0.02001190185546875, -0.01690673828125, -0.01380157470703125, -0.0106964111328125, -0.00759124755859375, -0.004486083984375, -0.00138092041015625, 0.0017242431640625, 0.00482940673828125, 0.0079345703125, 0.01103973388671875, 0.0141448974609375, 0.01725006103515625, 0.020355224609375, 0.02346038818359375, 0.0265655517578125, 0.02967071533203125, 0.03277587890625, 0.03588104248046875, 0.0389862060546875, 0.04209136962890625, 0.045196533203125, 0.04830169677734375, 0.0514068603515625, 0.05451202392578125, 0.0576171875, 0.06072235107421875, 0.0638275146484375, 0.06693267822265625, 0.070037841796875, 0.07314300537109375, 0.0762481689453125, 0.07935333251953125, 0.08245849609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 3.0, 9.0, 2.0, 13.0, 8.0, 13.0, 19.0, 15.0, 19.0, 16.0, 33.0, 42.0, 43.0, 58.0, 61.0, 99.0, 87.0, 101.0, 81.0, 49.0, 41.0, 34.0, 32.0, 23.0, 29.0, 14.0, 11.0, 10.0, 11.0, 10.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025604248046875, -0.02470874786376953, -0.023813247680664062, -0.022917747497558594, -0.022022247314453125, -0.021126747131347656, -0.020231246948242188, -0.01933574676513672, -0.01844024658203125, -0.01754474639892578, -0.016649246215820312, -0.015753746032714844, -0.014858245849609375, -0.013962745666503906, -0.013067245483398438, -0.012171745300292969, -0.0112762451171875, -0.010380744934082031, -0.009485244750976562, -0.008589744567871094, -0.007694244384765625, -0.006798744201660156, -0.0059032440185546875, -0.005007743835449219, -0.00411224365234375, -0.0032167434692382812, -0.0023212432861328125, -0.0014257431030273438, -0.000530242919921875, 0.00036525726318359375, 0.0012607574462890625, 0.0021562576293945312, 0.0030517578125, 0.003947257995605469, 0.0048427581787109375, 0.005738258361816406, 0.006633758544921875, 0.007529258728027344, 0.008424758911132812, 0.009320259094238281, 0.01021575927734375, 0.011111259460449219, 0.012006759643554688, 0.012902259826660156, 0.013797760009765625, 0.014693260192871094, 0.015588760375976562, 0.01648426055908203, 0.0173797607421875, 0.01827526092529297, 0.019170761108398438, 0.020066261291503906, 0.020961761474609375, 0.021857261657714844, 0.022752761840820312, 0.02364826202392578, 0.02454376220703125, 0.02543926239013672, 0.026334762573242188, 0.027230262756347656, 0.028125762939453125, 0.029021263122558594, 0.029916763305664062, 0.03081226348876953, 0.031707763671875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 250.0, 728.0, 31.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-70.77766418457031, -69.51912689208984, -68.26058959960938, -67.00204467773438, -65.7435073852539, -64.48497009277344, -63.2264289855957, -61.967891693115234, -60.7093505859375, -59.45081329345703, -58.1922721862793, -56.93373489379883, -55.675193786621094, -54.416656494140625, -53.15811538696289, -51.89957809448242, -50.64103698730469, -49.38249969482422, -48.123958587646484, -46.865421295166016, -45.60688018798828, -44.34834289550781, -43.08980178833008, -41.83126449584961, -40.57272720336914, -39.31418991088867, -38.05564880371094, -36.79711151123047, -35.538570404052734, -34.280033111572266, -33.02149200439453, -31.762954711914062, -30.504411697387695, -29.245872497558594, -27.987333297729492, -26.72879409790039, -25.47025489807129, -24.211715698242188, -22.95317840576172, -21.694637298583984, -20.436100006103516, -19.177560806274414, -17.919021606445312, -16.66048240661621, -15.40194320678711, -14.143404006958008, -12.884865760803223, -11.626326560974121, -10.367786407470703, -9.109247207641602, -7.8507080078125, -6.592169284820557, -5.333630084991455, -4.0750908851623535, -2.81655216217041, -1.5580129623413086, -0.29947376251220703, 0.959065318107605, 2.217604398727417, 3.4761433601379395, 4.734682559967041, 5.993221759796143, 7.251760482788086, 8.510299682617188, 9.768838882446289]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 7.0, 13.0, 30.0, 42.0, 41.0, 64.0, 68.0, 80.0, 73.0, 89.0, 87.0, 86.0, 83.0, 59.0, 61.0, 27.0, 28.0, 25.0, 15.0, 10.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.096746444702148, -6.908555030822754, -6.720363616943359, -6.532172203063965, -6.34398078918457, -6.155789375305176, -5.967597961425781, -5.779406547546387, -5.591215133666992, -5.403023719787598, -5.214832305908203, -5.026640892028809, -4.838449478149414, -4.6502580642700195, -4.462066650390625, -4.2738752365112305, -4.085683822631836, -3.8974924087524414, -3.709300994873047, -3.5211095809936523, -3.332918167114258, -3.1447267532348633, -2.9565353393554688, -2.768343925476074, -2.5801525115966797, -2.391961097717285, -2.2037696838378906, -2.015578269958496, -1.8273868560791016, -1.639195442199707, -1.4510040283203125, -1.262812614440918, -1.0746207237243652, -0.8864293098449707, -0.6982378959655762, -0.5100464820861816, -0.3218550682067871, -0.13366365432739258, 0.05452775955200195, 0.24271917343139648, 0.430910587310791, 0.6191020011901855, 0.8072934150695801, 0.9954848289489746, 1.1836762428283691, 1.3718676567077637, 1.5600590705871582, 1.7482504844665527, 1.9364418983459473, 2.124633312225342, 2.3128247261047363, 2.501016139984131, 2.6892075538635254, 2.87739896774292, 3.0655903816223145, 3.253781795501709, 3.4419732093811035, 3.630164623260498, 3.8183560371398926, 4.006547451019287, 4.194738864898682, 4.382930278778076, 4.571121692657471, 4.759313106536865, 4.94750452041626]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 6.0, 12.0, 21.0, 34.0, 53.0, 101.0, 159.0, 342.0, 665.0, 1622.0, 4893.0, 20246.0, 104568.0, 530579.0, 310855.0, 57271.0, 11653.0, 3193.0, 1160.0, 523.0, 280.0, 128.0, 64.0, 51.0, 21.0, 15.0, 15.0, 4.0, 8.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.328125, -3.19921875, -3.0703125, -2.94140625, -2.8125, -2.68359375, -2.5546875, -2.42578125, -2.296875, -2.16796875, -2.0390625, -1.91015625, -1.78125, -1.65234375, -1.5234375, -1.39453125, -1.265625, -1.13671875, -1.0078125, -0.87890625, -0.75, -0.62109375, -0.4921875, -0.36328125, -0.234375, -0.10546875, 0.0234375, 0.15234375, 0.28125, 0.41015625, 0.5390625, 0.66796875, 0.796875, 0.92578125, 1.0546875, 1.18359375, 1.3125, 1.44140625, 1.5703125, 1.69921875, 1.828125, 1.95703125, 2.0859375, 2.21484375, 2.34375, 2.47265625, 2.6015625, 2.73046875, 2.859375, 2.98828125, 3.1171875, 3.24609375, 3.375, 3.50390625, 3.6328125, 3.76171875, 3.890625, 4.01953125, 4.1484375, 4.27734375, 4.40625, 4.53515625, 4.6640625, 4.79296875, 4.921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 22.0, 19.0, 35.0, 16.0, 38.0, 47.0, 56.0, 72.0, 67.0, 54.0, 68.0, 66.0, 71.0, 71.0, 58.0, 59.0, 29.0, 37.0, 25.0, 25.0, 16.0, 11.0, 13.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.259033203125, -9.98681640625, -9.714599609375, -9.4423828125, -9.170166015625, -8.89794921875, -8.625732421875, -8.353515625, -8.081298828125, -7.80908203125, -7.536865234375, -7.2646484375, -6.992431640625, -6.72021484375, -6.447998046875, -6.17578125, -5.903564453125, -5.63134765625, -5.359130859375, -5.0869140625, -4.814697265625, -4.54248046875, -4.270263671875, -3.998046875, -3.725830078125, -3.45361328125, -3.181396484375, -2.9091796875, -2.636962890625, -2.36474609375, -2.092529296875, -1.8203125, -1.548095703125, -1.27587890625, -1.003662109375, -0.7314453125, -0.459228515625, -0.18701171875, 0.085205078125, 0.357421875, 0.629638671875, 0.90185546875, 1.174072265625, 1.4462890625, 1.718505859375, 1.99072265625, 2.262939453125, 2.53515625, 2.807373046875, 3.07958984375, 3.351806640625, 3.6240234375, 3.896240234375, 4.16845703125, 4.440673828125, 4.712890625, 4.985107421875, 5.25732421875, 5.529541015625, 5.8017578125, 6.073974609375, 6.34619140625, 6.618408203125, 6.890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 8.0, 12.0, 18.0, 21.0, 34.0, 36.0, 49.0, 65.0, 100.0, 150.0, 223.0, 399.0, 919.0, 6881.0, 682673.0, 350784.0, 4320.0, 840.0, 347.0, 216.0, 135.0, 99.0, 60.0, 34.0, 20.0, 18.0, 16.0, 13.0, 20.0, 9.0, 8.0, 7.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3203125, -11.9571533203125, -11.593994140625, -11.2308349609375, -10.86767578125, -10.5045166015625, -10.141357421875, -9.7781982421875, -9.4150390625, -9.0518798828125, -8.688720703125, -8.3255615234375, -7.96240234375, -7.5992431640625, -7.236083984375, -6.8729248046875, -6.509765625, -6.1466064453125, -5.783447265625, -5.4202880859375, -5.05712890625, -4.6939697265625, -4.330810546875, -3.9676513671875, -3.6044921875, -3.2413330078125, -2.878173828125, -2.5150146484375, -2.15185546875, -1.7886962890625, -1.425537109375, -1.0623779296875, -0.69921875, -0.3360595703125, 0.027099609375, 0.3902587890625, 0.75341796875, 1.1165771484375, 1.479736328125, 1.8428955078125, 2.2060546875, 2.5692138671875, 2.932373046875, 3.2955322265625, 3.65869140625, 4.0218505859375, 4.385009765625, 4.7481689453125, 5.111328125, 5.4744873046875, 5.837646484375, 6.2008056640625, 6.56396484375, 6.9271240234375, 7.290283203125, 7.6534423828125, 8.0166015625, 8.3797607421875, 8.742919921875, 9.1060791015625, 9.46923828125, 9.8323974609375, 10.195556640625, 10.5587158203125, 10.921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 11.0, 8.0, 11.0, 11.0, 13.0, 24.0, 26.0, 47.0, 48.0, 37.0, 53.0, 62.0, 65.0, 78.0, 54.0, 65.0, 57.0, 44.0, 54.0, 34.0, 52.0, 32.0, 20.0, 31.0, 18.0, 19.0, 10.0, 7.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.484375, -9.1204833984375, -8.756591796875, -8.3927001953125, -8.02880859375, -7.6649169921875, -7.301025390625, -6.9371337890625, -6.5732421875, -6.2093505859375, -5.845458984375, -5.4815673828125, -5.11767578125, -4.7537841796875, -4.389892578125, -4.0260009765625, -3.662109375, -3.2982177734375, -2.934326171875, -2.5704345703125, -2.20654296875, -1.8426513671875, -1.478759765625, -1.1148681640625, -0.7509765625, -0.3870849609375, -0.023193359375, 0.3406982421875, 0.70458984375, 1.0684814453125, 1.432373046875, 1.7962646484375, 2.16015625, 2.5240478515625, 2.887939453125, 3.2518310546875, 3.61572265625, 3.9796142578125, 4.343505859375, 4.7073974609375, 5.0712890625, 5.4351806640625, 5.799072265625, 6.1629638671875, 6.52685546875, 6.8907470703125, 7.254638671875, 7.6185302734375, 7.982421875, 8.3463134765625, 8.710205078125, 9.0740966796875, 9.43798828125, 9.8018798828125, 10.165771484375, 10.5296630859375, 10.8935546875, 11.2574462890625, 11.621337890625, 11.9852294921875, 12.34912109375, 12.7130126953125, 13.076904296875, 13.4407958984375, 13.8046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 4.0, 7.0, 14.0, 24.0, 27.0, 85.0, 379.0, 4028.0, 1026235.0, 16777.0, 689.0, 164.0, 50.0, 27.0, 7.0, 12.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.25, -8.9580078125, -8.666015625, -8.3740234375, -8.08203125, -7.7900390625, -7.498046875, -7.2060546875, -6.9140625, -6.6220703125, -6.330078125, -6.0380859375, -5.74609375, -5.4541015625, -5.162109375, -4.8701171875, -4.578125, -4.2861328125, -3.994140625, -3.7021484375, -3.41015625, -3.1181640625, -2.826171875, -2.5341796875, -2.2421875, -1.9501953125, -1.658203125, -1.3662109375, -1.07421875, -0.7822265625, -0.490234375, -0.1982421875, 0.09375, 0.3857421875, 0.677734375, 0.9697265625, 1.26171875, 1.5537109375, 1.845703125, 2.1376953125, 2.4296875, 2.7216796875, 3.013671875, 3.3056640625, 3.59765625, 3.8896484375, 4.181640625, 4.4736328125, 4.765625, 5.0576171875, 5.349609375, 5.6416015625, 5.93359375, 6.2255859375, 6.517578125, 6.8095703125, 7.1015625, 7.3935546875, 7.685546875, 7.9775390625, 8.26953125, 8.5615234375, 8.853515625, 9.1455078125, 9.4375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 10.0, 16.0, 36.0, 56.0, 104.0, 182.0, 231.0, 145.0, 86.0, 58.0, 27.0, 15.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004260540008544922, -0.00041201338171958923, -0.0003979727625846863, -0.0003839321434497833, -0.00036989152431488037, -0.0003558509051799774, -0.00034181028604507446, -0.0003277696669101715, -0.00031372904777526855, -0.0002996884286403656, -0.00028564780950546265, -0.0002716071903705597, -0.00025756657123565674, -0.00024352595210075378, -0.00022948533296585083, -0.00021544471383094788, -0.00020140409469604492, -0.00018736347556114197, -0.00017332285642623901, -0.00015928223729133606, -0.0001452416181564331, -0.00013120099902153015, -0.0001171603798866272, -0.00010311976075172424, -8.907914161682129e-05, -7.503852248191833e-05, -6.099790334701538e-05, -4.695728421211243e-05, -3.291666507720947e-05, -1.887604594230652e-05, -4.8354268074035645e-06, 9.20519232749939e-06, 2.3245811462402344e-05, 3.72864305973053e-05, 5.132704973220825e-05, 6.53676688671112e-05, 7.940828800201416e-05, 9.344890713691711e-05, 0.00010748952627182007, 0.00012153014540672302, 0.00013557076454162598, 0.00014961138367652893, 0.00016365200281143188, 0.00017769262194633484, 0.0001917332410812378, 0.00020577386021614075, 0.0002198144793510437, 0.00023385509848594666, 0.0002478957176208496, 0.00026193633675575256, 0.0002759769558906555, 0.00029001757502555847, 0.0003040581941604614, 0.0003180988132953644, 0.00033213943243026733, 0.0003461800515651703, 0.00036022067070007324, 0.0003742612898349762, 0.00038830190896987915, 0.0004023425281047821, 0.00041638314723968506, 0.000430423766374588, 0.00044446438550949097, 0.0004585050046443939, 0.0004725456237792969]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 11.0, 5.0, 7.0, 15.0, 28.0, 58.0, 132.0, 441.0, 2435.0, 99624.0, 939403.0, 5277.0, 732.0, 217.0, 74.0, 29.0, 24.0, 9.0, 6.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.546875, -8.31695556640625, -8.0870361328125, -7.85711669921875, -7.627197265625, -7.39727783203125, -7.1673583984375, -6.93743896484375, -6.70751953125, -6.47760009765625, -6.2476806640625, -6.01776123046875, -5.787841796875, -5.55792236328125, -5.3280029296875, -5.09808349609375, -4.8681640625, -4.63824462890625, -4.4083251953125, -4.17840576171875, -3.948486328125, -3.71856689453125, -3.4886474609375, -3.25872802734375, -3.02880859375, -2.79888916015625, -2.5689697265625, -2.33905029296875, -2.109130859375, -1.87921142578125, -1.6492919921875, -1.41937255859375, -1.189453125, -0.95953369140625, -0.7296142578125, -0.49969482421875, -0.269775390625, -0.03985595703125, 0.1900634765625, 0.41998291015625, 0.64990234375, 0.87982177734375, 1.1097412109375, 1.33966064453125, 1.569580078125, 1.79949951171875, 2.0294189453125, 2.25933837890625, 2.4892578125, 2.71917724609375, 2.9490966796875, 3.17901611328125, 3.408935546875, 3.63885498046875, 3.8687744140625, 4.09869384765625, 4.32861328125, 4.55853271484375, 4.7884521484375, 5.01837158203125, 5.248291015625, 5.47821044921875, 5.7081298828125, 5.93804931640625, 6.16796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 13.0, 17.0, 24.0, 41.0, 74.0, 135.0, 187.0, 177.0, 117.0, 82.0, 44.0, 32.0, 15.0, 7.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4794921875, -1.4372100830078125, -1.394927978515625, -1.3526458740234375, -1.31036376953125, -1.2680816650390625, -1.225799560546875, -1.1835174560546875, -1.1412353515625, -1.0989532470703125, -1.056671142578125, -1.0143890380859375, -0.97210693359375, -0.9298248291015625, -0.887542724609375, -0.8452606201171875, -0.802978515625, -0.7606964111328125, -0.718414306640625, -0.6761322021484375, -0.63385009765625, -0.5915679931640625, -0.549285888671875, -0.5070037841796875, -0.4647216796875, -0.4224395751953125, -0.380157470703125, -0.3378753662109375, -0.29559326171875, -0.2533111572265625, -0.211029052734375, -0.1687469482421875, -0.12646484375, -0.0841827392578125, -0.041900634765625, 0.0003814697265625, 0.04266357421875, 0.0849456787109375, 0.127227783203125, 0.1695098876953125, 0.2117919921875, 0.2540740966796875, 0.296356201171875, 0.3386383056640625, 0.38092041015625, 0.4232025146484375, 0.465484619140625, 0.5077667236328125, 0.550048828125, 0.5923309326171875, 0.634613037109375, 0.6768951416015625, 0.71917724609375, 0.7614593505859375, 0.803741455078125, 0.8460235595703125, 0.8883056640625, 0.9305877685546875, 0.972869873046875, 1.0151519775390625, 1.05743408203125, 1.0997161865234375, 1.141998291015625, 1.1842803955078125, 1.2265625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 30.0, 86.0, 244.0, 351.0, 201.0, 62.0, 22.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.399810791015625, -28.614139556884766, -27.828468322753906, -27.042797088623047, -26.257125854492188, -25.471454620361328, -24.68578338623047, -23.90011215209961, -23.11444091796875, -22.32876968383789, -21.54309844970703, -20.757427215576172, -19.971755981445312, -19.186084747314453, -18.400413513183594, -17.614742279052734, -16.829072952270508, -16.04340171813965, -15.257730484008789, -14.47205924987793, -13.68638801574707, -12.900716781616211, -12.115046501159668, -11.329375267028809, -10.54370403289795, -9.75803279876709, -8.97236156463623, -8.186691284179688, -7.40101957321167, -6.6153483390808105, -5.829677581787109, -5.04400634765625, -4.258337020874023, -3.472665786743164, -2.686994791030884, -1.9013237953186035, -1.1156525611877441, -0.32998132705688477, 0.4556894302368164, 1.2413606643676758, 2.027031898498535, 2.8127031326293945, 3.598374128341675, 4.384045124053955, 5.1697163581848145, 5.955387592315674, 6.741058349609375, 7.526729583740234, 8.312400817871094, 9.098072052001953, 9.883743286132812, 10.669414520263672, 11.455085754394531, 12.24075698852539, 13.026427268981934, 13.812098503112793, 14.597769737243652, 15.383440971374512, 16.169111251831055, 16.954782485961914, 17.740453720092773, 18.526124954223633, 19.311796188354492, 20.09746742248535, 20.88313865661621]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 6.0, 13.0, 13.0, 21.0, 24.0, 40.0, 44.0, 53.0, 43.0, 54.0, 65.0, 60.0, 66.0, 77.0, 54.0, 65.0, 50.0, 53.0, 36.0, 47.0, 22.0, 27.0, 19.0, 9.0, 12.0, 3.0, 8.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.250505447387695, -25.62093734741211, -24.991369247436523, -24.36180305480957, -23.732234954833984, -23.1026668548584, -22.473098754882812, -21.843530654907227, -21.21396255493164, -20.584394454956055, -19.95482635498047, -19.325260162353516, -18.69569206237793, -18.066123962402344, -17.436555862426758, -16.806987762451172, -16.17742156982422, -15.547853469848633, -14.918286323547363, -14.288718223571777, -13.659151077270508, -13.029582977294922, -12.400014877319336, -11.77044677734375, -11.14087963104248, -10.511311531066895, -9.881744384765625, -9.252176284790039, -8.622608184814453, -7.993041038513184, -7.363472938537598, -6.73390531539917, -6.104337692260742, -5.4747700691223145, -4.845202445983887, -4.215634346008301, -3.586066722869873, -2.9564990997314453, -2.3269312381744385, -1.6973633766174316, -1.067795753479004, -0.4382280111312866, 0.19133973121643066, 0.820907473564148, 1.4504752159118652, 2.080042839050293, 2.7096107006073, 3.3391785621643066, 3.9687461853027344, 4.598313808441162, 5.22788143157959, 5.857449531555176, 6.4870171546936035, 7.116584777832031, 7.746152877807617, 8.375720977783203, 9.005288124084473, 9.634856224060059, 10.264423370361328, 10.893991470336914, 11.5235595703125, 12.15312671661377, 12.782694816589355, 13.412261962890625, 14.041830062866211]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 10.0, 6.0, 10.0, 16.0, 28.0, 31.0, 50.0, 68.0, 129.0, 168.0, 287.0, 486.0, 892.0, 2274.0, 21831.0, 1101141.0, 2962846.0, 96043.0, 5716.0, 1112.0, 395.0, 223.0, 147.0, 106.0, 87.0, 54.0, 38.0, 19.0, 18.0, 11.0, 8.0, 5.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.0390625, -10.7423095703125, -10.445556640625, -10.1488037109375, -9.85205078125, -9.5552978515625, -9.258544921875, -8.9617919921875, -8.6650390625, -8.3682861328125, -8.071533203125, -7.7747802734375, -7.47802734375, -7.1812744140625, -6.884521484375, -6.5877685546875, -6.291015625, -5.9942626953125, -5.697509765625, -5.4007568359375, -5.10400390625, -4.8072509765625, -4.510498046875, -4.2137451171875, -3.9169921875, -3.6202392578125, -3.323486328125, -3.0267333984375, -2.72998046875, -2.4332275390625, -2.136474609375, -1.8397216796875, -1.54296875, -1.2462158203125, -0.949462890625, -0.6527099609375, -0.35595703125, -0.0592041015625, 0.237548828125, 0.5343017578125, 0.8310546875, 1.1278076171875, 1.424560546875, 1.7213134765625, 2.01806640625, 2.3148193359375, 2.611572265625, 2.9083251953125, 3.205078125, 3.5018310546875, 3.798583984375, 4.0953369140625, 4.39208984375, 4.6888427734375, 4.985595703125, 5.2823486328125, 5.5791015625, 5.8758544921875, 6.172607421875, 6.4693603515625, 6.76611328125, 7.0628662109375, 7.359619140625, 7.6563720703125, 7.953125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 19.0, 25.0, 27.0, 61.0, 59.0, 79.0, 69.0, 96.0, 90.0, 85.0, 86.0, 89.0, 60.0, 49.0, 35.0, 28.0, 14.0, 10.0, 11.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.36669921875, -8.1318359375, -7.89697265625, -7.662109375, -7.42724609375, -7.1923828125, -6.95751953125, -6.72265625, -6.48779296875, -6.2529296875, -6.01806640625, -5.783203125, -5.54833984375, -5.3134765625, -5.07861328125, -4.84375, -4.60888671875, -4.3740234375, -4.13916015625, -3.904296875, -3.66943359375, -3.4345703125, -3.19970703125, -2.96484375, -2.72998046875, -2.4951171875, -2.26025390625, -2.025390625, -1.79052734375, -1.5556640625, -1.32080078125, -1.0859375, -0.85107421875, -0.6162109375, -0.38134765625, -0.146484375, 0.08837890625, 0.3232421875, 0.55810546875, 0.79296875, 1.02783203125, 1.2626953125, 1.49755859375, 1.732421875, 1.96728515625, 2.2021484375, 2.43701171875, 2.671875, 2.90673828125, 3.1416015625, 3.37646484375, 3.611328125, 3.84619140625, 4.0810546875, 4.31591796875, 4.55078125, 4.78564453125, 5.0205078125, 5.25537109375, 5.490234375, 5.72509765625, 5.9599609375, 6.19482421875, 6.4296875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 9.0, 11.0, 16.0, 28.0, 39.0, 96.0, 216.0, 812.0, 6460.0, 3814228.0, 368257.0, 3177.0, 531.0, 188.0, 87.0, 35.0, 25.0, 21.0, 16.0, 11.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -8.7073974609375, -8.078857421875, -7.4503173828125, -6.82177734375, -6.1932373046875, -5.564697265625, -4.9361572265625, -4.3076171875, -3.6790771484375, -3.050537109375, -2.4219970703125, -1.79345703125, -1.1649169921875, -0.536376953125, 0.0921630859375, 0.720703125, 1.3492431640625, 1.977783203125, 2.6063232421875, 3.23486328125, 3.8634033203125, 4.491943359375, 5.1204833984375, 5.7490234375, 6.3775634765625, 7.006103515625, 7.6346435546875, 8.26318359375, 8.8917236328125, 9.520263671875, 10.1488037109375, 10.77734375, 11.4058837890625, 12.034423828125, 12.6629638671875, 13.29150390625, 13.9200439453125, 14.548583984375, 15.1771240234375, 15.8056640625, 16.4342041015625, 17.062744140625, 17.6912841796875, 18.31982421875, 18.9483642578125, 19.576904296875, 20.2054443359375, 20.833984375, 21.4625244140625, 22.091064453125, 22.7196044921875, 23.34814453125, 23.9766845703125, 24.605224609375, 25.2337646484375, 25.8623046875, 26.4908447265625, 27.119384765625, 27.7479248046875, 28.37646484375, 29.0050048828125, 29.633544921875, 30.2620849609375, 30.890625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 1.0, 6.0, 9.0, 12.0, 17.0, 30.0, 57.0, 148.0, 391.0, 825.0, 1164.0, 841.0, 323.0, 120.0, 50.0, 24.0, 17.0, 11.0, 7.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0], "bins": [-5.31640625, -5.208831787109375, -5.10125732421875, -4.993682861328125, -4.8861083984375, -4.778533935546875, -4.67095947265625, -4.563385009765625, -4.455810546875, -4.348236083984375, -4.24066162109375, -4.133087158203125, -4.0255126953125, -3.917938232421875, -3.81036376953125, -3.702789306640625, -3.59521484375, -3.487640380859375, -3.38006591796875, -3.272491455078125, -3.1649169921875, -3.057342529296875, -2.94976806640625, -2.842193603515625, -2.734619140625, -2.627044677734375, -2.51947021484375, -2.411895751953125, -2.3043212890625, -2.196746826171875, -2.08917236328125, -1.981597900390625, -1.8740234375, -1.766448974609375, -1.65887451171875, -1.551300048828125, -1.4437255859375, -1.336151123046875, -1.22857666015625, -1.121002197265625, -1.013427734375, -0.905853271484375, -0.79827880859375, -0.690704345703125, -0.5831298828125, -0.475555419921875, -0.36798095703125, -0.260406494140625, -0.15283203125, -0.045257568359375, 0.06231689453125, 0.169891357421875, 0.2774658203125, 0.385040283203125, 0.49261474609375, 0.600189208984375, 0.707763671875, 0.815338134765625, 0.92291259765625, 1.030487060546875, 1.1380615234375, 1.245635986328125, 1.35321044921875, 1.460784912109375, 1.568359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 12.0, 48.0, 141.0, 257.0, 275.0, 185.0, 58.0, 25.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.068758010864258, -24.513187408447266, -23.957616806030273, -23.40204620361328, -22.846473693847656, -22.290903091430664, -21.735332489013672, -21.17976188659668, -20.624191284179688, -20.068620681762695, -19.513050079345703, -18.95747947692871, -18.40190887451172, -17.846336364746094, -17.2907657623291, -16.73519515991211, -16.179624557495117, -15.624053955078125, -15.068483352661133, -14.512911796569824, -13.957341194152832, -13.40177059173584, -12.846199035644531, -12.290628433227539, -11.735057830810547, -11.179487228393555, -10.623916625976562, -10.068345069885254, -9.512774467468262, -8.95720386505127, -8.401632308959961, -7.846061706542969, -7.290489196777344, -6.734918594360352, -6.179347515106201, -5.623776435852051, -5.068205833435059, -4.512635231018066, -3.957064151763916, -3.4014933109283447, -2.8459224700927734, -2.290351629257202, -1.7347807884216309, -1.1792099475860596, -0.6236391067504883, -0.06806826591491699, 0.4875025749206543, 1.0430734157562256, 1.5986442565917969, 2.154215097427368, 2.7097859382629395, 3.2653567790985107, 3.820927619934082, 4.376498222351074, 4.932069301605225, 5.487640380859375, 6.043210983276367, 6.598781585693359, 7.15435266494751, 7.70992374420166, 8.265494346618652, 8.821064949035645, 9.376636505126953, 9.932207107543945, 10.487777709960938]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 14.0, 16.0, 28.0, 34.0, 52.0, 47.0, 66.0, 70.0, 65.0, 73.0, 69.0, 82.0, 83.0, 70.0, 47.0, 53.0, 30.0, 32.0, 27.0, 12.0, 14.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.076903343200684, -7.857119083404541, -7.637334823608398, -7.417551040649414, -7.1977667808532715, -6.977982521057129, -6.758198261260986, -6.538414001464844, -6.318630218505859, -6.098845958709717, -5.879061698913574, -5.65927791595459, -5.439493656158447, -5.219709396362305, -4.999925136566162, -4.7801408767700195, -4.560356616973877, -4.340572357177734, -4.120788097381592, -3.9010040760040283, -3.681220054626465, -3.4614357948303223, -3.2416515350341797, -3.021867275238037, -2.8020832538604736, -2.582298994064331, -2.3625149726867676, -2.142730712890625, -1.922946572303772, -1.703162431716919, -1.4833781719207764, -1.2635940313339233, -1.0438098907470703, -0.8240257501602173, -0.6042415499687195, -0.3844573497772217, -0.16467320919036865, 0.055110931396484375, 0.27489519119262695, 0.49467933177948, 0.714463472366333, 0.934247612953186, 1.154031753540039, 1.3738160133361816, 1.5936001539230347, 1.8133842945098877, 2.0331685543060303, 2.2529525756835938, 2.4727368354797363, 2.692521095275879, 2.9123051166534424, 3.132089376449585, 3.3518733978271484, 3.571657657623291, 3.7914419174194336, 4.011226177215576, 4.231010437011719, 4.450794696807861, 4.670578956604004, 4.890362739562988, 5.110146999359131, 5.329931259155273, 5.549715518951416, 5.769499778747559, 5.989283561706543]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 10.0, 7.0, 11.0, 17.0, 27.0, 54.0, 72.0, 145.0, 282.0, 909.0, 4714.0, 52500.0, 867522.0, 112425.0, 7822.0, 1243.0, 375.0, 188.0, 94.0, 55.0, 27.0, 26.0, 15.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.96405029296875, -1.8929443359375, -1.82183837890625, -1.750732421875, -1.67962646484375, -1.6085205078125, -1.53741455078125, -1.46630859375, -1.39520263671875, -1.3240966796875, -1.25299072265625, -1.181884765625, -1.11077880859375, -1.0396728515625, -0.96856689453125, -0.8974609375, -0.82635498046875, -0.7552490234375, -0.68414306640625, -0.613037109375, -0.54193115234375, -0.4708251953125, -0.39971923828125, -0.32861328125, -0.25750732421875, -0.1864013671875, -0.11529541015625, -0.044189453125, 0.02691650390625, 0.0980224609375, 0.16912841796875, 0.240234375, 0.31134033203125, 0.3824462890625, 0.45355224609375, 0.524658203125, 0.59576416015625, 0.6668701171875, 0.73797607421875, 0.80908203125, 0.88018798828125, 0.9512939453125, 1.02239990234375, 1.093505859375, 1.16461181640625, 1.2357177734375, 1.30682373046875, 1.3779296875, 1.44903564453125, 1.5201416015625, 1.59124755859375, 1.662353515625, 1.73345947265625, 1.8045654296875, 1.87567138671875, 1.94677734375, 2.01788330078125, 2.0889892578125, 2.16009521484375, 2.231201171875, 2.30230712890625, 2.3734130859375, 2.44451904296875, 2.515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 13.0, 12.0, 40.0, 49.0, 88.0, 98.0, 110.0, 119.0, 129.0, 109.0, 89.0, 54.0, 38.0, 35.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.27716064453125, -6.0504150390625, -5.82366943359375, -5.596923828125, -5.37017822265625, -5.1434326171875, -4.91668701171875, -4.68994140625, -4.46319580078125, -4.2364501953125, -4.00970458984375, -3.782958984375, -3.55621337890625, -3.3294677734375, -3.10272216796875, -2.8759765625, -2.64923095703125, -2.4224853515625, -2.19573974609375, -1.968994140625, -1.74224853515625, -1.5155029296875, -1.28875732421875, -1.06201171875, -0.83526611328125, -0.6085205078125, -0.38177490234375, -0.155029296875, 0.07171630859375, 0.2984619140625, 0.52520751953125, 0.751953125, 0.97869873046875, 1.2054443359375, 1.43218994140625, 1.658935546875, 1.88568115234375, 2.1124267578125, 2.33917236328125, 2.56591796875, 2.79266357421875, 3.0194091796875, 3.24615478515625, 3.472900390625, 3.69964599609375, 3.9263916015625, 4.15313720703125, 4.3798828125, 4.60662841796875, 4.8333740234375, 5.06011962890625, 5.286865234375, 5.51361083984375, 5.7403564453125, 5.96710205078125, 6.19384765625, 6.42059326171875, 6.6473388671875, 6.87408447265625, 7.100830078125, 7.32757568359375, 7.5543212890625, 7.78106689453125, 8.0078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 12.0, 18.0, 23.0, 47.0, 67.0, 119.0, 209.0, 433.0, 917.0, 2443.0, 7735.0, 33426.0, 199616.0, 668153.0, 106665.0, 20308.0, 5165.0, 1712.0, 694.0, 346.0, 184.0, 94.0, 67.0, 25.0, 25.0, 13.0, 13.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.197265625, -1.1643218994140625, -1.131378173828125, -1.0984344482421875, -1.06549072265625, -1.0325469970703125, -0.999603271484375, -0.9666595458984375, -0.9337158203125, -0.9007720947265625, -0.867828369140625, -0.8348846435546875, -0.80194091796875, -0.7689971923828125, -0.736053466796875, -0.7031097412109375, -0.670166015625, -0.6372222900390625, -0.604278564453125, -0.5713348388671875, -0.53839111328125, -0.5054473876953125, -0.472503662109375, -0.4395599365234375, -0.4066162109375, -0.3736724853515625, -0.340728759765625, -0.3077850341796875, -0.27484130859375, -0.2418975830078125, -0.208953857421875, -0.1760101318359375, -0.14306640625, -0.1101226806640625, -0.077178955078125, -0.0442352294921875, -0.01129150390625, 0.0216522216796875, 0.054595947265625, 0.0875396728515625, 0.1204833984375, 0.1534271240234375, 0.186370849609375, 0.2193145751953125, 0.25225830078125, 0.2852020263671875, 0.318145751953125, 0.3510894775390625, 0.384033203125, 0.4169769287109375, 0.449920654296875, 0.4828643798828125, 0.51580810546875, 0.5487518310546875, 0.581695556640625, 0.6146392822265625, 0.6475830078125, 0.6805267333984375, 0.713470458984375, 0.7464141845703125, 0.77935791015625, 0.8123016357421875, 0.845245361328125, 0.8781890869140625, 0.9111328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 8.0, 14.0, 16.0, 18.0, 23.0, 45.0, 31.0, 43.0, 60.0, 63.0, 50.0, 79.0, 84.0, 60.0, 65.0, 61.0, 52.0, 42.0, 49.0, 47.0, 22.0, 12.0, 21.0, 15.0, 11.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3046875, -10.03167724609375, -9.7586669921875, -9.48565673828125, -9.212646484375, -8.93963623046875, -8.6666259765625, -8.39361572265625, -8.12060546875, -7.84759521484375, -7.5745849609375, -7.30157470703125, -7.028564453125, -6.75555419921875, -6.4825439453125, -6.20953369140625, -5.9365234375, -5.66351318359375, -5.3905029296875, -5.11749267578125, -4.844482421875, -4.57147216796875, -4.2984619140625, -4.02545166015625, -3.75244140625, -3.47943115234375, -3.2064208984375, -2.93341064453125, -2.660400390625, -2.38739013671875, -2.1143798828125, -1.84136962890625, -1.568359375, -1.29534912109375, -1.0223388671875, -0.74932861328125, -0.476318359375, -0.20330810546875, 0.0697021484375, 0.34271240234375, 0.61572265625, 0.88873291015625, 1.1617431640625, 1.43475341796875, 1.707763671875, 1.98077392578125, 2.2537841796875, 2.52679443359375, 2.7998046875, 3.07281494140625, 3.3458251953125, 3.61883544921875, 3.891845703125, 4.16485595703125, 4.4378662109375, 4.71087646484375, 4.98388671875, 5.25689697265625, 5.5299072265625, 5.80291748046875, 6.075927734375, 6.34893798828125, 6.6219482421875, 6.89495849609375, 7.16796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 1.0, 5.0, 8.0, 17.0, 25.0, 39.0, 61.0, 116.0, 151.0, 240.0, 435.0, 876.0, 1840.0, 4474.0, 12957.0, 53303.0, 329408.0, 522848.0, 91030.0, 19811.0, 6128.0, 2388.0, 1081.0, 524.0, 307.0, 176.0, 115.0, 63.0, 34.0, 30.0, 18.0, 14.0, 5.0, 10.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1109619140625, -0.10751152038574219, -0.10406112670898438, -0.10061073303222656, -0.09716033935546875, -0.09370994567871094, -0.09025955200195312, -0.08680915832519531, -0.0833587646484375, -0.07990837097167969, -0.07645797729492188, -0.07300758361816406, -0.06955718994140625, -0.06610679626464844, -0.06265640258789062, -0.05920600891113281, -0.055755615234375, -0.05230522155761719, -0.048854827880859375, -0.04540443420410156, -0.04195404052734375, -0.03850364685058594, -0.035053253173828125, -0.03160285949707031, -0.0281524658203125, -0.024702072143554688, -0.021251678466796875, -0.017801284790039062, -0.01435089111328125, -0.010900497436523438, -0.007450103759765625, -0.0039997100830078125, -0.00054931640625, 0.0029010772705078125, 0.006351470947265625, 0.009801864624023438, 0.01325225830078125, 0.016702651977539062, 0.020153045654296875, 0.023603439331054688, 0.0270538330078125, 0.030504226684570312, 0.033954620361328125, 0.03740501403808594, 0.04085540771484375, 0.04430580139160156, 0.047756195068359375, 0.05120658874511719, 0.054656982421875, 0.05810737609863281, 0.061557769775390625, 0.06500816345214844, 0.06845855712890625, 0.07190895080566406, 0.07535934448242188, 0.07880973815917969, 0.0822601318359375, 0.08571052551269531, 0.08916091918945312, 0.09261131286621094, 0.09606170654296875, 0.09951210021972656, 0.10296249389648438, 0.10641288757324219, 0.10986328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 12.0, 3.0, 9.0, 18.0, 24.0, 17.0, 31.0, 43.0, 68.0, 76.0, 96.0, 105.0, 96.0, 91.0, 70.0, 53.0, 35.0, 35.0, 28.0, 23.0, 17.0, 8.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.364418029785156e-05, -5.190353840589523e-05, -5.0162896513938904e-05, -4.8422254621982574e-05, -4.6681612730026245e-05, -4.4940970838069916e-05, -4.3200328946113586e-05, -4.145968705415726e-05, -3.971904516220093e-05, -3.79784032702446e-05, -3.623776137828827e-05, -3.449711948633194e-05, -3.275647759437561e-05, -3.101583570241928e-05, -2.927519381046295e-05, -2.7534551918506622e-05, -2.5793910026550293e-05, -2.4053268134593964e-05, -2.2312626242637634e-05, -2.0571984350681305e-05, -1.8831342458724976e-05, -1.7090700566768646e-05, -1.5350058674812317e-05, -1.3609416782855988e-05, -1.1868774890899658e-05, -1.0128132998943329e-05, -8.387491106987e-06, -6.64684921503067e-06, -4.906207323074341e-06, -3.1655654311180115e-06, -1.4249235391616821e-06, 3.157183527946472e-07, 2.0563602447509766e-06, 3.797002136707306e-06, 5.537644028663635e-06, 7.278285920619965e-06, 9.018927812576294e-06, 1.0759569704532623e-05, 1.2500211596488953e-05, 1.4240853488445282e-05, 1.598149538040161e-05, 1.772213727235794e-05, 1.946277916431427e-05, 2.12034210562706e-05, 2.294406294822693e-05, 2.4684704840183258e-05, 2.6425346732139587e-05, 2.8165988624095917e-05, 2.9906630516052246e-05, 3.1647272408008575e-05, 3.3387914299964905e-05, 3.5128556191921234e-05, 3.6869198083877563e-05, 3.860983997583389e-05, 4.035048186779022e-05, 4.209112375974655e-05, 4.383176565170288e-05, 4.557240754365921e-05, 4.731304943561554e-05, 4.905369132757187e-05, 5.07943332195282e-05, 5.253497511148453e-05, 5.427561700344086e-05, 5.6016258895397186e-05, 5.7756900787353516e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 3.0, 4.0, 10.0, 14.0, 22.0, 18.0, 30.0, 33.0, 62.0, 95.0, 200.0, 357.0, 821.0, 2061.0, 6942.0, 32175.0, 322527.0, 608375.0, 59254.0, 10455.0, 2941.0, 1112.0, 447.0, 211.0, 120.0, 83.0, 46.0, 26.0, 25.0, 15.0, 12.0, 11.0, 11.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11669921875, -0.11240196228027344, -0.10810470581054688, -0.10380744934082031, -0.09951019287109375, -0.09521293640136719, -0.09091567993164062, -0.08661842346191406, -0.0823211669921875, -0.07802391052246094, -0.07372665405273438, -0.06942939758300781, -0.06513214111328125, -0.06083488464355469, -0.056537628173828125, -0.05224037170410156, -0.047943115234375, -0.04364585876464844, -0.039348602294921875, -0.03505134582519531, -0.03075408935546875, -0.026456832885742188, -0.022159576416015625, -0.017862319946289062, -0.0135650634765625, -0.009267807006835938, -0.004970550537109375, -0.0006732940673828125, 0.00362396240234375, 0.007921218872070312, 0.012218475341796875, 0.016515731811523438, 0.02081298828125, 0.025110244750976562, 0.029407501220703125, 0.03370475769042969, 0.03800201416015625, 0.04229927062988281, 0.046596527099609375, 0.05089378356933594, 0.0551910400390625, 0.05948829650878906, 0.06378555297851562, 0.06808280944824219, 0.07238006591796875, 0.07667732238769531, 0.08097457885742188, 0.08527183532714844, 0.089569091796875, 0.09386634826660156, 0.09816360473632812, 0.10246086120605469, 0.10675811767578125, 0.11105537414550781, 0.11535263061523438, 0.11964988708496094, 0.1239471435546875, 0.12824440002441406, 0.13254165649414062, 0.1368389129638672, 0.14113616943359375, 0.1454334259033203, 0.14973068237304688, 0.15402793884277344, 0.1583251953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 4.0, 6.0, 7.0, 12.0, 10.0, 28.0, 24.0, 34.0, 38.0, 65.0, 87.0, 113.0, 118.0, 91.0, 73.0, 78.0, 47.0, 47.0, 21.0, 18.0, 14.0, 13.0, 14.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02777099609375, -0.02675628662109375, -0.0257415771484375, -0.02472686767578125, -0.023712158203125, -0.02269744873046875, -0.0216827392578125, -0.02066802978515625, -0.0196533203125, -0.01863861083984375, -0.0176239013671875, -0.01660919189453125, -0.015594482421875, -0.01457977294921875, -0.0135650634765625, -0.01255035400390625, -0.01153564453125, -0.01052093505859375, -0.0095062255859375, -0.00849151611328125, -0.007476806640625, -0.00646209716796875, -0.0054473876953125, -0.00443267822265625, -0.00341796875, -0.00240325927734375, -0.0013885498046875, -0.00037384033203125, 0.000640869140625, 0.00165557861328125, 0.0026702880859375, 0.00368499755859375, 0.00469970703125, 0.00571441650390625, 0.0067291259765625, 0.00774383544921875, 0.008758544921875, 0.00977325439453125, 0.0107879638671875, 0.01180267333984375, 0.0128173828125, 0.01383209228515625, 0.0148468017578125, 0.01586151123046875, 0.016876220703125, 0.01789093017578125, 0.0189056396484375, 0.01992034912109375, 0.02093505859375, 0.02194976806640625, 0.0229644775390625, 0.02397918701171875, 0.024993896484375, 0.02600860595703125, 0.0270233154296875, 0.02803802490234375, 0.029052734375, 0.03006744384765625, 0.0310821533203125, 0.03209686279296875, 0.033111572265625, 0.03412628173828125, 0.0351409912109375, 0.03615570068359375, 0.03717041015625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 18.0, 278.0, 622.0, 93.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-45.268070220947266, -44.449100494384766, -43.630130767822266, -42.81116485595703, -41.99219512939453, -41.17322540283203, -40.35425567626953, -39.53528594970703, -38.7163200378418, -37.8973503112793, -37.0783805847168, -36.25941467285156, -35.44044494628906, -34.62147521972656, -33.80250549316406, -32.98353576660156, -32.16456604003906, -31.345596313476562, -30.526628494262695, -29.707658767700195, -28.888690948486328, -28.069721221923828, -27.250751495361328, -26.43178367614746, -25.612815856933594, -24.793846130371094, -23.974878311157227, -23.155908584594727, -22.33694076538086, -21.51797103881836, -20.69900131225586, -19.880033493041992, -19.061065673828125, -18.242095947265625, -17.423128128051758, -16.604158401489258, -15.78519058227539, -14.96622085571289, -14.147252082824707, -13.328283309936523, -12.509313583374023, -11.69034481048584, -10.871376037597656, -10.052406311035156, -9.233438491821289, -8.414468765258789, -7.5954999923706055, -6.776531219482422, -5.957562446594238, -5.138593673706055, -4.319624900817871, -3.5006556510925293, -2.6816868782043457, -1.862718105316162, -1.0437488555908203, -0.22478008270263672, 0.5941886901855469, 1.41315758228302, 2.232126474380493, 3.051095485687256, 3.8700642585754395, 4.689033031463623, 5.508002281188965, 6.326971054077148, 7.145939826965332]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 10.0, 11.0, 16.0, 39.0, 52.0, 71.0, 94.0, 95.0, 94.0, 100.0, 113.0, 102.0, 61.0, 52.0, 39.0, 28.0, 16.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.441736221313477, -6.247007369995117, -6.0522780418396, -5.85754919052124, -5.662819862365723, -5.468091011047363, -5.273362159729004, -5.078632831573486, -4.883903503417969, -4.689174652099609, -4.494445323944092, -4.299716472625732, -4.104987144470215, -3.9102582931518555, -3.715529203414917, -3.5208001136779785, -3.326071262359619, -3.1313421726226807, -2.936613082885742, -2.741884231567383, -2.5471549034118652, -2.352426052093506, -2.1576969623565674, -1.962967872619629, -1.7682387828826904, -1.573509693145752, -1.3787806034088135, -1.1840516328811646, -0.9893225431442261, -0.7945934534072876, -0.5998644828796387, -0.4051353931427002, -0.21040582656860352, -0.015676766633987427, 0.17905229330062866, 0.37378132343292236, 0.5685104131698608, 0.7632395029067993, 0.9579684734344482, 1.1526975631713867, 1.3474266529083252, 1.5421557426452637, 1.7368848323822021, 1.931613802909851, 2.1263427734375, 2.3210721015930176, 2.515800952911377, 2.7105300426483154, 2.905259132385254, 3.0999882221221924, 3.294717311859131, 3.4894461631774902, 3.684175491333008, 3.878904342651367, 4.073633193969727, 4.268362522125244, 4.463091850280762, 4.657820701599121, 4.852550029754639, 5.047278881072998, 5.242008209228516, 5.436737060546875, 5.631465911865234, 5.826195240020752, 6.020924091339111]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 11.0, 20.0, 25.0, 44.0, 55.0, 100.0, 180.0, 304.0, 591.0, 1461.0, 5210.0, 24127.0, 135245.0, 684486.0, 159447.0, 28212.0, 6013.0, 1640.0, 619.0, 304.0, 167.0, 113.0, 60.0, 43.0, 25.0, 17.0, 13.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.396484375, -3.263519287109375, -3.13055419921875, -2.997589111328125, -2.8646240234375, -2.731658935546875, -2.59869384765625, -2.465728759765625, -2.332763671875, -2.199798583984375, -2.06683349609375, -1.933868408203125, -1.8009033203125, -1.667938232421875, -1.53497314453125, -1.402008056640625, -1.26904296875, -1.136077880859375, -1.00311279296875, -0.870147705078125, -0.7371826171875, -0.604217529296875, -0.47125244140625, -0.338287353515625, -0.205322265625, -0.072357177734375, 0.06060791015625, 0.193572998046875, 0.3265380859375, 0.459503173828125, 0.59246826171875, 0.725433349609375, 0.8583984375, 0.991363525390625, 1.12432861328125, 1.257293701171875, 1.3902587890625, 1.523223876953125, 1.65618896484375, 1.789154052734375, 1.922119140625, 2.055084228515625, 2.18804931640625, 2.321014404296875, 2.4539794921875, 2.586944580078125, 2.71990966796875, 2.852874755859375, 2.98583984375, 3.118804931640625, 3.25177001953125, 3.384735107421875, 3.5177001953125, 3.650665283203125, 3.78363037109375, 3.916595458984375, 4.049560546875, 4.182525634765625, 4.31549072265625, 4.448455810546875, 4.5814208984375, 4.714385986328125, 4.84735107421875, 4.980316162109375, 5.11328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 13.0, 9.0, 19.0, 28.0, 35.0, 44.0, 59.0, 61.0, 72.0, 78.0, 93.0, 71.0, 83.0, 73.0, 69.0, 46.0, 38.0, 39.0, 27.0, 17.0, 10.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.575927734375, -9.29248046875, -9.009033203125, -8.7255859375, -8.442138671875, -8.15869140625, -7.875244140625, -7.591796875, -7.308349609375, -7.02490234375, -6.741455078125, -6.4580078125, -6.174560546875, -5.89111328125, -5.607666015625, -5.32421875, -5.040771484375, -4.75732421875, -4.473876953125, -4.1904296875, -3.906982421875, -3.62353515625, -3.340087890625, -3.056640625, -2.773193359375, -2.48974609375, -2.206298828125, -1.9228515625, -1.639404296875, -1.35595703125, -1.072509765625, -0.7890625, -0.505615234375, -0.22216796875, 0.061279296875, 0.3447265625, 0.628173828125, 0.91162109375, 1.195068359375, 1.478515625, 1.761962890625, 2.04541015625, 2.328857421875, 2.6123046875, 2.895751953125, 3.17919921875, 3.462646484375, 3.74609375, 4.029541015625, 4.31298828125, 4.596435546875, 4.8798828125, 5.163330078125, 5.44677734375, 5.730224609375, 6.013671875, 6.297119140625, 6.58056640625, 6.864013671875, 7.1474609375, 7.430908203125, 7.71435546875, 7.997802734375, 8.28125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 8.0, 9.0, 13.0, 22.0, 21.0, 60.0, 75.0, 130.0, 239.0, 506.0, 1633.0, 99295.0, 940895.0, 4208.0, 703.0, 324.0, 150.0, 89.0, 58.0, 30.0, 35.0, 20.0, 7.0, 12.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.6640625, -15.1619873046875, -14.659912109375, -14.1578369140625, -13.65576171875, -13.1536865234375, -12.651611328125, -12.1495361328125, -11.6474609375, -11.1453857421875, -10.643310546875, -10.1412353515625, -9.63916015625, -9.1370849609375, -8.635009765625, -8.1329345703125, -7.630859375, -7.1287841796875, -6.626708984375, -6.1246337890625, -5.62255859375, -5.1204833984375, -4.618408203125, -4.1163330078125, -3.6142578125, -3.1121826171875, -2.610107421875, -2.1080322265625, -1.60595703125, -1.1038818359375, -0.601806640625, -0.0997314453125, 0.40234375, 0.9044189453125, 1.406494140625, 1.9085693359375, 2.41064453125, 2.9127197265625, 3.414794921875, 3.9168701171875, 4.4189453125, 4.9210205078125, 5.423095703125, 5.9251708984375, 6.42724609375, 6.9293212890625, 7.431396484375, 7.9334716796875, 8.435546875, 8.9376220703125, 9.439697265625, 9.9417724609375, 10.44384765625, 10.9459228515625, 11.447998046875, 11.9500732421875, 12.4521484375, 12.9542236328125, 13.456298828125, 13.9583740234375, 14.46044921875, 14.9625244140625, 15.464599609375, 15.9666748046875, 16.46875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 11.0, 18.0, 24.0, 39.0, 52.0, 66.0, 101.0, 119.0, 113.0, 126.0, 104.0, 71.0, 51.0, 42.0, 22.0, 13.0, 13.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.53125, -15.005126953125, -14.47900390625, -13.952880859375, -13.4267578125, -12.900634765625, -12.37451171875, -11.848388671875, -11.322265625, -10.796142578125, -10.27001953125, -9.743896484375, -9.2177734375, -8.691650390625, -8.16552734375, -7.639404296875, -7.11328125, -6.587158203125, -6.06103515625, -5.534912109375, -5.0087890625, -4.482666015625, -3.95654296875, -3.430419921875, -2.904296875, -2.378173828125, -1.85205078125, -1.325927734375, -0.7998046875, -0.273681640625, 0.25244140625, 0.778564453125, 1.3046875, 1.830810546875, 2.35693359375, 2.883056640625, 3.4091796875, 3.935302734375, 4.46142578125, 4.987548828125, 5.513671875, 6.039794921875, 6.56591796875, 7.092041015625, 7.6181640625, 8.144287109375, 8.67041015625, 9.196533203125, 9.72265625, 10.248779296875, 10.77490234375, 11.301025390625, 11.8271484375, 12.353271484375, 12.87939453125, 13.405517578125, 13.931640625, 14.457763671875, 14.98388671875, 15.510009765625, 16.0361328125, 16.562255859375, 17.08837890625, 17.614501953125, 18.140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 8.0, 8.0, 8.0, 20.0, 39.0, 59.0, 136.0, 407.0, 1830.0, 82292.0, 959274.0, 3510.0, 604.0, 172.0, 58.0, 42.0, 21.0, 21.0, 6.0, 5.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.9140625, -5.70416259765625, -5.4942626953125, -5.28436279296875, -5.074462890625, -4.86456298828125, -4.6546630859375, -4.44476318359375, -4.23486328125, -4.02496337890625, -3.8150634765625, -3.60516357421875, -3.395263671875, -3.18536376953125, -2.9754638671875, -2.76556396484375, -2.5556640625, -2.34576416015625, -2.1358642578125, -1.92596435546875, -1.716064453125, -1.50616455078125, -1.2962646484375, -1.08636474609375, -0.87646484375, -0.66656494140625, -0.4566650390625, -0.24676513671875, -0.036865234375, 0.17303466796875, 0.3829345703125, 0.59283447265625, 0.802734375, 1.01263427734375, 1.2225341796875, 1.43243408203125, 1.642333984375, 1.85223388671875, 2.0621337890625, 2.27203369140625, 2.48193359375, 2.69183349609375, 2.9017333984375, 3.11163330078125, 3.321533203125, 3.53143310546875, 3.7413330078125, 3.95123291015625, 4.1611328125, 4.37103271484375, 4.5809326171875, 4.79083251953125, 5.000732421875, 5.21063232421875, 5.4205322265625, 5.63043212890625, 5.84033203125, 6.05023193359375, 6.2601318359375, 6.47003173828125, 6.679931640625, 6.88983154296875, 7.0997314453125, 7.30963134765625, 7.51953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 12.0, 17.0, 36.0, 55.0, 94.0, 164.0, 321.0, 141.0, 66.0, 42.0, 22.0, 19.0, 5.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004944801330566406, -0.000481627881526947, -0.0004687756299972534, -0.0004559233784675598, -0.0004430711269378662, -0.0004302188754081726, -0.000417366623878479, -0.0004045143723487854, -0.0003916621208190918, -0.0003788098692893982, -0.0003659576177597046, -0.000353105366230011, -0.0003402531147003174, -0.0003274008631706238, -0.0003145486116409302, -0.00030169636011123657, -0.00028884410858154297, -0.00027599185705184937, -0.00026313960552215576, -0.00025028735399246216, -0.00023743510246276855, -0.00022458285093307495, -0.00021173059940338135, -0.00019887834787368774, -0.00018602609634399414, -0.00017317384481430054, -0.00016032159328460693, -0.00014746934175491333, -0.00013461709022521973, -0.00012176483869552612, -0.00010891258716583252, -9.606033563613892e-05, -8.320808410644531e-05, -7.035583257675171e-05, -5.7503581047058105e-05, -4.46513295173645e-05, -3.17990779876709e-05, -1.8946826457977295e-05, -6.094574928283691e-06, 6.757676601409912e-06, 1.9609928131103516e-05, 3.246217966079712e-05, 4.531443119049072e-05, 5.8166682720184326e-05, 7.101893424987793e-05, 8.387118577957153e-05, 9.672343730926514e-05, 0.00010957568883895874, 0.00012242794036865234, 0.00013528019189834595, 0.00014813244342803955, 0.00016098469495773315, 0.00017383694648742676, 0.00018668919801712036, 0.00019954144954681396, 0.00021239370107650757, 0.00022524595260620117, 0.00023809820413589478, 0.0002509504556655884, 0.000263802707195282, 0.0002766549587249756, 0.0002895072102546692, 0.0003023594617843628, 0.0003152117133140564, 0.00032806396484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 2.0, 3.0, 7.0, 3.0, 4.0, 4.0, 11.0, 14.0, 26.0, 38.0, 78.0, 147.0, 354.0, 841.0, 2868.0, 87413.0, 947684.0, 6594.0, 1377.0, 555.0, 273.0, 109.0, 53.0, 26.0, 13.0, 9.0, 8.0, 10.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.44921875, -7.2542724609375, -7.059326171875, -6.8643798828125, -6.66943359375, -6.4744873046875, -6.279541015625, -6.0845947265625, -5.8896484375, -5.6947021484375, -5.499755859375, -5.3048095703125, -5.10986328125, -4.9149169921875, -4.719970703125, -4.5250244140625, -4.330078125, -4.1351318359375, -3.940185546875, -3.7452392578125, -3.55029296875, -3.3553466796875, -3.160400390625, -2.9654541015625, -2.7705078125, -2.5755615234375, -2.380615234375, -2.1856689453125, -1.99072265625, -1.7957763671875, -1.600830078125, -1.4058837890625, -1.2109375, -1.0159912109375, -0.821044921875, -0.6260986328125, -0.43115234375, -0.2362060546875, -0.041259765625, 0.1536865234375, 0.3486328125, 0.5435791015625, 0.738525390625, 0.9334716796875, 1.12841796875, 1.3233642578125, 1.518310546875, 1.7132568359375, 1.908203125, 2.1031494140625, 2.298095703125, 2.4930419921875, 2.68798828125, 2.8829345703125, 3.077880859375, 3.2728271484375, 3.4677734375, 3.6627197265625, 3.857666015625, 4.0526123046875, 4.24755859375, 4.4425048828125, 4.637451171875, 4.8323974609375, 5.02734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 17.0, 22.0, 53.0, 86.0, 179.0, 343.0, 135.0, 68.0, 48.0, 16.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.728515625, -1.66021728515625, -1.5919189453125, -1.52362060546875, -1.455322265625, -1.38702392578125, -1.3187255859375, -1.25042724609375, -1.18212890625, -1.11383056640625, -1.0455322265625, -0.97723388671875, -0.908935546875, -0.84063720703125, -0.7723388671875, -0.70404052734375, -0.6357421875, -0.56744384765625, -0.4991455078125, -0.43084716796875, -0.362548828125, -0.29425048828125, -0.2259521484375, -0.15765380859375, -0.08935546875, -0.02105712890625, 0.0472412109375, 0.11553955078125, 0.183837890625, 0.25213623046875, 0.3204345703125, 0.38873291015625, 0.45703125, 0.52532958984375, 0.5936279296875, 0.66192626953125, 0.730224609375, 0.79852294921875, 0.8668212890625, 0.93511962890625, 1.00341796875, 1.07171630859375, 1.1400146484375, 1.20831298828125, 1.276611328125, 1.34490966796875, 1.4132080078125, 1.48150634765625, 1.5498046875, 1.61810302734375, 1.6864013671875, 1.75469970703125, 1.822998046875, 1.89129638671875, 1.9595947265625, 2.02789306640625, 2.09619140625, 2.16448974609375, 2.2327880859375, 2.30108642578125, 2.369384765625, 2.43768310546875, 2.5059814453125, 2.57427978515625, 2.642578125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 12.0, 73.0, 355.0, 422.0, 130.0, 12.0, 5.0, 0.0, 0.0, 5.0], "bins": [-64.74862670898438, -63.614410400390625, -62.480194091796875, -61.345977783203125, -60.211761474609375, -59.077545166015625, -57.943328857421875, -56.809112548828125, -55.674896240234375, -54.540679931640625, -53.406463623046875, -52.272247314453125, -51.138031005859375, -50.003814697265625, -48.869598388671875, -47.735382080078125, -46.601165771484375, -45.466949462890625, -44.332733154296875, -43.198516845703125, -42.064300537109375, -40.930084228515625, -39.795867919921875, -38.661651611328125, -37.52743911743164, -36.39322280883789, -35.25900650024414, -34.12479019165039, -32.99057388305664, -31.85635757446289, -30.72214126586914, -29.58792495727539, -28.45370864868164, -27.31949234008789, -26.18527603149414, -25.05105972290039, -23.91684341430664, -22.78262710571289, -21.64841079711914, -20.51419448852539, -19.37997817993164, -18.24576187133789, -17.11154556274414, -15.97732925415039, -14.84311294555664, -13.70889663696289, -12.574681282043457, -11.440464973449707, -10.306248664855957, -9.172032356262207, -8.037816047668457, -6.903600215911865, -5.769383907318115, -4.635167598724365, -3.5009517669677734, -2.3667354583740234, -1.2325191497802734, -0.09830296039581299, 1.0359132289886475, 2.1701292991638184, 3.3043456077575684, 4.438561916351318, 5.57277774810791, 6.70699405670166, 7.84121036529541]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 8.0, 7.0, 5.0, 7.0, 8.0, 13.0, 17.0, 11.0, 25.0, 19.0, 28.0, 19.0, 29.0, 43.0, 45.0, 38.0, 45.0, 58.0, 43.0, 37.0, 50.0, 55.0, 49.0, 44.0, 41.0, 44.0, 29.0, 32.0, 22.0, 28.0, 22.0, 24.0, 10.0, 18.0, 7.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.950607299804688, -10.579919815063477, -10.209232330322266, -9.838544845581055, -9.467857360839844, -9.097168922424316, -8.726481437683105, -8.355793952941895, -7.985106468200684, -7.614418983459473, -7.243731498718262, -6.873043537139893, -6.502356052398682, -6.131668567657471, -5.760980606079102, -5.390293121337891, -5.01960563659668, -4.648918151855469, -4.278230667114258, -3.9075427055358887, -3.5368552207946777, -3.166167736053467, -2.7954800128936768, -2.4247922897338867, -2.054104804992676, -1.6834172010421753, -1.3127295970916748, -0.9420419931411743, -0.5713543891906738, -0.20066678524017334, 0.17002081871032715, 0.5407085418701172, 0.9113950729370117, 1.2820826768875122, 1.6527702808380127, 2.0234580039978027, 2.3941454887390137, 2.7648329734802246, 3.1355206966400146, 3.5062084197998047, 3.8768959045410156, 4.247583389282227, 4.6182708740234375, 4.988958835601807, 5.359646320343018, 5.7303338050842285, 6.101021766662598, 6.471709251403809, 6.8423967361450195, 7.2130842208862305, 7.583771705627441, 7.9544596672058105, 8.32514762878418, 8.69583511352539, 9.066522598266602, 9.437210083007812, 9.807897567749023, 10.178585052490234, 10.549272537231445, 10.919960021972656, 11.290647506713867, 11.661335945129395, 12.032023429870605, 12.402710914611816, 12.773398399353027]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 11.0, 12.0, 3.0, 22.0, 23.0, 29.0, 43.0, 56.0, 69.0, 106.0, 310.0, 1667.0, 93270.0, 4087925.0, 9781.0, 453.0, 171.0, 98.0, 52.0, 41.0, 40.0, 22.0, 18.0, 14.0, 16.0, 10.0, 9.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.609375, -16.9140625, -16.21875, -15.5234375, -14.828125, -14.1328125, -13.4375, -12.7421875, -12.046875, -11.3515625, -10.65625, -9.9609375, -9.265625, -8.5703125, -7.875, -7.1796875, -6.484375, -5.7890625, -5.09375, -4.3984375, -3.703125, -3.0078125, -2.3125, -1.6171875, -0.921875, -0.2265625, 0.46875, 1.1640625, 1.859375, 2.5546875, 3.25, 3.9453125, 4.640625, 5.3359375, 6.03125, 6.7265625, 7.421875, 8.1171875, 8.8125, 9.5078125, 10.203125, 10.8984375, 11.59375, 12.2890625, 12.984375, 13.6796875, 14.375, 15.0703125, 15.765625, 16.4609375, 17.15625, 17.8515625, 18.546875, 19.2421875, 19.9375, 20.6328125, 21.328125, 22.0234375, 22.71875, 23.4140625, 24.109375, 24.8046875, 25.5, 26.1953125, 26.890625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 14.0, 9.0, 27.0, 46.0, 69.0, 75.0, 91.0, 115.0, 103.0, 122.0, 82.0, 82.0, 70.0, 32.0, 29.0, 32.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1015625, -6.8441162109375, -6.586669921875, -6.3292236328125, -6.07177734375, -5.8143310546875, -5.556884765625, -5.2994384765625, -5.0419921875, -4.7845458984375, -4.527099609375, -4.2696533203125, -4.01220703125, -3.7547607421875, -3.497314453125, -3.2398681640625, -2.982421875, -2.7249755859375, -2.467529296875, -2.2100830078125, -1.95263671875, -1.6951904296875, -1.437744140625, -1.1802978515625, -0.9228515625, -0.6654052734375, -0.407958984375, -0.1505126953125, 0.10693359375, 0.3643798828125, 0.621826171875, 0.8792724609375, 1.13671875, 1.3941650390625, 1.651611328125, 1.9090576171875, 2.16650390625, 2.4239501953125, 2.681396484375, 2.9388427734375, 3.1962890625, 3.4537353515625, 3.711181640625, 3.9686279296875, 4.22607421875, 4.4835205078125, 4.740966796875, 4.9984130859375, 5.255859375, 5.5133056640625, 5.770751953125, 6.0281982421875, 6.28564453125, 6.5430908203125, 6.800537109375, 7.0579833984375, 7.3154296875, 7.5728759765625, 7.830322265625, 8.0877685546875, 8.34521484375, 8.6026611328125, 8.860107421875, 9.1175537109375, 9.375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 9.0, 11.0, 30.0, 98.0, 403.0, 3898.0, 4173320.0, 15695.0, 617.0, 125.0, 42.0, 12.0, 12.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.847412109375, -43.81982421875, -42.792236328125, -41.7646484375, -40.737060546875, -39.70947265625, -38.681884765625, -37.654296875, -36.626708984375, -35.59912109375, -34.571533203125, -33.5439453125, -32.516357421875, -31.48876953125, -30.461181640625, -29.43359375, -28.406005859375, -27.37841796875, -26.350830078125, -25.3232421875, -24.295654296875, -23.26806640625, -22.240478515625, -21.212890625, -20.185302734375, -19.15771484375, -18.130126953125, -17.1025390625, -16.074951171875, -15.04736328125, -14.019775390625, -12.9921875, -11.964599609375, -10.93701171875, -9.909423828125, -8.8818359375, -7.854248046875, -6.82666015625, -5.799072265625, -4.771484375, -3.743896484375, -2.71630859375, -1.688720703125, -0.6611328125, 0.366455078125, 1.39404296875, 2.421630859375, 3.44921875, 4.476806640625, 5.50439453125, 6.531982421875, 7.5595703125, 8.587158203125, 9.61474609375, 10.642333984375, 11.669921875, 12.697509765625, 13.72509765625, 14.752685546875, 15.7802734375, 16.807861328125, 17.83544921875, 18.863037109375, 19.890625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 8.0, 20.0, 52.0, 115.0, 487.0, 1522.0, 1333.0, 391.0, 92.0, 32.0, 14.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.802734375, -2.646087646484375, -2.48944091796875, -2.332794189453125, -2.1761474609375, -2.019500732421875, -1.86285400390625, -1.706207275390625, -1.549560546875, -1.392913818359375, -1.23626708984375, -1.079620361328125, -0.9229736328125, -0.766326904296875, -0.60968017578125, -0.453033447265625, -0.29638671875, -0.139739990234375, 0.01690673828125, 0.173553466796875, 0.3302001953125, 0.486846923828125, 0.64349365234375, 0.800140380859375, 0.956787109375, 1.113433837890625, 1.27008056640625, 1.426727294921875, 1.5833740234375, 1.740020751953125, 1.89666748046875, 2.053314208984375, 2.2099609375, 2.366607666015625, 2.52325439453125, 2.679901123046875, 2.8365478515625, 2.993194580078125, 3.14984130859375, 3.306488037109375, 3.463134765625, 3.619781494140625, 3.77642822265625, 3.933074951171875, 4.0897216796875, 4.246368408203125, 4.40301513671875, 4.559661865234375, 4.71630859375, 4.872955322265625, 5.02960205078125, 5.186248779296875, 5.3428955078125, 5.499542236328125, 5.65618896484375, 5.812835693359375, 5.969482421875, 6.126129150390625, 6.28277587890625, 6.439422607421875, 6.5960693359375, 6.752716064453125, 6.90936279296875, 7.066009521484375, 7.22265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 22.0, 54.0, 116.0, 208.0, 249.0, 186.0, 96.0, 47.0, 17.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.764955520629883, -13.3389892578125, -12.913022994995117, -12.48705768585205, -12.061091423034668, -11.635125160217285, -11.209159851074219, -10.783193588256836, -10.357227325439453, -9.93126106262207, -9.505294799804688, -9.079329490661621, -8.653363227844238, -8.227396965026855, -7.801431179046631, -7.375465393066406, -6.949499130249023, -6.523532867431641, -6.097567081451416, -5.671601295471191, -5.245635032653809, -4.819668769836426, -4.393702983856201, -3.9677369594573975, -3.5417709350585938, -3.11580491065979, -2.6898388862609863, -2.2638728618621826, -1.837906837463379, -1.4119408130645752, -0.9859747886657715, -0.5600087642669678, -0.13404369354248047, 0.29192233085632324, 0.717888355255127, 1.1438543796539307, 1.5698204040527344, 1.995786428451538, 2.421752452850342, 2.8477184772491455, 3.273684501647949, 3.699650526046753, 4.125616550445557, 4.551582336425781, 4.977548599243164, 5.403514862060547, 5.8294806480407715, 6.255446434020996, 6.681412696838379, 7.107378959655762, 7.533344745635986, 7.959310531616211, 8.385276794433594, 8.811243057250977, 9.23720932006836, 9.663174629211426, 10.089140892028809, 10.515107154846191, 10.941072463989258, 11.36703872680664, 11.793004989624023, 12.218971252441406, 12.644937515258789, 13.070902824401855, 13.496869087219238]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 11.0, 5.0, 15.0, 10.0, 12.0, 19.0, 27.0, 44.0, 35.0, 48.0, 46.0, 59.0, 52.0, 58.0, 81.0, 73.0, 63.0, 57.0, 49.0, 60.0, 35.0, 36.0, 32.0, 20.0, 13.0, 13.0, 13.0, 5.0, 7.0, 7.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.562732696533203, -6.392062664031982, -6.221392631530762, -6.050722599029541, -5.88005256652832, -5.7093825340271, -5.538712501525879, -5.368042469024658, -5.1973724365234375, -5.026702404022217, -4.856032371520996, -4.685362339019775, -4.514692306518555, -4.344022274017334, -4.173352241516113, -4.002682209014893, -3.8320119380950928, -3.661341905593872, -3.4906718730926514, -3.3200018405914307, -3.14933180809021, -2.9786617755889893, -2.8079915046691895, -2.6373214721679688, -2.466651439666748, -2.2959814071655273, -2.1253113746643066, -1.954641342163086, -1.7839713096618652, -1.6133012771606445, -1.4426311254501343, -1.2719610929489136, -1.1012911796569824, -0.9306211471557617, -0.759951114654541, -0.5892810225486755, -0.41861099004745483, -0.24794095754623413, -0.07727086544036865, 0.09339916706085205, 0.26406919956207275, 0.43473923206329346, 0.6054092645645142, 0.7760793566703796, 0.9467493891716003, 1.1174194812774658, 1.2880895137786865, 1.4587595462799072, 1.629429578781128, 1.8000996112823486, 1.9707696437835693, 2.14143967628479, 2.3121097087860107, 2.4827797412872314, 2.6534500122070312, 2.824120044708252, 2.9947900772094727, 3.1654601097106934, 3.336130142211914, 3.5068001747131348, 3.6774702072143555, 3.848140239715576, 4.018810272216797, 4.189480304718018, 4.360150337219238]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 1.0, 4.0, 10.0, 17.0, 22.0, 33.0, 61.0, 83.0, 186.0, 370.0, 824.0, 2025.0, 7453.0, 54314.0, 777361.0, 183783.0, 16271.0, 3467.0, 1151.0, 590.0, 212.0, 123.0, 80.0, 45.0, 20.0, 17.0, 12.0, 5.0, 5.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.98828125, -1.927520751953125, -1.86676025390625, -1.805999755859375, -1.7452392578125, -1.684478759765625, -1.62371826171875, -1.562957763671875, -1.502197265625, -1.441436767578125, -1.38067626953125, -1.319915771484375, -1.2591552734375, -1.198394775390625, -1.13763427734375, -1.076873779296875, -1.01611328125, -0.955352783203125, -0.89459228515625, -0.833831787109375, -0.7730712890625, -0.712310791015625, -0.65155029296875, -0.590789794921875, -0.530029296875, -0.469268798828125, -0.40850830078125, -0.347747802734375, -0.2869873046875, -0.226226806640625, -0.16546630859375, -0.104705810546875, -0.0439453125, 0.016815185546875, 0.07757568359375, 0.138336181640625, 0.1990966796875, 0.259857177734375, 0.32061767578125, 0.381378173828125, 0.442138671875, 0.502899169921875, 0.56365966796875, 0.624420166015625, 0.6851806640625, 0.745941162109375, 0.80670166015625, 0.867462158203125, 0.92822265625, 0.988983154296875, 1.04974365234375, 1.110504150390625, 1.1712646484375, 1.232025146484375, 1.29278564453125, 1.353546142578125, 1.414306640625, 1.475067138671875, 1.53582763671875, 1.596588134765625, 1.6573486328125, 1.718109130859375, 1.77886962890625, 1.839630126953125, 1.900390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 17.0, 14.0, 19.0, 24.0, 40.0, 57.0, 50.0, 72.0, 79.0, 84.0, 97.0, 110.0, 79.0, 68.0, 52.0, 46.0, 30.0, 20.0, 25.0, 8.0, 6.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.3275146484375, -5.162841796875, -4.9981689453125, -4.83349609375, -4.6688232421875, -4.504150390625, -4.3394775390625, -4.1748046875, -4.0101318359375, -3.845458984375, -3.6807861328125, -3.51611328125, -3.3514404296875, -3.186767578125, -3.0220947265625, -2.857421875, -2.6927490234375, -2.528076171875, -2.3634033203125, -2.19873046875, -2.0340576171875, -1.869384765625, -1.7047119140625, -1.5400390625, -1.3753662109375, -1.210693359375, -1.0460205078125, -0.88134765625, -0.7166748046875, -0.552001953125, -0.3873291015625, -0.22265625, -0.0579833984375, 0.106689453125, 0.2713623046875, 0.43603515625, 0.6007080078125, 0.765380859375, 0.9300537109375, 1.0947265625, 1.2593994140625, 1.424072265625, 1.5887451171875, 1.75341796875, 1.9180908203125, 2.082763671875, 2.2474365234375, 2.412109375, 2.5767822265625, 2.741455078125, 2.9061279296875, 3.07080078125, 3.2354736328125, 3.400146484375, 3.5648193359375, 3.7294921875, 3.8941650390625, 4.058837890625, 4.2235107421875, 4.38818359375, 4.5528564453125, 4.717529296875, 4.8822021484375, 5.046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 10.0, 6.0, 7.0, 9.0, 12.0, 26.0, 22.0, 35.0, 66.0, 59.0, 110.0, 175.0, 249.0, 447.0, 763.0, 1259.0, 2413.0, 4613.0, 9687.0, 21116.0, 48223.0, 127526.0, 393252.0, 281518.0, 88161.0, 36216.0, 16221.0, 7728.0, 3795.0, 1980.0, 1103.0, 634.0, 390.0, 228.0, 149.0, 112.0, 68.0, 42.0, 41.0, 25.0, 12.0, 12.0, 8.0, 13.0, 5.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.53662109375, -0.5197601318359375, -0.502899169921875, -0.4860382080078125, -0.46917724609375, -0.4523162841796875, -0.435455322265625, -0.4185943603515625, -0.4017333984375, -0.3848724365234375, -0.368011474609375, -0.3511505126953125, -0.33428955078125, -0.3174285888671875, -0.300567626953125, -0.2837066650390625, -0.266845703125, -0.2499847412109375, -0.233123779296875, -0.2162628173828125, -0.19940185546875, -0.1825408935546875, -0.165679931640625, -0.1488189697265625, -0.1319580078125, -0.1150970458984375, -0.098236083984375, -0.0813751220703125, -0.06451416015625, -0.0476531982421875, -0.030792236328125, -0.0139312744140625, 0.0029296875, 0.0197906494140625, 0.036651611328125, 0.0535125732421875, 0.07037353515625, 0.0872344970703125, 0.104095458984375, 0.1209564208984375, 0.1378173828125, 0.1546783447265625, 0.171539306640625, 0.1884002685546875, 0.20526123046875, 0.2221221923828125, 0.238983154296875, 0.2558441162109375, 0.272705078125, 0.2895660400390625, 0.306427001953125, 0.3232879638671875, 0.34014892578125, 0.3570098876953125, 0.373870849609375, 0.3907318115234375, 0.4075927734375, 0.4244537353515625, 0.441314697265625, 0.4581756591796875, 0.47503662109375, 0.4918975830078125, 0.508758544921875, 0.5256195068359375, 0.54248046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 9.0, 5.0, 4.0, 10.0, 5.0, 14.0, 5.0, 15.0, 19.0, 21.0, 18.0, 30.0, 34.0, 21.0, 39.0, 34.0, 34.0, 31.0, 44.0, 37.0, 35.0, 41.0, 44.0, 51.0, 37.0, 32.0, 37.0, 38.0, 26.0, 24.0, 19.0, 28.0, 22.0, 22.0, 18.0, 12.0, 14.0, 15.0, 13.0, 10.0, 5.0, 6.0, 6.0, 5.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.01171875, -4.847412109375, -4.68310546875, -4.518798828125, -4.3544921875, -4.190185546875, -4.02587890625, -3.861572265625, -3.697265625, -3.532958984375, -3.36865234375, -3.204345703125, -3.0400390625, -2.875732421875, -2.71142578125, -2.547119140625, -2.3828125, -2.218505859375, -2.05419921875, -1.889892578125, -1.7255859375, -1.561279296875, -1.39697265625, -1.232666015625, -1.068359375, -0.904052734375, -0.73974609375, -0.575439453125, -0.4111328125, -0.246826171875, -0.08251953125, 0.081787109375, 0.24609375, 0.410400390625, 0.57470703125, 0.739013671875, 0.9033203125, 1.067626953125, 1.23193359375, 1.396240234375, 1.560546875, 1.724853515625, 1.88916015625, 2.053466796875, 2.2177734375, 2.382080078125, 2.54638671875, 2.710693359375, 2.875, 3.039306640625, 3.20361328125, 3.367919921875, 3.5322265625, 3.696533203125, 3.86083984375, 4.025146484375, 4.189453125, 4.353759765625, 4.51806640625, 4.682373046875, 4.8466796875, 5.010986328125, 5.17529296875, 5.339599609375, 5.50390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 8.0, 5.0, 15.0, 23.0, 22.0, 36.0, 66.0, 78.0, 151.0, 279.0, 602.0, 1246.0, 2766.0, 6255.0, 16830.0, 64324.0, 425456.0, 435184.0, 66143.0, 17400.0, 6295.0, 2765.0, 1269.0, 594.0, 294.0, 166.0, 76.0, 61.0, 33.0, 29.0, 26.0, 17.0, 11.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.1394519805908203, -0.13522720336914062, -0.13100242614746094, -0.12677764892578125, -0.12255287170410156, -0.11832809448242188, -0.11410331726074219, -0.1098785400390625, -0.10565376281738281, -0.10142898559570312, -0.09720420837402344, -0.09297943115234375, -0.08875465393066406, -0.08452987670898438, -0.08030509948730469, -0.076080322265625, -0.07185554504394531, -0.06763076782226562, -0.06340599060058594, -0.05918121337890625, -0.05495643615722656, -0.050731658935546875, -0.04650688171386719, -0.0422821044921875, -0.03805732727050781, -0.033832550048828125, -0.029607772827148438, -0.02538299560546875, -0.021158218383789062, -0.016933441162109375, -0.012708663940429688, -0.00848388671875, -0.0042591094970703125, -3.4332275390625e-05, 0.0041904449462890625, 0.00841522216796875, 0.012639999389648438, 0.016864776611328125, 0.021089553833007812, 0.0253143310546875, 0.029539108276367188, 0.033763885498046875, 0.03798866271972656, 0.04221343994140625, 0.04643821716308594, 0.050662994384765625, 0.05488777160644531, 0.059112548828125, 0.06333732604980469, 0.06756210327148438, 0.07178688049316406, 0.07601165771484375, 0.08023643493652344, 0.08446121215820312, 0.08868598937988281, 0.0929107666015625, 0.09713554382324219, 0.10136032104492188, 0.10558509826660156, 0.10980987548828125, 0.11403465270996094, 0.11825942993164062, 0.12248420715332031, 0.126708984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 14.0, 16.0, 31.0, 43.0, 67.0, 73.0, 105.0, 123.0, 119.0, 103.0, 77.0, 58.0, 46.0, 32.0, 29.0, 12.0, 12.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00010287761688232422, -0.00010043848305940628, -9.799934923648834e-05, -9.55602154135704e-05, -9.312108159065247e-05, -9.068194776773453e-05, -8.824281394481659e-05, -8.580368012189865e-05, -8.336454629898071e-05, -8.092541247606277e-05, -7.848627865314484e-05, -7.60471448302269e-05, -7.360801100730896e-05, -7.116887718439102e-05, -6.872974336147308e-05, -6.629060953855515e-05, -6.385147571563721e-05, -6.141234189271927e-05, -5.897320806980133e-05, -5.653407424688339e-05, -5.4094940423965454e-05, -5.1655806601047516e-05, -4.921667277812958e-05, -4.677753895521164e-05, -4.43384051322937e-05, -4.189927130937576e-05, -3.9460137486457825e-05, -3.7021003663539886e-05, -3.458186984062195e-05, -3.214273601770401e-05, -2.9703602194786072e-05, -2.7264468371868134e-05, -2.4825334548950195e-05, -2.2386200726032257e-05, -1.994706690311432e-05, -1.750793308019638e-05, -1.5068799257278442e-05, -1.2629665434360504e-05, -1.0190531611442566e-05, -7.751397788524628e-06, -5.3122639656066895e-06, -2.8731301426887512e-06, -4.33996319770813e-07, 2.0051375031471252e-06, 4.4442713260650635e-06, 6.883405148983002e-06, 9.32253897190094e-06, 1.1761672794818878e-05, 1.4200806617736816e-05, 1.6639940440654755e-05, 1.9079074263572693e-05, 2.151820808649063e-05, 2.395734190940857e-05, 2.6396475732326508e-05, 2.8835609555244446e-05, 3.1274743378162384e-05, 3.371387720108032e-05, 3.615301102399826e-05, 3.85921448469162e-05, 4.103127866983414e-05, 4.3470412492752075e-05, 4.5909546315670013e-05, 4.834868013858795e-05, 5.078781396150589e-05, 5.322694778442383e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 3.0, 3.0, 5.0, 13.0, 12.0, 14.0, 13.0, 19.0, 23.0, 31.0, 48.0, 53.0, 88.0, 166.0, 267.0, 609.0, 1574.0, 4989.0, 19483.0, 131224.0, 727959.0, 134202.0, 19552.0, 5245.0, 1546.0, 658.0, 294.0, 142.0, 89.0, 63.0, 46.0, 23.0, 23.0, 20.0, 14.0, 10.0, 9.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1690673828125, -0.1641674041748047, -0.15926742553710938, -0.15436744689941406, -0.14946746826171875, -0.14456748962402344, -0.13966751098632812, -0.1347675323486328, -0.1298675537109375, -0.12496757507324219, -0.12006759643554688, -0.11516761779785156, -0.11026763916015625, -0.10536766052246094, -0.10046768188476562, -0.09556770324707031, -0.090667724609375, -0.08576774597167969, -0.08086776733398438, -0.07596778869628906, -0.07106781005859375, -0.06616783142089844, -0.061267852783203125, -0.05636787414550781, -0.0514678955078125, -0.04656791687011719, -0.041667938232421875, -0.03676795959472656, -0.03186798095703125, -0.026968002319335938, -0.022068023681640625, -0.017168045043945312, -0.01226806640625, -0.0073680877685546875, -0.002468109130859375, 0.0024318695068359375, 0.00733184814453125, 0.012231826782226562, 0.017131805419921875, 0.022031784057617188, 0.0269317626953125, 0.03183174133300781, 0.036731719970703125, 0.04163169860839844, 0.04653167724609375, 0.05143165588378906, 0.056331634521484375, 0.06123161315917969, 0.066131591796875, 0.07103157043457031, 0.07593154907226562, 0.08083152770996094, 0.08573150634765625, 0.09063148498535156, 0.09553146362304688, 0.10043144226074219, 0.1053314208984375, 0.11023139953613281, 0.11513137817382812, 0.12003135681152344, 0.12493133544921875, 0.12983131408691406, 0.13473129272460938, 0.1396312713623047, 0.14453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 2.0, 4.0, 4.0, 7.0, 10.0, 14.0, 17.0, 19.0, 18.0, 31.0, 36.0, 61.0, 95.0, 110.0, 93.0, 114.0, 84.0, 83.0, 44.0, 26.0, 27.0, 19.0, 16.0, 15.0, 8.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0428466796875, -0.041527748107910156, -0.04020881652832031, -0.03888988494873047, -0.037570953369140625, -0.03625202178955078, -0.03493309020996094, -0.033614158630371094, -0.03229522705078125, -0.030976295471191406, -0.029657363891601562, -0.02833843231201172, -0.027019500732421875, -0.02570056915283203, -0.024381637573242188, -0.023062705993652344, -0.0217437744140625, -0.020424842834472656, -0.019105911254882812, -0.01778697967529297, -0.016468048095703125, -0.015149116516113281, -0.013830184936523438, -0.012511253356933594, -0.01119232177734375, -0.009873390197753906, -0.008554458618164062, -0.007235527038574219, -0.005916595458984375, -0.004597663879394531, -0.0032787322998046875, -0.0019598007202148438, -0.000640869140625, 0.0006780624389648438, 0.0019969940185546875, 0.0033159255981445312, 0.004634857177734375, 0.005953788757324219, 0.0072727203369140625, 0.008591651916503906, 0.00991058349609375, 0.011229515075683594, 0.012548446655273438, 0.013867378234863281, 0.015186309814453125, 0.01650524139404297, 0.017824172973632812, 0.019143104553222656, 0.0204620361328125, 0.021780967712402344, 0.023099899291992188, 0.02441883087158203, 0.025737762451171875, 0.02705669403076172, 0.028375625610351562, 0.029694557189941406, 0.03101348876953125, 0.032332420349121094, 0.03365135192871094, 0.03497028350830078, 0.036289215087890625, 0.03760814666748047, 0.03892707824707031, 0.040246009826660156, 0.04156494140625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 18.0, 122.0, 362.0, 354.0, 123.0, 25.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.70638656616211, -26.211946487426758, -25.717506408691406, -25.223066329956055, -24.728626251220703, -24.234188079833984, -23.739748001098633, -23.24530792236328, -22.75086784362793, -22.256427764892578, -21.761987686157227, -21.267547607421875, -20.773107528686523, -20.278667449951172, -19.784229278564453, -19.2897891998291, -18.79534912109375, -18.3009090423584, -17.806468963623047, -17.312028884887695, -16.817588806152344, -16.323150634765625, -15.828709602355957, -15.334270477294922, -14.839829444885254, -14.345389366149902, -13.85094928741455, -13.356510162353516, -12.862070083618164, -12.367630004882812, -11.873189926147461, -11.37874984741211, -10.884309768676758, -10.389869689941406, -9.895429611206055, -9.40099048614502, -8.906550407409668, -8.412110328674316, -7.917670249938965, -7.4232306480407715, -6.928791046142578, -6.434350967407227, -5.939911365509033, -5.445471286773682, -4.951031684875488, -4.456591606140137, -3.9621517658233643, -3.467711925506592, -2.9732723236083984, -2.478832483291626, -1.9843926429748535, -1.4899526834487915, -0.995512843132019, -0.501072883605957, -0.00663304328918457, 0.4878067970275879, 0.9822466373443604, 1.4766864776611328, 1.9711263179779053, 2.4655661582946777, 2.9600062370300293, 3.4544460773468018, 3.948885917663574, 4.443325996398926, 4.937765598297119]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 8.0, 14.0, 14.0, 12.0, 27.0, 39.0, 52.0, 53.0, 65.0, 72.0, 71.0, 113.0, 87.0, 74.0, 68.0, 73.0, 40.0, 46.0, 20.0, 20.0, 16.0, 10.0, 5.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.346550941467285, -5.192205429077148, -5.037859916687012, -4.883513927459717, -4.72916841506958, -4.574822902679443, -4.420477390289307, -4.26613187789917, -4.111785888671875, -3.9574403762817383, -3.8030946254730225, -3.6487491130828857, -3.49440336227417, -3.340057849884033, -3.1857123374938965, -3.0313668251037598, -2.877021312713623, -2.7226758003234863, -2.5683300495147705, -2.413984537124634, -2.259638786315918, -2.1052932739257812, -1.9509477615356445, -1.7966021299362183, -1.642256498336792, -1.4879108667373657, -1.3335652351379395, -1.1792197227478027, -1.0248740911483765, -0.8705284595489502, -0.7161828875541687, -0.5618373155593872, -0.40749168395996094, -0.25314608216285706, -0.09880048036575317, 0.05554512143135071, 0.2098907232284546, 0.36423635482788086, 0.5185819268226624, 0.6729274988174438, 0.8272731304168701, 0.9816187620162964, 1.1359643936157227, 1.2903099060058594, 1.4446555376052856, 1.599001169204712, 1.7533466815948486, 1.907692313194275, 2.062037944793701, 2.216383457183838, 2.3707292079925537, 2.5250747203826904, 2.6794204711914062, 2.833765983581543, 2.9881114959716797, 3.1424570083618164, 3.2968027591705322, 3.451148271560669, 3.6054940223693848, 3.7598395347595215, 3.914185047149658, 4.068531036376953, 4.22287654876709, 4.377222061157227, 4.531567573547363]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 9.0, 8.0, 8.0, 33.0, 49.0, 57.0, 134.0, 240.0, 471.0, 1102.0, 4494.0, 38700.0, 525163.0, 438420.0, 33603.0, 4051.0, 1047.0, 458.0, 231.0, 114.0, 63.0, 39.0, 31.0, 4.0, 11.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.51116943359375, -6.3074951171875, -6.10382080078125, -5.900146484375, -5.69647216796875, -5.4927978515625, -5.28912353515625, -5.08544921875, -4.88177490234375, -4.6781005859375, -4.47442626953125, -4.270751953125, -4.06707763671875, -3.8634033203125, -3.65972900390625, -3.4560546875, -3.25238037109375, -3.0487060546875, -2.84503173828125, -2.641357421875, -2.43768310546875, -2.2340087890625, -2.03033447265625, -1.82666015625, -1.62298583984375, -1.4193115234375, -1.21563720703125, -1.011962890625, -0.80828857421875, -0.6046142578125, -0.40093994140625, -0.197265625, 0.00640869140625, 0.2100830078125, 0.41375732421875, 0.617431640625, 0.82110595703125, 1.0247802734375, 1.22845458984375, 1.43212890625, 1.63580322265625, 1.8394775390625, 2.04315185546875, 2.246826171875, 2.45050048828125, 2.6541748046875, 2.85784912109375, 3.0615234375, 3.26519775390625, 3.4688720703125, 3.67254638671875, 3.876220703125, 4.07989501953125, 4.2835693359375, 4.48724365234375, 4.69091796875, 4.89459228515625, 5.0982666015625, 5.30194091796875, 5.505615234375, 5.70928955078125, 5.9129638671875, 6.11663818359375, 6.3203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 12.0, 12.0, 12.0, 25.0, 38.0, 45.0, 51.0, 64.0, 57.0, 79.0, 89.0, 82.0, 81.0, 74.0, 70.0, 39.0, 41.0, 34.0, 22.0, 21.0, 15.0, 14.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -7.9776611328125, -7.728759765625, -7.4798583984375, -7.23095703125, -6.9820556640625, -6.733154296875, -6.4842529296875, -6.2353515625, -5.9864501953125, -5.737548828125, -5.4886474609375, -5.23974609375, -4.9908447265625, -4.741943359375, -4.4930419921875, -4.244140625, -3.9952392578125, -3.746337890625, -3.4974365234375, -3.24853515625, -2.9996337890625, -2.750732421875, -2.5018310546875, -2.2529296875, -2.0040283203125, -1.755126953125, -1.5062255859375, -1.25732421875, -1.0084228515625, -0.759521484375, -0.5106201171875, -0.26171875, -0.0128173828125, 0.236083984375, 0.4849853515625, 0.73388671875, 0.9827880859375, 1.231689453125, 1.4805908203125, 1.7294921875, 1.9783935546875, 2.227294921875, 2.4761962890625, 2.72509765625, 2.9739990234375, 3.222900390625, 3.4718017578125, 3.720703125, 3.9696044921875, 4.218505859375, 4.4674072265625, 4.71630859375, 4.9652099609375, 5.214111328125, 5.4630126953125, 5.7119140625, 5.9608154296875, 6.209716796875, 6.4586181640625, 6.70751953125, 6.9564208984375, 7.205322265625, 7.4542236328125, 7.703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 11.0, 9.0, 13.0, 22.0, 41.0, 36.0, 55.0, 94.0, 108.0, 194.0, 349.0, 837.0, 4365.0, 364530.0, 669954.0, 6003.0, 937.0, 377.0, 183.0, 147.0, 90.0, 52.0, 46.0, 22.0, 17.0, 16.0, 8.0, 8.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.9921875, -10.5859375, -10.1796875, -9.7734375, -9.3671875, -8.9609375, -8.5546875, -8.1484375, -7.7421875, -7.3359375, -6.9296875, -6.5234375, -6.1171875, -5.7109375, -5.3046875, -4.8984375, -4.4921875, -4.0859375, -3.6796875, -3.2734375, -2.8671875, -2.4609375, -2.0546875, -1.6484375, -1.2421875, -0.8359375, -0.4296875, -0.0234375, 0.3828125, 0.7890625, 1.1953125, 1.6015625, 2.0078125, 2.4140625, 2.8203125, 3.2265625, 3.6328125, 4.0390625, 4.4453125, 4.8515625, 5.2578125, 5.6640625, 6.0703125, 6.4765625, 6.8828125, 7.2890625, 7.6953125, 8.1015625, 8.5078125, 8.9140625, 9.3203125, 9.7265625, 10.1328125, 10.5390625, 10.9453125, 11.3515625, 11.7578125, 12.1640625, 12.5703125, 12.9765625, 13.3828125, 13.7890625, 14.1953125, 14.6015625, 15.0078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 9.0, 17.0, 9.0, 21.0, 19.0, 24.0, 41.0, 45.0, 51.0, 57.0, 77.0, 73.0, 72.0, 71.0, 63.0, 61.0, 59.0, 57.0, 30.0, 29.0, 28.0, 19.0, 14.0, 14.0, 7.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.640625, -9.3577880859375, -9.074951171875, -8.7921142578125, -8.50927734375, -8.2264404296875, -7.943603515625, -7.6607666015625, -7.3779296875, -7.0950927734375, -6.812255859375, -6.5294189453125, -6.24658203125, -5.9637451171875, -5.680908203125, -5.3980712890625, -5.115234375, -4.8323974609375, -4.549560546875, -4.2667236328125, -3.98388671875, -3.7010498046875, -3.418212890625, -3.1353759765625, -2.8525390625, -2.5697021484375, -2.286865234375, -2.0040283203125, -1.72119140625, -1.4383544921875, -1.155517578125, -0.8726806640625, -0.58984375, -0.3070068359375, -0.024169921875, 0.2586669921875, 0.54150390625, 0.8243408203125, 1.107177734375, 1.3900146484375, 1.6728515625, 1.9556884765625, 2.238525390625, 2.5213623046875, 2.80419921875, 3.0870361328125, 3.369873046875, 3.6527099609375, 3.935546875, 4.2183837890625, 4.501220703125, 4.7840576171875, 5.06689453125, 5.3497314453125, 5.632568359375, 5.9154052734375, 6.1982421875, 6.4810791015625, 6.763916015625, 7.0467529296875, 7.32958984375, 7.6124267578125, 7.895263671875, 8.1781005859375, 8.4609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 6.0, 20.0, 18.0, 30.0, 55.0, 74.0, 162.0, 417.0, 1758.0, 31096.0, 969524.0, 42583.0, 2007.0, 409.0, 154.0, 85.0, 42.0, 25.0, 19.0, 18.0, 10.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.875, -2.7578125, -2.640625, -2.5234375, -2.40625, -2.2890625, -2.171875, -2.0546875, -1.9375, -1.8203125, -1.703125, -1.5859375, -1.46875, -1.3515625, -1.234375, -1.1171875, -1.0, -0.8828125, -0.765625, -0.6484375, -0.53125, -0.4140625, -0.296875, -0.1796875, -0.0625, 0.0546875, 0.171875, 0.2890625, 0.40625, 0.5234375, 0.640625, 0.7578125, 0.875, 0.9921875, 1.109375, 1.2265625, 1.34375, 1.4609375, 1.578125, 1.6953125, 1.8125, 1.9296875, 2.046875, 2.1640625, 2.28125, 2.3984375, 2.515625, 2.6328125, 2.75, 2.8671875, 2.984375, 3.1015625, 3.21875, 3.3359375, 3.453125, 3.5703125, 3.6875, 3.8046875, 3.921875, 4.0390625, 4.15625, 4.2734375, 4.390625, 4.5078125, 4.625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 5.0, 15.0, 30.0, 16.0, 20.0, 26.0, 28.0, 45.0, 44.0, 57.0, 108.0, 121.0, 113.0, 102.0, 70.0, 32.0, 26.0, 32.0, 23.0, 14.0, 13.0, 7.0, 8.0, 8.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002263784408569336, -0.0002200007438659668, -0.000213623046875, -0.0002072453498840332, -0.0002008676528930664, -0.0001944899559020996, -0.0001881122589111328, -0.00018173456192016602, -0.00017535686492919922, -0.00016897916793823242, -0.00016260147094726562, -0.00015622377395629883, -0.00014984607696533203, -0.00014346837997436523, -0.00013709068298339844, -0.00013071298599243164, -0.00012433528900146484, -0.00011795759201049805, -0.00011157989501953125, -0.00010520219802856445, -9.882450103759766e-05, -9.244680404663086e-05, -8.606910705566406e-05, -7.969141006469727e-05, -7.331371307373047e-05, -6.693601608276367e-05, -6.0558319091796875e-05, -5.418062210083008e-05, -4.780292510986328e-05, -4.1425228118896484e-05, -3.504753112792969e-05, -2.866983413696289e-05, -2.2292137145996094e-05, -1.5914440155029297e-05, -9.5367431640625e-06, -3.159046173095703e-06, 3.2186508178710938e-06, 9.59634780883789e-06, 1.5974044799804688e-05, 2.2351741790771484e-05, 2.872943878173828e-05, 3.510713577270508e-05, 4.1484832763671875e-05, 4.786252975463867e-05, 5.424022674560547e-05, 6.0617923736572266e-05, 6.699562072753906e-05, 7.337331771850586e-05, 7.975101470947266e-05, 8.612871170043945e-05, 9.250640869140625e-05, 9.888410568237305e-05, 0.00010526180267333984, 0.00011163949966430664, 0.00011801719665527344, 0.00012439489364624023, 0.00013077259063720703, 0.00013715028762817383, 0.00014352798461914062, 0.00014990568161010742, 0.00015628337860107422, 0.00016266107559204102, 0.0001690387725830078, 0.0001754164695739746, 0.0001817941665649414]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 11.0, 9.0, 22.0, 36.0, 61.0, 195.0, 624.0, 3214.0, 184997.0, 852505.0, 5520.0, 916.0, 260.0, 88.0, 44.0, 19.0, 7.0, 13.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.140380859375, -5.96044921875, -5.780517578125, -5.6005859375, -5.420654296875, -5.24072265625, -5.060791015625, -4.880859375, -4.700927734375, -4.52099609375, -4.341064453125, -4.1611328125, -3.981201171875, -3.80126953125, -3.621337890625, -3.44140625, -3.261474609375, -3.08154296875, -2.901611328125, -2.7216796875, -2.541748046875, -2.36181640625, -2.181884765625, -2.001953125, -1.822021484375, -1.64208984375, -1.462158203125, -1.2822265625, -1.102294921875, -0.92236328125, -0.742431640625, -0.5625, -0.382568359375, -0.20263671875, -0.022705078125, 0.1572265625, 0.337158203125, 0.51708984375, 0.697021484375, 0.876953125, 1.056884765625, 1.23681640625, 1.416748046875, 1.5966796875, 1.776611328125, 1.95654296875, 2.136474609375, 2.31640625, 2.496337890625, 2.67626953125, 2.856201171875, 3.0361328125, 3.216064453125, 3.39599609375, 3.575927734375, 3.755859375, 3.935791015625, 4.11572265625, 4.295654296875, 4.4755859375, 4.655517578125, 4.83544921875, 5.015380859375, 5.1953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 4.0, 13.0, 24.0, 20.0, 58.0, 129.0, 332.0, 216.0, 101.0, 46.0, 19.0, 15.0, 7.0, 4.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.80078125, -1.738189697265625, -1.67559814453125, -1.613006591796875, -1.5504150390625, -1.487823486328125, -1.42523193359375, -1.362640380859375, -1.300048828125, -1.237457275390625, -1.17486572265625, -1.112274169921875, -1.0496826171875, -0.987091064453125, -0.92449951171875, -0.861907958984375, -0.79931640625, -0.736724853515625, -0.67413330078125, -0.611541748046875, -0.5489501953125, -0.486358642578125, -0.42376708984375, -0.361175537109375, -0.298583984375, -0.235992431640625, -0.17340087890625, -0.110809326171875, -0.0482177734375, 0.014373779296875, 0.07696533203125, 0.139556884765625, 0.2021484375, 0.264739990234375, 0.32733154296875, 0.389923095703125, 0.4525146484375, 0.515106201171875, 0.57769775390625, 0.640289306640625, 0.702880859375, 0.765472412109375, 0.82806396484375, 0.890655517578125, 0.9532470703125, 1.015838623046875, 1.07843017578125, 1.141021728515625, 1.20361328125, 1.266204833984375, 1.32879638671875, 1.391387939453125, 1.4539794921875, 1.516571044921875, 1.57916259765625, 1.641754150390625, 1.704345703125, 1.766937255859375, 1.82952880859375, 1.892120361328125, 1.9547119140625, 2.017303466796875, 2.07989501953125, 2.142486572265625, 2.205078125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 11.0, 146.0, 466.0, 323.0, 53.0, 11.0, 1.0, 1.0, 1.0], "bins": [-72.70043182373047, -71.43944549560547, -70.17845916748047, -68.91746520996094, -67.65647888183594, -66.39549255371094, -65.13450622558594, -63.87351608276367, -62.612525939941406, -61.351539611816406, -60.09054946899414, -58.82956314086914, -57.568572998046875, -56.307586669921875, -55.04659652709961, -53.78561019897461, -52.52462387084961, -51.26363754272461, -50.002647399902344, -48.741661071777344, -47.48067092895508, -46.21968460083008, -44.95869445800781, -43.69770812988281, -42.43672180175781, -41.17573547363281, -39.91474533081055, -38.65375900268555, -37.39276885986328, -36.13178253173828, -34.870792388916016, -33.609806060791016, -32.348812103271484, -31.08782386779785, -29.82683563232422, -28.565847396850586, -27.304859161376953, -26.043872833251953, -24.78288459777832, -23.521896362304688, -22.260908126831055, -20.999919891357422, -19.73893165588379, -18.477943420410156, -17.216957092285156, -15.955967903137207, -14.69498062133789, -13.433992385864258, -12.173004150390625, -10.912015914916992, -9.65102767944336, -8.390040397644043, -7.12905216217041, -5.868063926696777, -4.607076168060303, -3.346088409423828, -2.0851001739501953, -0.8241121768951416, 0.4368758201599121, 1.6978638172149658, 2.9588518142700195, 4.219840049743652, 5.480827808380127, 6.741815567016602, 8.002803802490234]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 2.0, 6.0, 10.0, 12.0, 13.0, 30.0, 27.0, 40.0, 40.0, 42.0, 41.0, 47.0, 66.0, 66.0, 59.0, 63.0, 68.0, 49.0, 51.0, 53.0, 47.0, 28.0, 36.0, 22.0, 25.0, 18.0, 24.0, 11.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.782975196838379, -13.345107078552246, -12.907238960266113, -12.46937084197998, -12.031502723693848, -11.593634605407715, -11.155766487121582, -10.71789836883545, -10.280030250549316, -9.842162132263184, -9.40429401397705, -8.966425895690918, -8.528557777404785, -8.090689659118652, -7.6528215408325195, -7.214953422546387, -6.777085304260254, -6.339217185974121, -5.901349067687988, -5.4634809494018555, -5.025612831115723, -4.58774471282959, -4.149876594543457, -3.712008476257324, -3.2741403579711914, -2.8362722396850586, -2.398404121398926, -1.960536003112793, -1.5226678848266602, -1.0847997665405273, -0.6469316482543945, -0.20906352996826172, 0.2288055419921875, 0.6666736602783203, 1.1045417785644531, 1.542409896850586, 1.9802780151367188, 2.4181461334228516, 2.8560142517089844, 3.293882369995117, 3.73175048828125, 4.169618606567383, 4.607486724853516, 5.045354843139648, 5.483222961425781, 5.921091079711914, 6.358959197998047, 6.79682731628418, 7.2346954345703125, 7.672563552856445, 8.110431671142578, 8.548299789428711, 8.986167907714844, 9.424036026000977, 9.86190414428711, 10.299772262573242, 10.737640380859375, 11.175508499145508, 11.61337661743164, 12.051244735717773, 12.489112854003906, 12.926980972290039, 13.364849090576172, 13.802717208862305, 14.240585327148438]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 5.0, 14.0, 20.0, 17.0, 21.0, 47.0, 58.0, 64.0, 114.0, 160.0, 239.0, 570.0, 2006.0, 16876.0, 1078182.0, 3034658.0, 56535.0, 3127.0, 659.0, 308.0, 200.0, 113.0, 72.0, 69.0, 35.0, 30.0, 24.0, 23.0, 5.0, 11.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.0, -11.7012939453125, -11.402587890625, -11.1038818359375, -10.80517578125, -10.5064697265625, -10.207763671875, -9.9090576171875, -9.6103515625, -9.3116455078125, -9.012939453125, -8.7142333984375, -8.41552734375, -8.1168212890625, -7.818115234375, -7.5194091796875, -7.220703125, -6.9219970703125, -6.623291015625, -6.3245849609375, -6.02587890625, -5.7271728515625, -5.428466796875, -5.1297607421875, -4.8310546875, -4.5323486328125, -4.233642578125, -3.9349365234375, -3.63623046875, -3.3375244140625, -3.038818359375, -2.7401123046875, -2.44140625, -2.1427001953125, -1.843994140625, -1.5452880859375, -1.24658203125, -0.9478759765625, -0.649169921875, -0.3504638671875, -0.0517578125, 0.2469482421875, 0.545654296875, 0.8443603515625, 1.14306640625, 1.4417724609375, 1.740478515625, 2.0391845703125, 2.337890625, 2.6365966796875, 2.935302734375, 3.2340087890625, 3.53271484375, 3.8314208984375, 4.130126953125, 4.4288330078125, 4.7275390625, 5.0262451171875, 5.324951171875, 5.6236572265625, 5.92236328125, 6.2210693359375, 6.519775390625, 6.8184814453125, 7.1171875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 1.0, 8.0, 5.0, 12.0, 18.0, 20.0, 30.0, 34.0, 41.0, 55.0, 63.0, 67.0, 60.0, 76.0, 70.0, 66.0, 65.0, 78.0, 42.0, 44.0, 43.0, 30.0, 30.0, 13.0, 11.0, 5.0, 4.0, 10.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.962890625, -4.80859375, -4.654296875, -4.5, -4.345703125, -4.19140625, -4.037109375, -3.8828125, -3.728515625, -3.57421875, -3.419921875, -3.265625, -3.111328125, -2.95703125, -2.802734375, -2.6484375, -2.494140625, -2.33984375, -2.185546875, -2.03125, -1.876953125, -1.72265625, -1.568359375, -1.4140625, -1.259765625, -1.10546875, -0.951171875, -0.796875, -0.642578125, -0.48828125, -0.333984375, -0.1796875, -0.025390625, 0.12890625, 0.283203125, 0.4375, 0.591796875, 0.74609375, 0.900390625, 1.0546875, 1.208984375, 1.36328125, 1.517578125, 1.671875, 1.826171875, 1.98046875, 2.134765625, 2.2890625, 2.443359375, 2.59765625, 2.751953125, 2.90625, 3.060546875, 3.21484375, 3.369140625, 3.5234375, 3.677734375, 3.83203125, 3.986328125, 4.140625, 4.294921875, 4.44921875, 4.603515625, 4.7578125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 15.0, 25.0, 45.0, 129.0, 597.0, 8644.0, 4163997.0, 19697.0, 795.0, 142.0, 73.0, 28.0, 27.0, 15.0, 12.0, 9.0, 7.0, 5.0, 2.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.296875, -23.446533203125, -22.59619140625, -21.745849609375, -20.8955078125, -20.045166015625, -19.19482421875, -18.344482421875, -17.494140625, -16.643798828125, -15.79345703125, -14.943115234375, -14.0927734375, -13.242431640625, -12.39208984375, -11.541748046875, -10.69140625, -9.841064453125, -8.99072265625, -8.140380859375, -7.2900390625, -6.439697265625, -5.58935546875, -4.739013671875, -3.888671875, -3.038330078125, -2.18798828125, -1.337646484375, -0.4873046875, 0.363037109375, 1.21337890625, 2.063720703125, 2.9140625, 3.764404296875, 4.61474609375, 5.465087890625, 6.3154296875, 7.165771484375, 8.01611328125, 8.866455078125, 9.716796875, 10.567138671875, 11.41748046875, 12.267822265625, 13.1181640625, 13.968505859375, 14.81884765625, 15.669189453125, 16.51953125, 17.369873046875, 18.22021484375, 19.070556640625, 19.9208984375, 20.771240234375, 21.62158203125, 22.471923828125, 23.322265625, 24.172607421875, 25.02294921875, 25.873291015625, 26.7236328125, 27.573974609375, 28.42431640625, 29.274658203125, 30.125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 6.0, 9.0, 8.0, 3.0, 13.0, 21.0, 55.0, 114.0, 383.0, 940.0, 1335.0, 722.0, 275.0, 97.0, 50.0, 9.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.447265625, -3.329864501953125, -3.21246337890625, -3.095062255859375, -2.9776611328125, -2.860260009765625, -2.74285888671875, -2.625457763671875, -2.508056640625, -2.390655517578125, -2.27325439453125, -2.155853271484375, -2.0384521484375, -1.921051025390625, -1.80364990234375, -1.686248779296875, -1.56884765625, -1.451446533203125, -1.33404541015625, -1.216644287109375, -1.0992431640625, -0.981842041015625, -0.86444091796875, -0.747039794921875, -0.629638671875, -0.512237548828125, -0.39483642578125, -0.277435302734375, -0.1600341796875, -0.042633056640625, 0.07476806640625, 0.192169189453125, 0.3095703125, 0.426971435546875, 0.54437255859375, 0.661773681640625, 0.7791748046875, 0.896575927734375, 1.01397705078125, 1.131378173828125, 1.248779296875, 1.366180419921875, 1.48358154296875, 1.600982666015625, 1.7183837890625, 1.835784912109375, 1.95318603515625, 2.070587158203125, 2.18798828125, 2.305389404296875, 2.42279052734375, 2.540191650390625, 2.6575927734375, 2.774993896484375, 2.89239501953125, 3.009796142578125, 3.127197265625, 3.244598388671875, 3.36199951171875, 3.479400634765625, 3.5968017578125, 3.714202880859375, 3.83160400390625, 3.949005126953125, 4.06640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 13.0, 44.0, 66.0, 83.0, 120.0, 178.0, 165.0, 126.0, 85.0, 60.0, 42.0, 13.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.679505348205566, -9.389030456542969, -9.098555564880371, -8.808080673217773, -8.517605781555176, -8.227130889892578, -7.9366559982299805, -7.646181106567383, -7.355706214904785, -7.0652313232421875, -6.77475643157959, -6.484281539916992, -6.1938066482543945, -5.903331756591797, -5.612856864929199, -5.322381973266602, -5.031907081604004, -4.741432189941406, -4.450957298278809, -4.160482406616211, -3.8700075149536133, -3.5795326232910156, -3.289057731628418, -2.9985828399658203, -2.7081079483032227, -2.417633056640625, -2.1271581649780273, -1.8366832733154297, -1.546208381652832, -1.2557334899902344, -0.9652585983276367, -0.6747837066650391, -0.384307861328125, -0.09383296966552734, 0.1966419219970703, 0.48711681365966797, 0.7775917053222656, 1.0680665969848633, 1.358541488647461, 1.6490163803100586, 1.9394912719726562, 2.229966163635254, 2.5204410552978516, 2.810915946960449, 3.101390838623047, 3.3918657302856445, 3.682340621948242, 3.97281551361084, 4.2632904052734375, 4.553765296936035, 4.844240188598633, 5.1347150802612305, 5.425189971923828, 5.715664863586426, 6.006139755249023, 6.296614646911621, 6.587089538574219, 6.877564430236816, 7.168039321899414, 7.458514213562012, 7.748989105224609, 8.039463996887207, 8.329938888549805, 8.620413780212402, 8.910888671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 11.0, 12.0, 21.0, 15.0, 23.0, 17.0, 26.0, 23.0, 41.0, 41.0, 48.0, 54.0, 54.0, 63.0, 53.0, 65.0, 54.0, 46.0, 51.0, 43.0, 42.0, 31.0, 40.0, 29.0, 24.0, 22.0, 8.0, 9.0, 8.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.702385902404785, -4.561467170715332, -4.420547962188721, -4.279629230499268, -4.1387104988098145, -3.9977915287017822, -3.85687255859375, -3.715953826904297, -3.5750348567962646, -3.4341158866882324, -3.2931971549987793, -3.152278184890747, -3.011359214782715, -2.8704404830932617, -2.7295215129852295, -2.5886025428771973, -2.447683811187744, -2.306764841079712, -2.165846109390259, -2.0249271392822266, -1.8840082883834839, -1.7430894374847412, -1.602170467376709, -1.4612516164779663, -1.3203327655792236, -1.179413914680481, -1.0384950637817383, -0.897576093673706, -0.7566572427749634, -0.6157383918762207, -0.47481948137283325, -0.3339005708694458, -0.19298124313354492, -0.05206236243247986, 0.0888565182685852, 0.22977539896965027, 0.37069427967071533, 0.511613130569458, 0.6525320410728455, 0.7934509515762329, 0.9343698024749756, 1.0752886533737183, 1.216207504272461, 1.3571264743804932, 1.4980453252792358, 1.6389641761779785, 1.7798831462860107, 1.9208019971847534, 2.061720848083496, 2.2026398181915283, 2.3435585498809814, 2.4844775199890137, 2.625396251678467, 2.766315221786499, 2.9072341918945312, 3.0481529235839844, 3.1890718936920166, 3.329990863800049, 3.470909595489502, 3.611828565597534, 3.7527475357055664, 3.8936662673950195, 4.034584999084473, 4.175504207611084, 4.316422939300537]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 4.0, 13.0, 16.0, 30.0, 52.0, 91.0, 155.0, 264.0, 456.0, 916.0, 2291.0, 7550.0, 39208.0, 339631.0, 584760.0, 57431.0, 10361.0, 2968.0, 1093.0, 534.0, 308.0, 162.0, 109.0, 54.0, 32.0, 15.0, 11.0, 6.0, 5.0, 7.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2734375, -1.23114013671875, -1.1888427734375, -1.14654541015625, -1.104248046875, -1.06195068359375, -1.0196533203125, -0.97735595703125, -0.93505859375, -0.89276123046875, -0.8504638671875, -0.80816650390625, -0.765869140625, -0.72357177734375, -0.6812744140625, -0.63897705078125, -0.5966796875, -0.55438232421875, -0.5120849609375, -0.46978759765625, -0.427490234375, -0.38519287109375, -0.3428955078125, -0.30059814453125, -0.25830078125, -0.21600341796875, -0.1737060546875, -0.13140869140625, -0.089111328125, -0.04681396484375, -0.0045166015625, 0.03778076171875, 0.080078125, 0.12237548828125, 0.1646728515625, 0.20697021484375, 0.249267578125, 0.29156494140625, 0.3338623046875, 0.37615966796875, 0.41845703125, 0.46075439453125, 0.5030517578125, 0.54534912109375, 0.587646484375, 0.62994384765625, 0.6722412109375, 0.71453857421875, 0.7568359375, 0.79913330078125, 0.8414306640625, 0.88372802734375, 0.926025390625, 0.96832275390625, 1.0106201171875, 1.05291748046875, 1.09521484375, 1.13751220703125, 1.1798095703125, 1.22210693359375, 1.264404296875, 1.30670166015625, 1.3489990234375, 1.39129638671875, 1.43359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 12.0, 11.0, 31.0, 30.0, 31.0, 36.0, 53.0, 73.0, 87.0, 80.0, 86.0, 94.0, 75.0, 67.0, 54.0, 43.0, 46.0, 33.0, 23.0, 19.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.732421875, -3.606109619140625, -3.47979736328125, -3.353485107421875, -3.2271728515625, -3.100860595703125, -2.97454833984375, -2.848236083984375, -2.721923828125, -2.595611572265625, -2.46929931640625, -2.342987060546875, -2.2166748046875, -2.090362548828125, -1.96405029296875, -1.837738037109375, -1.71142578125, -1.585113525390625, -1.45880126953125, -1.332489013671875, -1.2061767578125, -1.079864501953125, -0.95355224609375, -0.827239990234375, -0.700927734375, -0.574615478515625, -0.44830322265625, -0.321990966796875, -0.1956787109375, -0.069366455078125, 0.05694580078125, 0.183258056640625, 0.3095703125, 0.435882568359375, 0.56219482421875, 0.688507080078125, 0.8148193359375, 0.941131591796875, 1.06744384765625, 1.193756103515625, 1.320068359375, 1.446380615234375, 1.57269287109375, 1.699005126953125, 1.8253173828125, 1.951629638671875, 2.07794189453125, 2.204254150390625, 2.33056640625, 2.456878662109375, 2.58319091796875, 2.709503173828125, 2.8358154296875, 2.962127685546875, 3.08843994140625, 3.214752197265625, 3.341064453125, 3.467376708984375, 3.59368896484375, 3.720001220703125, 3.8463134765625, 3.972625732421875, 4.09893798828125, 4.225250244140625, 4.3515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 12.0, 11.0, 10.0, 15.0, 17.0, 28.0, 56.0, 76.0, 100.0, 171.0, 275.0, 467.0, 756.0, 1538.0, 3027.0, 6545.0, 15724.0, 44360.0, 158161.0, 550489.0, 185662.0, 49642.0, 17323.0, 7108.0, 3258.0, 1569.0, 865.0, 490.0, 292.0, 167.0, 100.0, 78.0, 35.0, 44.0, 24.0, 17.0, 9.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.72021484375, -0.699371337890625, -0.67852783203125, -0.657684326171875, -0.6368408203125, -0.615997314453125, -0.59515380859375, -0.574310302734375, -0.553466796875, -0.532623291015625, -0.51177978515625, -0.490936279296875, -0.4700927734375, -0.449249267578125, -0.42840576171875, -0.407562255859375, -0.38671875, -0.365875244140625, -0.34503173828125, -0.324188232421875, -0.3033447265625, -0.282501220703125, -0.26165771484375, -0.240814208984375, -0.219970703125, -0.199127197265625, -0.17828369140625, -0.157440185546875, -0.1365966796875, -0.115753173828125, -0.09490966796875, -0.074066162109375, -0.05322265625, -0.032379150390625, -0.01153564453125, 0.009307861328125, 0.0301513671875, 0.050994873046875, 0.07183837890625, 0.092681884765625, 0.113525390625, 0.134368896484375, 0.15521240234375, 0.176055908203125, 0.1968994140625, 0.217742919921875, 0.23858642578125, 0.259429931640625, 0.2802734375, 0.301116943359375, 0.32196044921875, 0.342803955078125, 0.3636474609375, 0.384490966796875, 0.40533447265625, 0.426177978515625, 0.447021484375, 0.467864990234375, 0.48870849609375, 0.509552001953125, 0.5303955078125, 0.551239013671875, 0.57208251953125, 0.592926025390625, 0.61376953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 8.0, 10.0, 9.0, 19.0, 26.0, 22.0, 25.0, 36.0, 44.0, 37.0, 46.0, 43.0, 71.0, 54.0, 45.0, 63.0, 61.0, 44.0, 37.0, 46.0, 53.0, 35.0, 24.0, 27.0, 20.0, 8.0, 18.0, 13.0, 7.0, 10.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.94140625, -6.7425537109375, -6.543701171875, -6.3448486328125, -6.14599609375, -5.9471435546875, -5.748291015625, -5.5494384765625, -5.3505859375, -5.1517333984375, -4.952880859375, -4.7540283203125, -4.55517578125, -4.3563232421875, -4.157470703125, -3.9586181640625, -3.759765625, -3.5609130859375, -3.362060546875, -3.1632080078125, -2.96435546875, -2.7655029296875, -2.566650390625, -2.3677978515625, -2.1689453125, -1.9700927734375, -1.771240234375, -1.5723876953125, -1.37353515625, -1.1746826171875, -0.975830078125, -0.7769775390625, -0.578125, -0.3792724609375, -0.180419921875, 0.0184326171875, 0.21728515625, 0.4161376953125, 0.614990234375, 0.8138427734375, 1.0126953125, 1.2115478515625, 1.410400390625, 1.6092529296875, 1.80810546875, 2.0069580078125, 2.205810546875, 2.4046630859375, 2.603515625, 2.8023681640625, 3.001220703125, 3.2000732421875, 3.39892578125, 3.5977783203125, 3.796630859375, 3.9954833984375, 4.1943359375, 4.3931884765625, 4.592041015625, 4.7908935546875, 4.98974609375, 5.1885986328125, 5.387451171875, 5.5863037109375, 5.78515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 8.0, 6.0, 11.0, 20.0, 35.0, 41.0, 70.0, 97.0, 136.0, 218.0, 425.0, 762.0, 1721.0, 4688.0, 16619.0, 102438.0, 680939.0, 202597.0, 26799.0, 6560.0, 2185.0, 904.0, 495.0, 262.0, 165.0, 110.0, 71.0, 44.0, 36.0, 21.0, 19.0, 14.0, 13.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15731239318847656, -0.15263748168945312, -0.1479625701904297, -0.14328765869140625, -0.1386127471923828, -0.13393783569335938, -0.12926292419433594, -0.1245880126953125, -0.11991310119628906, -0.11523818969726562, -0.11056327819824219, -0.10588836669921875, -0.10121345520019531, -0.09653854370117188, -0.09186363220214844, -0.087188720703125, -0.08251380920410156, -0.07783889770507812, -0.07316398620605469, -0.06848907470703125, -0.06381416320800781, -0.059139251708984375, -0.05446434020996094, -0.0497894287109375, -0.04511451721191406, -0.040439605712890625, -0.03576469421386719, -0.03108978271484375, -0.026414871215820312, -0.021739959716796875, -0.017065048217773438, -0.01239013671875, -0.0077152252197265625, -0.003040313720703125, 0.0016345977783203125, 0.00630950927734375, 0.010984420776367188, 0.015659332275390625, 0.020334243774414062, 0.0250091552734375, 0.029684066772460938, 0.034358978271484375, 0.03903388977050781, 0.04370880126953125, 0.04838371276855469, 0.053058624267578125, 0.05773353576660156, 0.062408447265625, 0.06708335876464844, 0.07175827026367188, 0.07643318176269531, 0.08110809326171875, 0.08578300476074219, 0.09045791625976562, 0.09513282775878906, 0.0998077392578125, 0.10448265075683594, 0.10915756225585938, 0.11383247375488281, 0.11850738525390625, 0.12318229675292969, 0.12785720825195312, 0.13253211975097656, 0.13720703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 11.0, 8.0, 12.0, 25.0, 19.0, 50.0, 52.0, 84.0, 125.0, 165.0, 142.0, 92.0, 75.0, 54.0, 36.0, 14.0, 16.0, 10.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.106231689453125e-05, -7.832609117031097e-05, -7.55898654460907e-05, -7.285363972187042e-05, -7.011741399765015e-05, -6.738118827342987e-05, -6.46449625492096e-05, -6.190873682498932e-05, -5.917251110076904e-05, -5.643628537654877e-05, -5.370005965232849e-05, -5.0963833928108215e-05, -4.822760820388794e-05, -4.5491382479667664e-05, -4.275515675544739e-05, -4.001893103122711e-05, -3.7282705307006836e-05, -3.454647958278656e-05, -3.1810253858566284e-05, -2.9074028134346008e-05, -2.6337802410125732e-05, -2.3601576685905457e-05, -2.086535096168518e-05, -1.8129125237464905e-05, -1.539289951324463e-05, -1.2656673789024353e-05, -9.920448064804077e-06, -7.184222340583801e-06, -4.447996616363525e-06, -1.7117708921432495e-06, 1.0244548320770264e-06, 3.7606805562973022e-06, 6.496906280517578e-06, 9.233132004737854e-06, 1.196935772895813e-05, 1.4705583453178406e-05, 1.744180917739868e-05, 2.0178034901618958e-05, 2.2914260625839233e-05, 2.565048635005951e-05, 2.8386712074279785e-05, 3.112293779850006e-05, 3.385916352272034e-05, 3.659538924694061e-05, 3.933161497116089e-05, 4.2067840695381165e-05, 4.480406641960144e-05, 4.7540292143821716e-05, 5.027651786804199e-05, 5.301274359226227e-05, 5.5748969316482544e-05, 5.848519504070282e-05, 6.12214207649231e-05, 6.395764648914337e-05, 6.669387221336365e-05, 6.943009793758392e-05, 7.21663236618042e-05, 7.490254938602448e-05, 7.763877511024475e-05, 8.037500083446503e-05, 8.31112265586853e-05, 8.584745228290558e-05, 8.858367800712585e-05, 9.131990373134613e-05, 9.40561294555664e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 14.0, 19.0, 15.0, 34.0, 40.0, 55.0, 78.0, 111.0, 187.0, 262.0, 451.0, 817.0, 1572.0, 3595.0, 9810.0, 41875.0, 377999.0, 535042.0, 56388.0, 11919.0, 4208.0, 1774.0, 889.0, 482.0, 272.0, 184.0, 123.0, 107.0, 60.0, 52.0, 29.0, 19.0, 11.0, 15.0, 11.0, 5.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1441650390625, -0.13967132568359375, -0.1351776123046875, -0.13068389892578125, -0.126190185546875, -0.12169647216796875, -0.1172027587890625, -0.11270904541015625, -0.10821533203125, -0.10372161865234375, -0.0992279052734375, -0.09473419189453125, -0.090240478515625, -0.08574676513671875, -0.0812530517578125, -0.07675933837890625, -0.072265625, -0.06777191162109375, -0.0632781982421875, -0.05878448486328125, -0.054290771484375, -0.04979705810546875, -0.0453033447265625, -0.04080963134765625, -0.03631591796875, -0.03182220458984375, -0.0273284912109375, -0.02283477783203125, -0.018341064453125, -0.01384735107421875, -0.0093536376953125, -0.00485992431640625, -0.0003662109375, 0.00412750244140625, 0.0086212158203125, 0.01311492919921875, 0.017608642578125, 0.02210235595703125, 0.0265960693359375, 0.03108978271484375, 0.03558349609375, 0.04007720947265625, 0.0445709228515625, 0.04906463623046875, 0.053558349609375, 0.05805206298828125, 0.0625457763671875, 0.06703948974609375, 0.071533203125, 0.07602691650390625, 0.0805206298828125, 0.08501434326171875, 0.089508056640625, 0.09400177001953125, 0.0984954833984375, 0.10298919677734375, 0.10748291015625, 0.11197662353515625, 0.1164703369140625, 0.12096405029296875, 0.125457763671875, 0.12995147705078125, 0.1344451904296875, 0.13893890380859375, 0.1434326171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 4.0, 11.0, 5.0, 10.0, 16.0, 20.0, 18.0, 17.0, 31.0, 34.0, 64.0, 88.0, 94.0, 112.0, 109.0, 107.0, 47.0, 56.0, 31.0, 26.0, 25.0, 14.0, 13.0, 13.0, 2.0, 6.0, 2.0, 12.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.031707763671875, -0.030704021453857422, -0.029700279235839844, -0.028696537017822266, -0.027692794799804688, -0.02668905258178711, -0.02568531036376953, -0.024681568145751953, -0.023677825927734375, -0.022674083709716797, -0.02167034149169922, -0.02066659927368164, -0.019662857055664062, -0.018659114837646484, -0.017655372619628906, -0.016651630401611328, -0.01564788818359375, -0.014644145965576172, -0.013640403747558594, -0.012636661529541016, -0.011632919311523438, -0.01062917709350586, -0.009625434875488281, -0.008621692657470703, -0.007617950439453125, -0.006614208221435547, -0.005610466003417969, -0.004606723785400391, -0.0036029815673828125, -0.0025992393493652344, -0.0015954971313476562, -0.0005917549133300781, 0.0004119873046875, 0.0014157295227050781, 0.0024194717407226562, 0.0034232139587402344, 0.0044269561767578125, 0.005430698394775391, 0.006434440612792969, 0.007438182830810547, 0.008441925048828125, 0.009445667266845703, 0.010449409484863281, 0.01145315170288086, 0.012456893920898438, 0.013460636138916016, 0.014464378356933594, 0.015468120574951172, 0.01647186279296875, 0.017475605010986328, 0.018479347229003906, 0.019483089447021484, 0.020486831665039062, 0.02149057388305664, 0.02249431610107422, 0.023498058319091797, 0.024501800537109375, 0.025505542755126953, 0.02650928497314453, 0.02751302719116211, 0.028516769409179688, 0.029520511627197266, 0.030524253845214844, 0.03152799606323242, 0.03253173828125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 26.0, 95.0, 231.0, 310.0, 219.0, 96.0, 29.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.412696838378906, -10.102378845214844, -9.792060852050781, -9.481742858886719, -9.171424865722656, -8.861106872558594, -8.550788879394531, -8.240470886230469, -7.9301533699035645, -7.619835376739502, -7.3095173835754395, -6.999199390411377, -6.688881874084473, -6.37856388092041, -6.068245887756348, -5.757927894592285, -5.447609901428223, -5.13729190826416, -4.826973915100098, -4.516655921936035, -4.206337928771973, -3.8960201740264893, -3.585702419281006, -3.2753844261169434, -2.965066432952881, -2.6547484397888184, -2.344430446624756, -2.0341126918792725, -1.72379469871521, -1.4134767055511475, -1.1031588315963745, -0.7928409576416016, -0.48252296447753906, -0.17220503091812134, 0.1381129026412964, 0.4484308362007141, 0.7587487697601318, 1.0690667629241943, 1.3793846368789673, 1.6897025108337402, 2.0000205039978027, 2.3103384971618652, 2.6206564903259277, 2.930974245071411, 3.2412922382354736, 3.551610231399536, 3.8619279861450195, 4.172245979309082, 4.4825639724731445, 4.792881965637207, 5.1031999588012695, 5.413517951965332, 5.7238359451293945, 6.034153938293457, 6.344471454620361, 6.654789447784424, 6.965107440948486, 7.275425434112549, 7.585743427276611, 7.896061420440674, 8.206378936767578, 8.51669692993164, 8.827014923095703, 9.137332916259766, 9.447650909423828]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 16.0, 22.0, 24.0, 27.0, 28.0, 46.0, 51.0, 65.0, 65.0, 86.0, 73.0, 86.0, 71.0, 68.0, 48.0, 55.0, 42.0, 33.0, 29.0, 19.0, 11.0, 15.0, 4.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.410827159881592, -3.299912691116333, -3.188997983932495, -3.0780835151672363, -2.9671688079833984, -2.8562543392181396, -2.7453396320343018, -2.634425163269043, -2.523510456085205, -2.4125959873199463, -2.3016812801361084, -2.1907668113708496, -2.0798521041870117, -1.968937635421753, -1.858022928237915, -1.7471084594726562, -1.636193871498108, -1.5252792835235596, -1.4143646955490112, -1.303450107574463, -1.1925355195999146, -1.0816209316253662, -0.9707064032554626, -0.8597918152809143, -0.748877227306366, -0.6379626393318176, -0.5270480513572693, -0.41613349318504333, -0.305218905210495, -0.19430434703826904, -0.0833897590637207, 0.027524828910827637, 0.13843941688537598, 0.24935400485992432, 0.36026859283447266, 0.4711831510066986, 0.5820977687835693, 0.6930122971534729, 0.8039268851280212, 0.9148414731025696, 1.0257561206817627, 1.136670708656311, 1.2475852966308594, 1.3584998846054077, 1.469414472579956, 1.5803289413452148, 1.6912436485290527, 1.8021581172943115, 1.9130727052688599, 2.023987293243408, 2.134901762008667, 2.245816469192505, 2.3567309379577637, 2.4676456451416016, 2.5785601139068604, 2.6894748210906982, 2.800389289855957, 2.911303758621216, 3.0222184658050537, 3.1331329345703125, 3.2440476417541504, 3.354962110519409, 3.465876817703247, 3.576791286468506, 3.6877059936523438]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 10.0, 27.0, 31.0, 52.0, 86.0, 146.0, 303.0, 712.0, 1952.0, 7885.0, 46721.0, 308670.0, 544499.0, 114606.0, 17292.0, 3518.0, 1122.0, 418.0, 211.0, 107.0, 64.0, 46.0, 16.0, 11.0, 13.0, 6.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.119384765625, -4.96533203125, -4.811279296875, -4.6572265625, -4.503173828125, -4.34912109375, -4.195068359375, -4.041015625, -3.886962890625, -3.73291015625, -3.578857421875, -3.4248046875, -3.270751953125, -3.11669921875, -2.962646484375, -2.80859375, -2.654541015625, -2.50048828125, -2.346435546875, -2.1923828125, -2.038330078125, -1.88427734375, -1.730224609375, -1.576171875, -1.422119140625, -1.26806640625, -1.114013671875, -0.9599609375, -0.805908203125, -0.65185546875, -0.497802734375, -0.34375, -0.189697265625, -0.03564453125, 0.118408203125, 0.2724609375, 0.426513671875, 0.58056640625, 0.734619140625, 0.888671875, 1.042724609375, 1.19677734375, 1.350830078125, 1.5048828125, 1.658935546875, 1.81298828125, 1.967041015625, 2.12109375, 2.275146484375, 2.42919921875, 2.583251953125, 2.7373046875, 2.891357421875, 3.04541015625, 3.199462890625, 3.353515625, 3.507568359375, 3.66162109375, 3.815673828125, 3.9697265625, 4.123779296875, 4.27783203125, 4.431884765625, 4.5859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 5.0, 11.0, 16.0, 16.0, 25.0, 21.0, 37.0, 37.0, 46.0, 61.0, 61.0, 65.0, 52.0, 84.0, 81.0, 68.0, 55.0, 52.0, 36.0, 39.0, 31.0, 25.0, 20.0, 18.0, 13.0, 11.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75634765625, -5.5595703125, -5.36279296875, -5.166015625, -4.96923828125, -4.7724609375, -4.57568359375, -4.37890625, -4.18212890625, -3.9853515625, -3.78857421875, -3.591796875, -3.39501953125, -3.1982421875, -3.00146484375, -2.8046875, -2.60791015625, -2.4111328125, -2.21435546875, -2.017578125, -1.82080078125, -1.6240234375, -1.42724609375, -1.23046875, -1.03369140625, -0.8369140625, -0.64013671875, -0.443359375, -0.24658203125, -0.0498046875, 0.14697265625, 0.34375, 0.54052734375, 0.7373046875, 0.93408203125, 1.130859375, 1.32763671875, 1.5244140625, 1.72119140625, 1.91796875, 2.11474609375, 2.3115234375, 2.50830078125, 2.705078125, 2.90185546875, 3.0986328125, 3.29541015625, 3.4921875, 3.68896484375, 3.8857421875, 4.08251953125, 4.279296875, 4.47607421875, 4.6728515625, 4.86962890625, 5.06640625, 5.26318359375, 5.4599609375, 5.65673828125, 5.853515625, 6.05029296875, 6.2470703125, 6.44384765625, 6.640625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 6.0, 5.0, 14.0, 19.0, 21.0, 44.0, 50.0, 75.0, 114.0, 206.0, 362.0, 759.0, 3184.0, 73415.0, 842140.0, 121880.0, 4374.0, 865.0, 396.0, 205.0, 153.0, 71.0, 65.0, 35.0, 23.0, 21.0, 17.0, 12.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-11.4296875, -11.15472412109375, -10.8797607421875, -10.60479736328125, -10.329833984375, -10.05487060546875, -9.7799072265625, -9.50494384765625, -9.22998046875, -8.95501708984375, -8.6800537109375, -8.40509033203125, -8.130126953125, -7.85516357421875, -7.5802001953125, -7.30523681640625, -7.0302734375, -6.75531005859375, -6.4803466796875, -6.20538330078125, -5.930419921875, -5.65545654296875, -5.3804931640625, -5.10552978515625, -4.83056640625, -4.55560302734375, -4.2806396484375, -4.00567626953125, -3.730712890625, -3.45574951171875, -3.1807861328125, -2.90582275390625, -2.630859375, -2.35589599609375, -2.0809326171875, -1.80596923828125, -1.531005859375, -1.25604248046875, -0.9810791015625, -0.70611572265625, -0.43115234375, -0.15618896484375, 0.1187744140625, 0.39373779296875, 0.668701171875, 0.94366455078125, 1.2186279296875, 1.49359130859375, 1.7685546875, 2.04351806640625, 2.3184814453125, 2.59344482421875, 2.868408203125, 3.14337158203125, 3.4183349609375, 3.69329833984375, 3.96826171875, 4.24322509765625, 4.5181884765625, 4.79315185546875, 5.068115234375, 5.34307861328125, 5.6180419921875, 5.89300537109375, 6.16796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 9.0, 12.0, 22.0, 25.0, 26.0, 42.0, 54.0, 57.0, 78.0, 72.0, 95.0, 82.0, 97.0, 70.0, 72.0, 42.0, 37.0, 36.0, 25.0, 10.0, 13.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1328125, -9.841552734375, -9.55029296875, -9.259033203125, -8.9677734375, -8.676513671875, -8.38525390625, -8.093994140625, -7.802734375, -7.511474609375, -7.22021484375, -6.928955078125, -6.6376953125, -6.346435546875, -6.05517578125, -5.763916015625, -5.47265625, -5.181396484375, -4.89013671875, -4.598876953125, -4.3076171875, -4.016357421875, -3.72509765625, -3.433837890625, -3.142578125, -2.851318359375, -2.56005859375, -2.268798828125, -1.9775390625, -1.686279296875, -1.39501953125, -1.103759765625, -0.8125, -0.521240234375, -0.22998046875, 0.061279296875, 0.3525390625, 0.643798828125, 0.93505859375, 1.226318359375, 1.517578125, 1.808837890625, 2.10009765625, 2.391357421875, 2.6826171875, 2.973876953125, 3.26513671875, 3.556396484375, 3.84765625, 4.138916015625, 4.43017578125, 4.721435546875, 5.0126953125, 5.303955078125, 5.59521484375, 5.886474609375, 6.177734375, 6.468994140625, 6.76025390625, 7.051513671875, 7.3427734375, 7.634033203125, 7.92529296875, 8.216552734375, 8.5078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 6.0, 22.0, 29.0, 56.0, 87.0, 210.0, 961.0, 7635.0, 561152.0, 470110.0, 6921.0, 884.0, 233.0, 95.0, 57.0, 19.0, 10.0, 13.0, 8.0, 7.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8828125, -2.77978515625, -2.6767578125, -2.57373046875, -2.470703125, -2.36767578125, -2.2646484375, -2.16162109375, -2.05859375, -1.95556640625, -1.8525390625, -1.74951171875, -1.646484375, -1.54345703125, -1.4404296875, -1.33740234375, -1.234375, -1.13134765625, -1.0283203125, -0.92529296875, -0.822265625, -0.71923828125, -0.6162109375, -0.51318359375, -0.41015625, -0.30712890625, -0.2041015625, -0.10107421875, 0.001953125, 0.10498046875, 0.2080078125, 0.31103515625, 0.4140625, 0.51708984375, 0.6201171875, 0.72314453125, 0.826171875, 0.92919921875, 1.0322265625, 1.13525390625, 1.23828125, 1.34130859375, 1.4443359375, 1.54736328125, 1.650390625, 1.75341796875, 1.8564453125, 1.95947265625, 2.0625, 2.16552734375, 2.2685546875, 2.37158203125, 2.474609375, 2.57763671875, 2.6806640625, 2.78369140625, 2.88671875, 2.98974609375, 3.0927734375, 3.19580078125, 3.298828125, 3.40185546875, 3.5048828125, 3.60791015625, 3.7109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 10.0, 10.0, 26.0, 23.0, 45.0, 53.0, 62.0, 99.0, 132.0, 153.0, 103.0, 78.0, 60.0, 49.0, 29.0, 21.0, 15.0, 5.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000247955322265625, -0.00023971498012542725, -0.0002314746379852295, -0.00022323429584503174, -0.00021499395370483398, -0.00020675361156463623, -0.00019851326942443848, -0.00019027292728424072, -0.00018203258514404297, -0.00017379224300384521, -0.00016555190086364746, -0.0001573115587234497, -0.00014907121658325195, -0.0001408308744430542, -0.00013259053230285645, -0.0001243501901626587, -0.00011610984802246094, -0.00010786950588226318, -9.962916374206543e-05, -9.138882160186768e-05, -8.314847946166992e-05, -7.490813732147217e-05, -6.666779518127441e-05, -5.842745304107666e-05, -5.0187110900878906e-05, -4.194676876068115e-05, -3.37064266204834e-05, -2.5466084480285645e-05, -1.722574234008789e-05, -8.985400199890137e-06, -7.450580596923828e-07, 7.495284080505371e-06, 1.5735626220703125e-05, 2.397596836090088e-05, 3.221631050109863e-05, 4.045665264129639e-05, 4.869699478149414e-05, 5.6937336921691895e-05, 6.517767906188965e-05, 7.34180212020874e-05, 8.165836334228516e-05, 8.989870548248291e-05, 9.813904762268066e-05, 0.00010637938976287842, 0.00011461973190307617, 0.00012286007404327393, 0.00013110041618347168, 0.00013934075832366943, 0.0001475811004638672, 0.00015582144260406494, 0.0001640617847442627, 0.00017230212688446045, 0.0001805424690246582, 0.00018878281116485596, 0.0001970231533050537, 0.00020526349544525146, 0.00021350383758544922, 0.00022174417972564697, 0.00022998452186584473, 0.00023822486400604248, 0.00024646520614624023, 0.000254705548286438, 0.00026294589042663574, 0.0002711862325668335, 0.00027942657470703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 7.0, 6.0, 10.0, 11.0, 14.0, 30.0, 37.0, 73.0, 171.0, 474.0, 1500.0, 5502.0, 109908.0, 895451.0, 30175.0, 3478.0, 1054.0, 347.0, 138.0, 70.0, 32.0, 9.0, 14.0, 8.0, 9.0, 7.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.451171875, -3.341064453125, -3.23095703125, -3.120849609375, -3.0107421875, -2.900634765625, -2.79052734375, -2.680419921875, -2.5703125, -2.460205078125, -2.35009765625, -2.239990234375, -2.1298828125, -2.019775390625, -1.90966796875, -1.799560546875, -1.689453125, -1.579345703125, -1.46923828125, -1.359130859375, -1.2490234375, -1.138916015625, -1.02880859375, -0.918701171875, -0.80859375, -0.698486328125, -0.58837890625, -0.478271484375, -0.3681640625, -0.258056640625, -0.14794921875, -0.037841796875, 0.072265625, 0.182373046875, 0.29248046875, 0.402587890625, 0.5126953125, 0.622802734375, 0.73291015625, 0.843017578125, 0.953125, 1.063232421875, 1.17333984375, 1.283447265625, 1.3935546875, 1.503662109375, 1.61376953125, 1.723876953125, 1.833984375, 1.944091796875, 2.05419921875, 2.164306640625, 2.2744140625, 2.384521484375, 2.49462890625, 2.604736328125, 2.71484375, 2.824951171875, 2.93505859375, 3.045166015625, 3.1552734375, 3.265380859375, 3.37548828125, 3.485595703125, 3.595703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 6.0, 16.0, 22.0, 27.0, 61.0, 99.0, 119.0, 199.0, 170.0, 105.0, 71.0, 40.0, 24.0, 18.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.31982421875, -1.2783203125, -1.23681640625, -1.1953125, -1.15380859375, -1.1123046875, -1.07080078125, -1.029296875, -0.98779296875, -0.9462890625, -0.90478515625, -0.86328125, -0.82177734375, -0.7802734375, -0.73876953125, -0.697265625, -0.65576171875, -0.6142578125, -0.57275390625, -0.53125, -0.48974609375, -0.4482421875, -0.40673828125, -0.365234375, -0.32373046875, -0.2822265625, -0.24072265625, -0.19921875, -0.15771484375, -0.1162109375, -0.07470703125, -0.033203125, 0.00830078125, 0.0498046875, 0.09130859375, 0.1328125, 0.17431640625, 0.2158203125, 0.25732421875, 0.298828125, 0.34033203125, 0.3818359375, 0.42333984375, 0.46484375, 0.50634765625, 0.5478515625, 0.58935546875, 0.630859375, 0.67236328125, 0.7138671875, 0.75537109375, 0.796875, 0.83837890625, 0.8798828125, 0.92138671875, 0.962890625, 1.00439453125, 1.0458984375, 1.08740234375, 1.12890625, 1.17041015625, 1.2119140625, 1.25341796875, 1.294921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 25.0, 78.0, 151.0, 203.0, 235.0, 164.0, 99.0, 40.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.679859161376953, -21.189781188964844, -20.6997013092041, -20.209623336791992, -19.719545364379883, -19.22946548461914, -18.73938751220703, -18.249309539794922, -17.759231567382812, -17.269153594970703, -16.77907371520996, -16.28899574279785, -15.798917770385742, -15.308838844299316, -14.81875991821289, -14.328681945800781, -13.838602066040039, -13.348523139953613, -12.858445167541504, -12.368366241455078, -11.878288269042969, -11.388209342956543, -10.898130416870117, -10.408052444458008, -9.917974472045898, -9.427895545959473, -8.937817573547363, -8.447738647460938, -7.95766019821167, -7.467581748962402, -6.977503299713135, -6.487424850463867, -5.997345924377441, -5.507267475128174, -5.017189025878906, -4.5271100997924805, -4.037031650543213, -3.5469532012939453, -3.0568747520446777, -2.566796064376831, -2.0767176151275635, -1.5866390466690063, -1.0965604782104492, -0.6064820289611816, -0.11640346050262451, 0.3736751079559326, 0.8637535572052002, 1.3538322448730469, 1.8439106941223145, 2.333989143371582, 2.8240678310394287, 3.3141462802886963, 3.804224967956543, 4.2943034172058105, 4.784381866455078, 5.274460792541504, 5.764538764953613, 6.254617214202881, 6.744695663452148, 7.234774589538574, 7.724853038787842, 8.21493148803711, 8.705009460449219, 9.195088386535645, 9.68516731262207]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 8.0, 4.0, 13.0, 17.0, 7.0, 16.0, 20.0, 30.0, 15.0, 27.0, 28.0, 30.0, 40.0, 48.0, 39.0, 60.0, 53.0, 46.0, 31.0, 41.0, 44.0, 41.0, 43.0, 40.0, 25.0, 31.0, 32.0, 25.0, 16.0, 21.0, 20.0, 14.0, 17.0, 9.0, 13.0, 6.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.39370346069336, -8.103063583374023, -7.8124237060546875, -7.521783828735352, -7.231143951416016, -6.94050407409668, -6.6498637199401855, -6.35922384262085, -6.068583965301514, -5.777944087982178, -5.487304210662842, -5.196664333343506, -4.906023979187012, -4.615384101867676, -4.32474422454834, -4.034104347229004, -3.743464469909668, -3.452824592590332, -3.162184715270996, -2.871544599533081, -2.580904722213745, -2.290264844894409, -1.9996248483657837, -1.7089848518371582, -1.4183449745178223, -1.1277050971984863, -0.8370651006698608, -0.5464251637458801, -0.2557852268218994, 0.03485465049743652, 0.325494647026062, 0.6161346435546875, 0.9067745208740234, 1.1974143981933594, 1.4880543947219849, 1.7786943912506104, 2.0693342685699463, 2.3599741458892822, 2.6506142616271973, 2.941254138946533, 3.231894016265869, 3.522533893585205, 3.813173770904541, 4.103813648223877, 4.394454002380371, 4.685093879699707, 4.975733757019043, 5.266373634338379, 5.557013511657715, 5.847653388977051, 6.138293266296387, 6.428933143615723, 6.719573020935059, 7.0102128982543945, 7.300853252410889, 7.591493129730225, 7.8821330070495605, 8.172773361206055, 8.46341323852539, 8.754053115844727, 9.044692993164062, 9.335332870483398, 9.625972747802734, 9.91661262512207, 10.207252502441406]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 12.0, 24.0, 38.0, 41.0, 58.0, 94.0, 114.0, 219.0, 340.0, 829.0, 5089.0, 789990.0, 3382096.0, 13000.0, 1192.0, 421.0, 242.0, 155.0, 111.0, 80.0, 43.0, 37.0, 23.0, 19.0, 5.0, 10.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.7884521484375, -9.365966796875, -8.9434814453125, -8.52099609375, -8.0985107421875, -7.676025390625, -7.2535400390625, -6.8310546875, -6.4085693359375, -5.986083984375, -5.5635986328125, -5.14111328125, -4.7186279296875, -4.296142578125, -3.8736572265625, -3.451171875, -3.0286865234375, -2.606201171875, -2.1837158203125, -1.76123046875, -1.3387451171875, -0.916259765625, -0.4937744140625, -0.0712890625, 0.3511962890625, 0.773681640625, 1.1961669921875, 1.61865234375, 2.0411376953125, 2.463623046875, 2.8861083984375, 3.30859375, 3.7310791015625, 4.153564453125, 4.5760498046875, 4.99853515625, 5.4210205078125, 5.843505859375, 6.2659912109375, 6.6884765625, 7.1109619140625, 7.533447265625, 7.9559326171875, 8.37841796875, 8.8009033203125, 9.223388671875, 9.6458740234375, 10.068359375, 10.4908447265625, 10.913330078125, 11.3358154296875, 11.75830078125, 12.1807861328125, 12.603271484375, 13.0257568359375, 13.4482421875, 13.8707275390625, 14.293212890625, 14.7156982421875, 15.13818359375, 15.5606689453125, 15.983154296875, 16.4056396484375, 16.828125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 15.0, 19.0, 22.0, 34.0, 32.0, 53.0, 54.0, 68.0, 72.0, 69.0, 68.0, 73.0, 77.0, 67.0, 52.0, 47.0, 44.0, 35.0, 25.0, 22.0, 18.0, 11.0, 5.0, 2.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.080078125, -2.944976806640625, -2.80987548828125, -2.674774169921875, -2.5396728515625, -2.404571533203125, -2.26947021484375, -2.134368896484375, -1.999267578125, -1.864166259765625, -1.72906494140625, -1.593963623046875, -1.4588623046875, -1.323760986328125, -1.18865966796875, -1.053558349609375, -0.91845703125, -0.783355712890625, -0.64825439453125, -0.513153076171875, -0.3780517578125, -0.242950439453125, -0.10784912109375, 0.027252197265625, 0.162353515625, 0.297454833984375, 0.43255615234375, 0.567657470703125, 0.7027587890625, 0.837860107421875, 0.97296142578125, 1.108062744140625, 1.2431640625, 1.378265380859375, 1.51336669921875, 1.648468017578125, 1.7835693359375, 1.918670654296875, 2.05377197265625, 2.188873291015625, 2.323974609375, 2.459075927734375, 2.59417724609375, 2.729278564453125, 2.8643798828125, 2.999481201171875, 3.13458251953125, 3.269683837890625, 3.40478515625, 3.539886474609375, 3.67498779296875, 3.810089111328125, 3.9451904296875, 4.080291748046875, 4.21539306640625, 4.350494384765625, 4.485595703125, 4.620697021484375, 4.75579833984375, 4.890899658203125, 5.0260009765625, 5.161102294921875, 5.29620361328125, 5.431304931640625, 5.56640625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 10.0, 4.0, 20.0, 72.0, 228.0, 1254.0, 98464.0, 4090910.0, 2745.0, 399.0, 80.0, 40.0, 15.0, 9.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.375, -26.4677734375, -25.560546875, -24.6533203125, -23.74609375, -22.8388671875, -21.931640625, -21.0244140625, -20.1171875, -19.2099609375, -18.302734375, -17.3955078125, -16.48828125, -15.5810546875, -14.673828125, -13.7666015625, -12.859375, -11.9521484375, -11.044921875, -10.1376953125, -9.23046875, -8.3232421875, -7.416015625, -6.5087890625, -5.6015625, -4.6943359375, -3.787109375, -2.8798828125, -1.97265625, -1.0654296875, -0.158203125, 0.7490234375, 1.65625, 2.5634765625, 3.470703125, 4.3779296875, 5.28515625, 6.1923828125, 7.099609375, 8.0068359375, 8.9140625, 9.8212890625, 10.728515625, 11.6357421875, 12.54296875, 13.4501953125, 14.357421875, 15.2646484375, 16.171875, 17.0791015625, 17.986328125, 18.8935546875, 19.80078125, 20.7080078125, 21.615234375, 22.5224609375, 23.4296875, 24.3369140625, 25.244140625, 26.1513671875, 27.05859375, 27.9658203125, 28.873046875, 29.7802734375, 30.6875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 11.0, 44.0, 170.0, 746.0, 1841.0, 940.0, 225.0, 58.0, 23.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.40234375, -5.24603271484375, -5.0897216796875, -4.93341064453125, -4.777099609375, -4.62078857421875, -4.4644775390625, -4.30816650390625, -4.15185546875, -3.99554443359375, -3.8392333984375, -3.68292236328125, -3.526611328125, -3.37030029296875, -3.2139892578125, -3.05767822265625, -2.9013671875, -2.74505615234375, -2.5887451171875, -2.43243408203125, -2.276123046875, -2.11981201171875, -1.9635009765625, -1.80718994140625, -1.65087890625, -1.49456787109375, -1.3382568359375, -1.18194580078125, -1.025634765625, -0.86932373046875, -0.7130126953125, -0.55670166015625, -0.400390625, -0.24407958984375, -0.0877685546875, 0.06854248046875, 0.224853515625, 0.38116455078125, 0.5374755859375, 0.69378662109375, 0.85009765625, 1.00640869140625, 1.1627197265625, 1.31903076171875, 1.475341796875, 1.63165283203125, 1.7879638671875, 1.94427490234375, 2.1005859375, 2.25689697265625, 2.4132080078125, 2.56951904296875, 2.725830078125, 2.88214111328125, 3.0384521484375, 3.19476318359375, 3.35107421875, 3.50738525390625, 3.6636962890625, 3.82000732421875, 3.976318359375, 4.13262939453125, 4.2889404296875, 4.44525146484375, 4.6015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 16.0, 29.0, 50.0, 85.0, 88.0, 108.0, 137.0, 127.0, 97.0, 91.0, 77.0, 44.0, 32.0, 12.0, 11.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.574495315551758, -3.3629133701324463, -3.1513314247131348, -2.9397497177124023, -2.7281675338745117, -2.5165858268737793, -2.3050038814544678, -2.0934219360351562, -1.8818399906158447, -1.6702580451965332, -1.4586760997772217, -1.2470942735671997, -1.0355123281478882, -0.8239303827285767, -0.6123485565185547, -0.40076661109924316, -0.18918466567993164, 0.022397249937057495, 0.23397916555404663, 0.4455610513687134, 0.6571429967880249, 0.8687249422073364, 1.0803067684173584, 1.29188871383667, 1.5034706592559814, 1.715052604675293, 1.9266345500946045, 2.138216495513916, 2.3497982025146484, 2.561380386352539, 2.7729620933532715, 2.984544038772583, 3.1961259841918945, 3.407707929611206, 3.6192898750305176, 3.83087158203125, 4.042453765869141, 4.254035472869873, 4.4656171798706055, 4.677199363708496, 4.888781547546387, 5.100363254547119, 5.31194543838501, 5.523527145385742, 5.735109329223633, 5.946691036224365, 6.158272743225098, 6.369854927062988, 6.581436634063721, 6.793018341064453, 7.004600524902344, 7.216182231903076, 7.427764415740967, 7.639346122741699, 7.85092830657959, 8.062509536743164, 8.274091720581055, 8.485673904418945, 8.69725513458252, 8.90883731842041, 9.1204195022583, 9.332001686096191, 9.543582916259766, 9.755165100097656, 9.966747283935547]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 15.0, 14.0, 13.0, 14.0, 18.0, 18.0, 22.0, 30.0, 27.0, 37.0, 36.0, 45.0, 46.0, 45.0, 56.0, 45.0, 40.0, 50.0, 40.0, 37.0, 44.0, 39.0, 39.0, 25.0, 34.0, 29.0, 17.0, 21.0, 14.0, 16.0, 12.0, 9.0, 5.0, 10.0, 5.0, 7.0, 5.0, 0.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.976426601409912, -2.8715806007385254, -2.7667346000671387, -2.661888599395752, -2.5570428371429443, -2.4521968364715576, -2.347350835800171, -2.242504835128784, -2.1376590728759766, -2.03281307220459, -1.9279671907424927, -1.823121190071106, -1.7182753086090088, -1.613429307937622, -1.5085833072662354, -1.4037373065948486, -1.298891305923462, -1.1940453052520752, -1.089199423789978, -0.9843534231185913, -0.8795074820518494, -0.7746615409851074, -0.6698155403137207, -0.5649695992469788, -0.4601236581802368, -0.3552777171134949, -0.25043174624443054, -0.1455857753753662, -0.04073983430862427, 0.06410610675811768, 0.1689521074295044, 0.27379804849624634, 0.3786439895629883, 0.4834899306297302, 0.5883358716964722, 0.6931818723678589, 0.7980278134346008, 0.9028737545013428, 1.0077197551727295, 1.1125657558441162, 1.2174116373062134, 1.3222576379776, 1.4271035194396973, 1.531949520111084, 1.6367955207824707, 1.7416414022445679, 1.8464874029159546, 1.9513332843780518, 2.0561792850494385, 2.161025285720825, 2.265871286392212, 2.3707170486450195, 2.4755630493164062, 2.580409049987793, 2.6852550506591797, 2.7901010513305664, 2.894947052001953, 2.99979305267334, 3.1046390533447266, 3.2094850540161133, 3.314330816268921, 3.4191768169403076, 3.5240228176116943, 3.628868818283081, 3.7337145805358887]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 10.0, 17.0, 23.0, 41.0, 43.0, 83.0, 157.0, 234.0, 402.0, 897.0, 2721.0, 16649.0, 238576.0, 739993.0, 41050.0, 5106.0, 1255.0, 510.0, 291.0, 182.0, 108.0, 63.0, 50.0, 32.0, 23.0, 16.0, 2.0, 2.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.0959930419921875, -2.039642333984375, -1.9832916259765625, -1.92694091796875, -1.8705902099609375, -1.814239501953125, -1.7578887939453125, -1.7015380859375, -1.6451873779296875, -1.588836669921875, -1.5324859619140625, -1.47613525390625, -1.4197845458984375, -1.363433837890625, -1.3070831298828125, -1.250732421875, -1.1943817138671875, -1.138031005859375, -1.0816802978515625, -1.02532958984375, -0.9689788818359375, -0.912628173828125, -0.8562774658203125, -0.7999267578125, -0.7435760498046875, -0.687225341796875, -0.6308746337890625, -0.57452392578125, -0.5181732177734375, -0.461822509765625, -0.4054718017578125, -0.34912109375, -0.2927703857421875, -0.236419677734375, -0.1800689697265625, -0.12371826171875, -0.0673675537109375, -0.011016845703125, 0.0453338623046875, 0.1016845703125, 0.1580352783203125, 0.214385986328125, 0.2707366943359375, 0.32708740234375, 0.3834381103515625, 0.439788818359375, 0.4961395263671875, 0.552490234375, 0.6088409423828125, 0.665191650390625, 0.7215423583984375, 0.77789306640625, 0.8342437744140625, 0.890594482421875, 0.9469451904296875, 1.0032958984375, 1.0596466064453125, 1.115997314453125, 1.1723480224609375, 1.22869873046875, 1.2850494384765625, 1.341400146484375, 1.3977508544921875, 1.4541015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 0.0, 8.0, 10.0, 17.0, 17.0, 19.0, 30.0, 26.0, 36.0, 44.0, 38.0, 60.0, 60.0, 70.0, 67.0, 59.0, 59.0, 77.0, 47.0, 50.0, 46.0, 40.0, 30.0, 24.0, 9.0, 21.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -1.99462890625, -1.8994140625, -1.80419921875, -1.708984375, -1.61376953125, -1.5185546875, -1.42333984375, -1.328125, -1.23291015625, -1.1376953125, -1.04248046875, -0.947265625, -0.85205078125, -0.7568359375, -0.66162109375, -0.56640625, -0.47119140625, -0.3759765625, -0.28076171875, -0.185546875, -0.09033203125, 0.0048828125, 0.10009765625, 0.1953125, 0.29052734375, 0.3857421875, 0.48095703125, 0.576171875, 0.67138671875, 0.7666015625, 0.86181640625, 0.95703125, 1.05224609375, 1.1474609375, 1.24267578125, 1.337890625, 1.43310546875, 1.5283203125, 1.62353515625, 1.71875, 1.81396484375, 1.9091796875, 2.00439453125, 2.099609375, 2.19482421875, 2.2900390625, 2.38525390625, 2.48046875, 2.57568359375, 2.6708984375, 2.76611328125, 2.861328125, 2.95654296875, 3.0517578125, 3.14697265625, 3.2421875, 3.33740234375, 3.4326171875, 3.52783203125, 3.623046875, 3.71826171875, 3.8134765625, 3.90869140625, 4.00390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 5.0, 12.0, 10.0, 17.0, 31.0, 33.0, 70.0, 97.0, 182.0, 334.0, 582.0, 1306.0, 2829.0, 7138.0, 21393.0, 81361.0, 479508.0, 361994.0, 63008.0, 17671.0, 6122.0, 2438.0, 1139.0, 531.0, 301.0, 181.0, 81.0, 63.0, 45.0, 21.0, 17.0, 13.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9697265625, -0.941131591796875, -0.91253662109375, -0.883941650390625, -0.8553466796875, -0.826751708984375, -0.79815673828125, -0.769561767578125, -0.740966796875, -0.712371826171875, -0.68377685546875, -0.655181884765625, -0.6265869140625, -0.597991943359375, -0.56939697265625, -0.540802001953125, -0.51220703125, -0.483612060546875, -0.45501708984375, -0.426422119140625, -0.3978271484375, -0.369232177734375, -0.34063720703125, -0.312042236328125, -0.283447265625, -0.254852294921875, -0.22625732421875, -0.197662353515625, -0.1690673828125, -0.140472412109375, -0.11187744140625, -0.083282470703125, -0.0546875, -0.026092529296875, 0.00250244140625, 0.031097412109375, 0.0596923828125, 0.088287353515625, 0.11688232421875, 0.145477294921875, 0.174072265625, 0.202667236328125, 0.23126220703125, 0.259857177734375, 0.2884521484375, 0.317047119140625, 0.34564208984375, 0.374237060546875, 0.40283203125, 0.431427001953125, 0.46002197265625, 0.488616943359375, 0.5172119140625, 0.545806884765625, 0.57440185546875, 0.602996826171875, 0.631591796875, 0.660186767578125, 0.68878173828125, 0.717376708984375, 0.7459716796875, 0.774566650390625, 0.80316162109375, 0.831756591796875, 0.8603515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 4.0, 7.0, 5.0, 16.0, 6.0, 9.0, 24.0, 23.0, 18.0, 33.0, 44.0, 51.0, 57.0, 57.0, 60.0, 50.0, 83.0, 58.0, 67.0, 56.0, 49.0, 40.0, 33.0, 33.0, 19.0, 23.0, 17.0, 16.0, 8.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.53076171875, -8.2724609375, -8.01416015625, -7.755859375, -7.49755859375, -7.2392578125, -6.98095703125, -6.72265625, -6.46435546875, -6.2060546875, -5.94775390625, -5.689453125, -5.43115234375, -5.1728515625, -4.91455078125, -4.65625, -4.39794921875, -4.1396484375, -3.88134765625, -3.623046875, -3.36474609375, -3.1064453125, -2.84814453125, -2.58984375, -2.33154296875, -2.0732421875, -1.81494140625, -1.556640625, -1.29833984375, -1.0400390625, -0.78173828125, -0.5234375, -0.26513671875, -0.0068359375, 0.25146484375, 0.509765625, 0.76806640625, 1.0263671875, 1.28466796875, 1.54296875, 1.80126953125, 2.0595703125, 2.31787109375, 2.576171875, 2.83447265625, 3.0927734375, 3.35107421875, 3.609375, 3.86767578125, 4.1259765625, 4.38427734375, 4.642578125, 4.90087890625, 5.1591796875, 5.41748046875, 5.67578125, 5.93408203125, 6.1923828125, 6.45068359375, 6.708984375, 6.96728515625, 7.2255859375, 7.48388671875, 7.7421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 14.0, 9.0, 17.0, 22.0, 47.0, 38.0, 79.0, 97.0, 167.0, 319.0, 695.0, 1816.0, 8780.0, 168226.0, 839494.0, 23379.0, 3280.0, 1036.0, 450.0, 207.0, 129.0, 68.0, 45.0, 44.0, 25.0, 19.0, 17.0, 9.0, 9.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.57373046875, -0.5569648742675781, -0.5401992797851562, -0.5234336853027344, -0.5066680908203125, -0.4899024963378906, -0.47313690185546875, -0.4563713073730469, -0.439605712890625, -0.4228401184082031, -0.40607452392578125, -0.3893089294433594, -0.3725433349609375, -0.3557777404785156, -0.33901214599609375, -0.3222465515136719, -0.30548095703125, -0.2887153625488281, -0.27194976806640625, -0.2551841735839844, -0.2384185791015625, -0.22165298461914062, -0.20488739013671875, -0.18812179565429688, -0.171356201171875, -0.15459060668945312, -0.13782501220703125, -0.12105941772460938, -0.1042938232421875, -0.08752822875976562, -0.07076263427734375, -0.053997039794921875, -0.0372314453125, -0.020465850830078125, -0.00370025634765625, 0.013065338134765625, 0.0298309326171875, 0.046596527099609375, 0.06336212158203125, 0.08012771606445312, 0.096893310546875, 0.11365890502929688, 0.13042449951171875, 0.14719009399414062, 0.1639556884765625, 0.18072128295898438, 0.19748687744140625, 0.21425247192382812, 0.23101806640625, 0.24778366088867188, 0.26454925537109375, 0.2813148498535156, 0.2980804443359375, 0.3148460388183594, 0.33161163330078125, 0.3483772277832031, 0.365142822265625, 0.3819084167480469, 0.39867401123046875, 0.4154396057128906, 0.4322052001953125, 0.4489707946777344, 0.46573638916015625, 0.4825019836425781, 0.499267578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 14.0, 26.0, 35.0, 74.0, 115.0, 130.0, 132.0, 147.0, 103.0, 72.0, 51.0, 44.0, 22.0, 10.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012302398681640625, -0.0001185983419418335, -0.00011417269706726074, -0.00010974705219268799, -0.00010532140731811523, -0.00010089576244354248, -9.647011756896973e-05, -9.204447269439697e-05, -8.761882781982422e-05, -8.319318294525146e-05, -7.876753807067871e-05, -7.434189319610596e-05, -6.99162483215332e-05, -6.549060344696045e-05, -6.10649585723877e-05, -5.663931369781494e-05, -5.221366882324219e-05, -4.7788023948669434e-05, -4.336237907409668e-05, -3.8936734199523926e-05, -3.451108932495117e-05, -3.0085444450378418e-05, -2.5659799575805664e-05, -2.123415470123291e-05, -1.6808509826660156e-05, -1.2382864952087402e-05, -7.957220077514648e-06, -3.5315752029418945e-06, 8.940696716308594e-07, 5.319714546203613e-06, 9.745359420776367e-06, 1.4171004295349121e-05, 1.8596649169921875e-05, 2.302229404449463e-05, 2.7447938919067383e-05, 3.187358379364014e-05, 3.629922866821289e-05, 4.0724873542785645e-05, 4.51505184173584e-05, 4.957616329193115e-05, 5.4001808166503906e-05, 5.842745304107666e-05, 6.285309791564941e-05, 6.727874279022217e-05, 7.170438766479492e-05, 7.613003253936768e-05, 8.055567741394043e-05, 8.498132228851318e-05, 8.940696716308594e-05, 9.383261203765869e-05, 9.825825691223145e-05, 0.0001026839017868042, 0.00010710954666137695, 0.00011153519153594971, 0.00011596083641052246, 0.00012038648128509521, 0.00012481212615966797, 0.00012923777103424072, 0.00013366341590881348, 0.00013808906078338623, 0.00014251470565795898, 0.00014694035053253174, 0.0001513659954071045, 0.00015579164028167725, 0.00016021728515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 10.0, 11.0, 11.0, 18.0, 36.0, 52.0, 85.0, 121.0, 264.0, 475.0, 1081.0, 2960.0, 8422.0, 27758.0, 144850.0, 716415.0, 112496.0, 22893.0, 6741.0, 2218.0, 843.0, 355.0, 156.0, 94.0, 59.0, 42.0, 18.0, 21.0, 17.0, 9.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2737159729003906, -0.26374053955078125, -0.2537651062011719, -0.2437896728515625, -0.23381423950195312, -0.22383880615234375, -0.21386337280273438, -0.203887939453125, -0.19391250610351562, -0.18393707275390625, -0.17396163940429688, -0.1639862060546875, -0.15401077270507812, -0.14403533935546875, -0.13405990600585938, -0.12408447265625, -0.11410903930664062, -0.10413360595703125, -0.09415817260742188, -0.0841827392578125, -0.07420730590820312, -0.06423187255859375, -0.054256439208984375, -0.044281005859375, -0.034305572509765625, -0.02433013916015625, -0.014354705810546875, -0.0043792724609375, 0.005596160888671875, 0.01557159423828125, 0.025547027587890625, 0.0355224609375, 0.045497894287109375, 0.05547332763671875, 0.06544876098632812, 0.0754241943359375, 0.08539962768554688, 0.09537506103515625, 0.10535049438476562, 0.115325927734375, 0.12530136108398438, 0.13527679443359375, 0.14525222778320312, 0.1552276611328125, 0.16520309448242188, 0.17517852783203125, 0.18515396118164062, 0.19512939453125, 0.20510482788085938, 0.21508026123046875, 0.22505569458007812, 0.2350311279296875, 0.24500656127929688, 0.25498199462890625, 0.2649574279785156, 0.274932861328125, 0.2849082946777344, 0.29488372802734375, 0.3048591613769531, 0.3148345947265625, 0.3248100280761719, 0.33478546142578125, 0.3447608947753906, 0.354736328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 11.0, 4.0, 9.0, 13.0, 19.0, 11.0, 22.0, 26.0, 35.0, 52.0, 82.0, 138.0, 167.0, 132.0, 79.0, 42.0, 33.0, 20.0, 18.0, 15.0, 9.0, 11.0, 9.0, 5.0, 6.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.128662109375, -0.1250133514404297, -0.12136459350585938, -0.11771583557128906, -0.11406707763671875, -0.11041831970214844, -0.10676956176757812, -0.10312080383300781, -0.0994720458984375, -0.09582328796386719, -0.09217453002929688, -0.08852577209472656, -0.08487701416015625, -0.08122825622558594, -0.07757949829101562, -0.07393074035644531, -0.070281982421875, -0.06663322448730469, -0.06298446655273438, -0.05933570861816406, -0.05568695068359375, -0.05203819274902344, -0.048389434814453125, -0.04474067687988281, -0.0410919189453125, -0.03744316101074219, -0.033794403076171875, -0.030145645141601562, -0.02649688720703125, -0.022848129272460938, -0.019199371337890625, -0.015550613403320312, -0.01190185546875, -0.008253097534179688, -0.004604339599609375, -0.0009555816650390625, 0.00269317626953125, 0.0063419342041015625, 0.009990692138671875, 0.013639450073242188, 0.0172882080078125, 0.020936965942382812, 0.024585723876953125, 0.028234481811523438, 0.03188323974609375, 0.03553199768066406, 0.039180755615234375, 0.04282951354980469, 0.046478271484375, 0.05012702941894531, 0.053775787353515625, 0.05742454528808594, 0.06107330322265625, 0.06472206115722656, 0.06837081909179688, 0.07201957702636719, 0.0756683349609375, 0.07931709289550781, 0.08296585083007812, 0.08661460876464844, 0.09026336669921875, 0.09391212463378906, 0.09756088256835938, 0.10120964050292969, 0.1048583984375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 27.0, 64.0, 118.0, 158.0, 190.0, 166.0, 131.0, 86.0, 34.0, 16.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.433723449707031, -5.25148868560791, -5.069253921508789, -4.887019634246826, -4.704784870147705, -4.522550106048584, -4.340315818786621, -4.1580810546875, -3.975846290588379, -3.793611526489258, -3.611377000808716, -3.429142475128174, -3.2469077110290527, -3.0646729469299316, -2.8824384212493896, -2.7002038955688477, -2.5179691314697266, -2.3357343673706055, -2.1534998416900635, -1.971265196800232, -1.7890305519104004, -1.6067959070205688, -1.4245612621307373, -1.2423266172409058, -1.0600919723510742, -0.8778573274612427, -0.6956226825714111, -0.5133880376815796, -0.33115339279174805, -0.1489187479019165, 0.03331589698791504, 0.21555054187774658, 0.3977851867675781, 0.5800198316574097, 0.7622544765472412, 0.9444891214370728, 1.1267237663269043, 1.3089584112167358, 1.4911930561065674, 1.673427700996399, 1.8556623458862305, 2.0378971099853516, 2.2201316356658936, 2.4023661613464355, 2.5846009254455566, 2.7668356895446777, 2.9490702152252197, 3.1313047409057617, 3.313539505004883, 3.495774269104004, 3.678008794784546, 3.860243320465088, 4.042478084564209, 4.22471284866333, 4.406947135925293, 4.589181900024414, 4.771416664123535, 4.953651428222656, 5.135886192321777, 5.31812047958374, 5.500355243682861, 5.682590007781982, 5.864824295043945, 6.047059059143066, 6.2292938232421875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 8.0, 12.0, 21.0, 19.0, 17.0, 30.0, 20.0, 36.0, 48.0, 44.0, 60.0, 59.0, 63.0, 59.0, 56.0, 56.0, 60.0, 60.0, 44.0, 43.0, 40.0, 30.0, 20.0, 24.0, 18.0, 12.0, 10.0, 10.0, 4.0, 6.0, 5.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9969929456710815, -1.910638689994812, -1.824284553527832, -1.7379302978515625, -1.6515761613845825, -1.565221905708313, -1.478867769241333, -1.3925135135650635, -1.306159257888794, -1.2198050022125244, -1.1334508657455444, -1.047096610069275, -0.9607424736022949, -0.8743882179260254, -0.7880340218544006, -0.7016798257827759, -0.6153256893157959, -0.5289714932441711, -0.4426172971725464, -0.35626307129859924, -0.2699088752269745, -0.18355467915534973, -0.09720045328140259, -0.010846257209777832, 0.07550793886184692, 0.16186213493347168, 0.24821634590625763, 0.3345705568790436, 0.42092475295066833, 0.5072789192199707, 0.5936331748962402, 0.679987370967865, 0.7663414478302002, 0.852695643901825, 0.9390498399734497, 1.0254040956497192, 1.1117582321166992, 1.1981124877929688, 1.2844667434692383, 1.3708208799362183, 1.4571750164031982, 1.5435292720794678, 1.6298834085464478, 1.7162376642227173, 1.8025918006896973, 1.8889460563659668, 1.9753003120422363, 2.061654567718506, 2.1480088233947754, 2.234363079071045, 2.3207173347473145, 2.407071352005005, 2.4934256076812744, 2.579779863357544, 2.6661341190338135, 2.752488136291504, 2.8388423919677734, 2.925196647644043, 3.0115509033203125, 3.097904920578003, 3.1842591762542725, 3.270613431930542, 3.3569676876068115, 3.443321704864502, 3.5296759605407715]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 12.0, 8.0, 21.0, 16.0, 47.0, 81.0, 103.0, 196.0, 335.0, 683.0, 1529.0, 4654.0, 17312.0, 76737.0, 283537.0, 431009.0, 175461.0, 41837.0, 9962.0, 2813.0, 1097.0, 478.0, 251.0, 136.0, 88.0, 45.0, 36.0, 29.0, 13.0, 11.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.9151611328125, -3.771728515625, -3.6282958984375, -3.48486328125, -3.3414306640625, -3.197998046875, -3.0545654296875, -2.9111328125, -2.7677001953125, -2.624267578125, -2.4808349609375, -2.33740234375, -2.1939697265625, -2.050537109375, -1.9071044921875, -1.763671875, -1.6202392578125, -1.476806640625, -1.3333740234375, -1.18994140625, -1.0465087890625, -0.903076171875, -0.7596435546875, -0.6162109375, -0.4727783203125, -0.329345703125, -0.1859130859375, -0.04248046875, 0.1009521484375, 0.244384765625, 0.3878173828125, 0.53125, 0.6746826171875, 0.818115234375, 0.9615478515625, 1.10498046875, 1.2484130859375, 1.391845703125, 1.5352783203125, 1.6787109375, 1.8221435546875, 1.965576171875, 2.1090087890625, 2.25244140625, 2.3958740234375, 2.539306640625, 2.6827392578125, 2.826171875, 2.9696044921875, 3.113037109375, 3.2564697265625, 3.39990234375, 3.5433349609375, 3.686767578125, 3.8302001953125, 3.9736328125, 4.1170654296875, 4.260498046875, 4.4039306640625, 4.54736328125, 4.6907958984375, 4.834228515625, 4.9776611328125, 5.12109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 4.0, 7.0, 16.0, 15.0, 21.0, 24.0, 50.0, 35.0, 54.0, 66.0, 62.0, 86.0, 67.0, 79.0, 61.0, 75.0, 59.0, 56.0, 43.0, 29.0, 14.0, 26.0, 13.0, 8.0, 17.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.67962646484375, -4.5115966796875, -4.34356689453125, -4.175537109375, -4.00750732421875, -3.8394775390625, -3.67144775390625, -3.50341796875, -3.33538818359375, -3.1673583984375, -2.99932861328125, -2.831298828125, -2.66326904296875, -2.4952392578125, -2.32720947265625, -2.1591796875, -1.99114990234375, -1.8231201171875, -1.65509033203125, -1.487060546875, -1.31903076171875, -1.1510009765625, -0.98297119140625, -0.81494140625, -0.64691162109375, -0.4788818359375, -0.31085205078125, -0.142822265625, 0.02520751953125, 0.1932373046875, 0.36126708984375, 0.529296875, 0.69732666015625, 0.8653564453125, 1.03338623046875, 1.201416015625, 1.36944580078125, 1.5374755859375, 1.70550537109375, 1.87353515625, 2.04156494140625, 2.2095947265625, 2.37762451171875, 2.545654296875, 2.71368408203125, 2.8817138671875, 3.04974365234375, 3.2177734375, 3.38580322265625, 3.5538330078125, 3.72186279296875, 3.889892578125, 4.05792236328125, 4.2259521484375, 4.39398193359375, 4.56201171875, 4.73004150390625, 4.8980712890625, 5.06610107421875, 5.234130859375, 5.40216064453125, 5.5701904296875, 5.73822021484375, 5.90625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 10.0, 21.0, 23.0, 38.0, 45.0, 75.0, 94.0, 197.0, 292.0, 555.0, 1119.0, 2693.0, 8583.0, 37209.0, 193266.0, 512006.0, 231375.0, 45387.0, 9946.0, 2939.0, 1229.0, 571.0, 299.0, 205.0, 113.0, 68.0, 52.0, 40.0, 24.0, 15.0, 6.0, 15.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.28125, -6.10943603515625, -5.9376220703125, -5.76580810546875, -5.593994140625, -5.42218017578125, -5.2503662109375, -5.07855224609375, -4.90673828125, -4.73492431640625, -4.5631103515625, -4.39129638671875, -4.219482421875, -4.04766845703125, -3.8758544921875, -3.70404052734375, -3.5322265625, -3.36041259765625, -3.1885986328125, -3.01678466796875, -2.844970703125, -2.67315673828125, -2.5013427734375, -2.32952880859375, -2.15771484375, -1.98590087890625, -1.8140869140625, -1.64227294921875, -1.470458984375, -1.29864501953125, -1.1268310546875, -0.95501708984375, -0.783203125, -0.61138916015625, -0.4395751953125, -0.26776123046875, -0.095947265625, 0.07586669921875, 0.2476806640625, 0.41949462890625, 0.59130859375, 0.76312255859375, 0.9349365234375, 1.10675048828125, 1.278564453125, 1.45037841796875, 1.6221923828125, 1.79400634765625, 1.9658203125, 2.13763427734375, 2.3094482421875, 2.48126220703125, 2.653076171875, 2.82489013671875, 2.9967041015625, 3.16851806640625, 3.34033203125, 3.51214599609375, 3.6839599609375, 3.85577392578125, 4.027587890625, 4.19940185546875, 4.3712158203125, 4.54302978515625, 4.71484375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 12.0, 13.0, 20.0, 29.0, 52.0, 59.0, 85.0, 104.0, 120.0, 98.0, 110.0, 91.0, 74.0, 41.0, 30.0, 21.0, 15.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.109375, -8.8408203125, -8.572265625, -8.3037109375, -8.03515625, -7.7666015625, -7.498046875, -7.2294921875, -6.9609375, -6.6923828125, -6.423828125, -6.1552734375, -5.88671875, -5.6181640625, -5.349609375, -5.0810546875, -4.8125, -4.5439453125, -4.275390625, -4.0068359375, -3.73828125, -3.4697265625, -3.201171875, -2.9326171875, -2.6640625, -2.3955078125, -2.126953125, -1.8583984375, -1.58984375, -1.3212890625, -1.052734375, -0.7841796875, -0.515625, -0.2470703125, 0.021484375, 0.2900390625, 0.55859375, 0.8271484375, 1.095703125, 1.3642578125, 1.6328125, 1.9013671875, 2.169921875, 2.4384765625, 2.70703125, 2.9755859375, 3.244140625, 3.5126953125, 3.78125, 4.0498046875, 4.318359375, 4.5869140625, 4.85546875, 5.1240234375, 5.392578125, 5.6611328125, 5.9296875, 6.1982421875, 6.466796875, 6.7353515625, 7.00390625, 7.2724609375, 7.541015625, 7.8095703125, 8.078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 13.0, 16.0, 22.0, 44.0, 81.0, 162.0, 284.0, 708.0, 2169.0, 32855.0, 934888.0, 72777.0, 3040.0, 785.0, 313.0, 172.0, 90.0, 52.0, 21.0, 21.0, 14.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5859375, -2.48486328125, -2.3837890625, -2.28271484375, -2.181640625, -2.08056640625, -1.9794921875, -1.87841796875, -1.77734375, -1.67626953125, -1.5751953125, -1.47412109375, -1.373046875, -1.27197265625, -1.1708984375, -1.06982421875, -0.96875, -0.86767578125, -0.7666015625, -0.66552734375, -0.564453125, -0.46337890625, -0.3623046875, -0.26123046875, -0.16015625, -0.05908203125, 0.0419921875, 0.14306640625, 0.244140625, 0.34521484375, 0.4462890625, 0.54736328125, 0.6484375, 0.74951171875, 0.8505859375, 0.95166015625, 1.052734375, 1.15380859375, 1.2548828125, 1.35595703125, 1.45703125, 1.55810546875, 1.6591796875, 1.76025390625, 1.861328125, 1.96240234375, 2.0634765625, 2.16455078125, 2.265625, 2.36669921875, 2.4677734375, 2.56884765625, 2.669921875, 2.77099609375, 2.8720703125, 2.97314453125, 3.07421875, 3.17529296875, 3.2763671875, 3.37744140625, 3.478515625, 3.57958984375, 3.6806640625, 3.78173828125, 3.8828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 8.0, 14.0, 18.0, 10.0, 22.0, 23.0, 29.0, 29.0, 44.0, 60.0, 39.0, 60.0, 70.0, 114.0, 72.0, 74.0, 62.0, 55.0, 28.0, 29.0, 24.0, 27.0, 15.0, 12.0, 14.0, 7.0, 8.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001513957977294922, -0.00014721695333719254, -0.00014303810894489288, -0.00013885926455259323, -0.00013468042016029358, -0.00013050157576799393, -0.00012632273137569427, -0.00012214388698339462, -0.00011796504259109497, -0.00011378619819879532, -0.00010960735380649567, -0.00010542850941419601, -0.00010124966502189636, -9.707082062959671e-05, -9.289197623729706e-05, -8.87131318449974e-05, -8.453428745269775e-05, -8.03554430603981e-05, -7.617659866809845e-05, -7.19977542757988e-05, -6.781890988349915e-05, -6.36400654911995e-05, -5.946122109889984e-05, -5.528237670660019e-05, -5.110353231430054e-05, -4.6924687922000885e-05, -4.274584352970123e-05, -3.856699913740158e-05, -3.438815474510193e-05, -3.0209310352802277e-05, -2.6030465960502625e-05, -2.1851621568202972e-05, -1.767277717590332e-05, -1.3493932783603668e-05, -9.315088391304016e-06, -5.136243999004364e-06, -9.57399606704712e-07, 3.22144478559494e-06, 7.400289177894592e-06, 1.1579133570194244e-05, 1.5757977962493896e-05, 1.993682235479355e-05, 2.41156667470932e-05, 2.8294511139392853e-05, 3.2473355531692505e-05, 3.665219992399216e-05, 4.083104431629181e-05, 4.500988870859146e-05, 4.918873310089111e-05, 5.3367577493190765e-05, 5.754642188549042e-05, 6.172526627779007e-05, 6.590411067008972e-05, 7.008295506238937e-05, 7.426179945468903e-05, 7.844064384698868e-05, 8.261948823928833e-05, 8.679833263158798e-05, 9.097717702388763e-05, 9.515602141618729e-05, 9.933486580848694e-05, 0.00010351371020078659, 0.00010769255459308624, 0.0001118713989853859, 0.00011605024337768555]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 19.0, 24.0, 28.0, 44.0, 81.0, 136.0, 145.0, 270.0, 430.0, 676.0, 1099.0, 2056.0, 4454.0, 11237.0, 37649.0, 157596.0, 493101.0, 251206.0, 59941.0, 16245.0, 5939.0, 2688.0, 1316.0, 755.0, 504.0, 311.0, 196.0, 141.0, 90.0, 50.0, 40.0, 31.0, 16.0, 7.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.089263916015625, -1.05255126953125, -1.015838623046875, -0.9791259765625, -0.942413330078125, -0.90570068359375, -0.868988037109375, -0.832275390625, -0.795562744140625, -0.75885009765625, -0.722137451171875, -0.6854248046875, -0.648712158203125, -0.61199951171875, -0.575286865234375, -0.53857421875, -0.501861572265625, -0.46514892578125, -0.428436279296875, -0.3917236328125, -0.355010986328125, -0.31829833984375, -0.281585693359375, -0.244873046875, -0.208160400390625, -0.17144775390625, -0.134735107421875, -0.0980224609375, -0.061309814453125, -0.02459716796875, 0.012115478515625, 0.048828125, 0.085540771484375, 0.12225341796875, 0.158966064453125, 0.1956787109375, 0.232391357421875, 0.26910400390625, 0.305816650390625, 0.342529296875, 0.379241943359375, 0.41595458984375, 0.452667236328125, 0.4893798828125, 0.526092529296875, 0.56280517578125, 0.599517822265625, 0.63623046875, 0.672943115234375, 0.70965576171875, 0.746368408203125, 0.7830810546875, 0.819793701171875, 0.85650634765625, 0.893218994140625, 0.929931640625, 0.966644287109375, 1.00335693359375, 1.040069580078125, 1.0767822265625, 1.113494873046875, 1.15020751953125, 1.186920166015625, 1.2236328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 11.0, 6.0, 4.0, 16.0, 19.0, 20.0, 40.0, 73.0, 124.0, 188.0, 196.0, 120.0, 65.0, 41.0, 25.0, 18.0, 10.0, 5.0, 4.0, 5.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.955078125, -0.9169769287109375, -0.878875732421875, -0.8407745361328125, -0.80267333984375, -0.7645721435546875, -0.726470947265625, -0.6883697509765625, -0.6502685546875, -0.6121673583984375, -0.574066162109375, -0.5359649658203125, -0.49786376953125, -0.4597625732421875, -0.421661376953125, -0.3835601806640625, -0.345458984375, -0.3073577880859375, -0.269256591796875, -0.2311553955078125, -0.19305419921875, -0.1549530029296875, -0.116851806640625, -0.0787506103515625, -0.0406494140625, -0.0025482177734375, 0.035552978515625, 0.0736541748046875, 0.11175537109375, 0.1498565673828125, 0.187957763671875, 0.2260589599609375, 0.26416015625, 0.3022613525390625, 0.340362548828125, 0.3784637451171875, 0.41656494140625, 0.4546661376953125, 0.492767333984375, 0.5308685302734375, 0.5689697265625, 0.6070709228515625, 0.645172119140625, 0.6832733154296875, 0.72137451171875, 0.7594757080078125, 0.797576904296875, 0.8356781005859375, 0.873779296875, 0.9118804931640625, 0.949981689453125, 0.9880828857421875, 1.02618408203125, 1.0642852783203125, 1.102386474609375, 1.1404876708984375, 1.1785888671875, 1.2166900634765625, 1.254791259765625, 1.2928924560546875, 1.33099365234375, 1.3690948486328125, 1.407196044921875, 1.4452972412109375, 1.4833984375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 3.0, 14.0, 18.0, 74.0, 122.0, 177.0, 231.0, 186.0, 97.0, 43.0, 17.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.168214797973633, -16.752307891845703, -16.336402893066406, -15.920495986938477, -15.504590034484863, -15.088683128356934, -14.67277717590332, -14.25687026977539, -13.840964317321777, -13.425058364868164, -13.009151458740234, -12.593245506286621, -12.177339553833008, -11.761432647705078, -11.345526695251465, -10.929620742797852, -10.513713836669922, -10.097807884216309, -9.681900978088379, -9.265995025634766, -8.850089073181152, -8.434182167053223, -8.01827621459961, -7.602369785308838, -7.186464309692383, -6.770557880401611, -6.354651927947998, -5.938745498657227, -5.522839069366455, -5.106932640075684, -4.69102668762207, -4.275120258331299, -3.8592138290405273, -3.443307638168335, -3.0274012088775635, -2.611495018005371, -2.1955885887145996, -1.7796823978424072, -1.3637762069702148, -0.9478697776794434, -0.531963586807251, -0.11605730652809143, 0.2998489737510681, 0.7157552242279053, 1.1316615343093872, 1.5475678443908691, 1.9634740352630615, 2.379380464553833, 2.7952866554260254, 3.2111928462982178, 3.6270992755889893, 4.043005466461182, 4.458911895751953, 4.874817848205566, 5.290724277496338, 5.706630706787109, 6.122536659240723, 6.538443088531494, 6.954349040985107, 7.370255470275879, 7.78616189956665, 8.202068328857422, 8.617974281311035, 9.033880233764648, 9.449787139892578]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 10.0, 7.0, 7.0, 10.0, 10.0, 12.0, 12.0, 18.0, 20.0, 15.0, 30.0, 36.0, 31.0, 34.0, 32.0, 38.0, 38.0, 45.0, 38.0, 41.0, 44.0, 41.0, 33.0, 43.0, 34.0, 35.0, 24.0, 38.0, 21.0, 27.0, 20.0, 26.0, 23.0, 17.0, 13.0, 11.0, 13.0, 11.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 2.0, 6.0, 2.0, 0.0, 2.0, 2.0], "bins": [-6.223525524139404, -6.045218467712402, -5.8669114112854, -5.688604354858398, -5.5102972984313965, -5.3319902420043945, -5.153682708740234, -4.975376129150391, -4.7970685958862305, -4.6187615394592285, -4.440454483032227, -4.262147426605225, -4.083840370178223, -3.9055333137512207, -3.7272260189056396, -3.5489189624786377, -3.370612144470215, -3.192305088043213, -3.013998031616211, -2.835690975189209, -2.657383918762207, -2.479076862335205, -2.300769567489624, -2.122462511062622, -1.9441554546356201, -1.7658483982086182, -1.5875413417816162, -1.4092341661453247, -1.2309271097183228, -1.0526200532913208, -0.8743128776550293, -0.6960058212280273, -0.5176982879638672, -0.33939120173454285, -0.1610841155052185, 0.017223000526428223, 0.19553005695343018, 0.37383711338043213, 0.5521442890167236, 0.7304513454437256, 0.9087584018707275, 1.0870654582977295, 1.2653725147247314, 1.443679690361023, 1.621986746788025, 1.8002938032150269, 1.9786009788513184, 2.1569080352783203, 2.3352150917053223, 2.513522148132324, 2.691829204559326, 2.870136260986328, 3.04844331741333, 3.226750373840332, 3.405057668685913, 3.583364725112915, 3.761671781539917, 3.939978837966919, 4.1182861328125, 4.296593189239502, 4.474900245666504, 4.653207302093506, 4.831514358520508, 5.00982141494751, 5.188128471374512]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 4.0, 7.0, 16.0, 18.0, 15.0, 26.0, 43.0, 47.0, 71.0, 106.0, 157.0, 230.0, 356.0, 499.0, 822.0, 1184.0, 1725.0, 2540.0, 3609.0, 5155.0, 8369.0, 999338.0, 9075.0, 5477.0, 3689.0, 2537.0, 1767.0, 1146.0, 824.0, 534.0, 385.0, 260.0, 171.0, 125.0, 84.0, 48.0, 33.0, 30.0, 19.0, 16.0, 12.0, 13.0, 4.0, 6.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.849271774291992, -3.723269462585449, -3.5972671508789062, -3.471264600753784, -3.345262289047241, -3.2192599773406982, -3.093257427215576, -2.967255115509033, -2.8412528038024902, -2.7152504920959473, -2.5892481803894043, -2.4632456302642822, -2.3372433185577393, -2.2112410068511963, -2.085238456726074, -1.9592361450195312, -1.8332338333129883, -1.7072315216064453, -1.5812290906906128, -1.4552266597747803, -1.3292243480682373, -1.2032220363616943, -1.0772196054458618, -0.9512172341346741, -0.8252148628234863, -0.6992124915122986, -0.5732101202011108, -0.4472077488899231, -0.32120537757873535, -0.1952030062675476, -0.06920063495635986, 0.05680173635482788, 0.18280410766601562, 0.30880647897720337, 0.4348088502883911, 0.5608112215995789, 0.6868135929107666, 0.8128159642219543, 0.9388183355331421, 1.0648207664489746, 1.1908230781555176, 1.3168253898620605, 1.442827820777893, 1.5688302516937256, 1.6948325634002686, 1.8208348751068115, 1.946837306022644, 2.0728397369384766, 2.1988420486450195, 2.3248443603515625, 2.4508466720581055, 2.5768492221832275, 2.7028515338897705, 2.8288538455963135, 2.9548563957214355, 3.0808587074279785, 3.2068610191345215, 3.3328633308410645, 3.4588656425476074, 3.5848681926727295, 3.7108705043792725, 3.8368728160858154, 3.9628753662109375, 4.0888776779174805, 4.214879989624023]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 12.0, 18.0, 29.0, 45.0, 69.0, 86.0, 113.0, 140.0, 51441952.0, 27502.0, 136.0, 83.0, 47.0, 23.0, 19.0, 12.0, 9.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-236.25, -228.609375, -220.96875, -213.328125, -205.6875, -198.046875, -190.40625, -182.765625, -175.125, -167.484375, -159.84375, -152.203125, -144.5625, -136.921875, -129.28125, -121.640625, -114.0, -106.359375, -98.71875, -91.078125, -83.4375, -75.796875, -68.15625, -60.515625, -52.875, -45.234375, -37.59375, -29.953125, -22.3125, -14.671875, -7.03125, 0.609375, 8.25, 15.890625, 23.53125, 31.171875, 38.8125, 46.453125, 54.09375, 61.734375, 69.375, 77.015625, 84.65625, 92.296875, 99.9375, 107.578125, 115.21875, 122.859375, 130.5, 138.140625, 145.78125, 153.421875, 161.0625, 168.703125, 176.34375, 183.984375, 191.625, 199.265625, 206.90625, 214.546875, 222.1875, 229.828125, 237.46875, 245.109375, 252.75]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 10.0, 15.0, 14.0, 20.0, 41.0, 51.0, 126.0, 147.0, 196.0, 283.0, 430.0, 657.0, 907.0, 1324.0, 2199.0, 3294.0, 5125.0, 7992.0, 12503.0, 19580.0, 31946.0, 51797.0, 86543.0, 151190.0, 303130.0, 964694.0, 3884105.0, 350759.0, 167749.0, 94405.0, 56501.0, 34745.0, 21519.0, 13568.0, 8305.0, 5375.0, 3412.0, 2263.0, 1514.0, 1005.0, 652.0, 461.0, 276.0, 196.0, 124.0, 79.0, 63.0, 52.0, 21.0, 34.0, 13.0, 12.0, 5.0, 11.0, 0.0, 2.0], "bins": [-4.1875, -4.06463623046875, -3.9417724609375, -3.81890869140625, -3.696044921875, -3.57318115234375, -3.4503173828125, -3.32745361328125, -3.20458984375, -3.08172607421875, -2.9588623046875, -2.83599853515625, -2.713134765625, -2.59027099609375, -2.4674072265625, -2.34454345703125, -2.2216796875, -2.09881591796875, -1.9759521484375, -1.85308837890625, -1.730224609375, -1.60736083984375, -1.4844970703125, -1.36163330078125, -1.23876953125, -1.11590576171875, -0.9930419921875, -0.87017822265625, -0.747314453125, -0.62445068359375, -0.5015869140625, -0.37872314453125, -0.255859375, -0.13299560546875, -0.0101318359375, 0.11273193359375, 0.235595703125, 0.35845947265625, 0.4813232421875, 0.60418701171875, 0.72705078125, 0.84991455078125, 0.9727783203125, 1.09564208984375, 1.218505859375, 1.34136962890625, 1.4642333984375, 1.58709716796875, 1.7099609375, 1.83282470703125, 1.9556884765625, 2.07855224609375, 2.201416015625, 2.32427978515625, 2.4471435546875, 2.57000732421875, 2.69287109375, 2.81573486328125, 2.9385986328125, 3.06146240234375, 3.184326171875, 3.30718994140625, 3.4300537109375, 3.55291748046875, 3.67578125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 8.0, 8.0, 8.0, 9.0, 14.0, 20.0, 24.0, 27.0, 27.0, 19.0, 31.0, 38.0, 31.0, 31.0, 42.0, 37.0, 44.0, 75.0, 1041.0, 56.0, 44.0, 47.0, 40.0, 33.0, 35.0, 29.0, 27.0, 31.0, 20.0, 24.0, 22.0, 15.0, 11.0, 10.0, 10.0, 11.0, 11.0, 1.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34375, -22.51904296875, -21.6943359375, -20.86962890625, -20.044921875, -19.22021484375, -18.3955078125, -17.57080078125, -16.74609375, -15.92138671875, -15.0966796875, -14.27197265625, -13.447265625, -12.62255859375, -11.7978515625, -10.97314453125, -10.1484375, -9.32373046875, -8.4990234375, -7.67431640625, -6.849609375, -6.02490234375, -5.2001953125, -4.37548828125, -3.55078125, -2.72607421875, -1.9013671875, -1.07666015625, -0.251953125, 0.57275390625, 1.3974609375, 2.22216796875, 3.046875, 3.87158203125, 4.6962890625, 5.52099609375, 6.345703125, 7.17041015625, 7.9951171875, 8.81982421875, 9.64453125, 10.46923828125, 11.2939453125, 12.11865234375, 12.943359375, 13.76806640625, 14.5927734375, 15.41748046875, 16.2421875, 17.06689453125, 17.8916015625, 18.71630859375, 19.541015625, 20.36572265625, 21.1904296875, 22.01513671875, 22.83984375, 23.66455078125, 24.4892578125, 25.31396484375, 26.138671875, 26.96337890625, 27.7880859375, 28.61279296875, 29.4375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 3.0, 2.0, 3.0, 8.0, 11.0, 20.0, 60.0, 78.0, 101.0, 133.0, 239.0, 295.0, 456.0, 532.0, 803.0, 1177.0, 1518.0, 2082.0, 3013.0, 3893.0, 5376.0, 7462.0, 10434.0, 14815.0, 21057.0, 29946.0, 44160.0, 66781.0, 103163.0, 163525.0, 288097.0, 861606.0, 3706650.0, 380830.0, 199616.0, 122307.0, 78607.0, 52060.0, 35195.0, 24523.0, 17289.0, 11919.0, 8589.0, 6295.0, 4616.0, 3324.0, 2439.0, 1746.0, 1270.0, 952.0, 746.0, 536.0, 344.0, 246.0, 145.0, 124.0, 75.0, 45.0, 37.0, 33.0, 29.0, 11.0, 3.0], "bins": [-4.75, -4.60687255859375, -4.4637451171875, -4.32061767578125, -4.177490234375, -4.03436279296875, -3.8912353515625, -3.74810791015625, -3.60498046875, -3.46185302734375, -3.3187255859375, -3.17559814453125, -3.032470703125, -2.88934326171875, -2.7462158203125, -2.60308837890625, -2.4599609375, -2.31683349609375, -2.1737060546875, -2.03057861328125, -1.887451171875, -1.74432373046875, -1.6011962890625, -1.45806884765625, -1.31494140625, -1.17181396484375, -1.0286865234375, -0.88555908203125, -0.742431640625, -0.59930419921875, -0.4561767578125, -0.31304931640625, -0.169921875, -0.02679443359375, 0.1163330078125, 0.25946044921875, 0.402587890625, 0.54571533203125, 0.6888427734375, 0.83197021484375, 0.97509765625, 1.11822509765625, 1.2613525390625, 1.40447998046875, 1.547607421875, 1.69073486328125, 1.8338623046875, 1.97698974609375, 2.1201171875, 2.26324462890625, 2.4063720703125, 2.54949951171875, 2.692626953125, 2.83575439453125, 2.9788818359375, 3.12200927734375, 3.26513671875, 3.40826416015625, 3.5513916015625, 3.69451904296875, 3.837646484375, 3.98077392578125, 4.1239013671875, 4.26702880859375, 4.41015625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 10.0, 3.0, 3.0, 6.0, 8.0, 13.0, 23.0, 17.0, 22.0, 21.0, 25.0, 30.0, 22.0, 33.0, 37.0, 25.0, 40.0, 39.0, 54.0, 573.0, 475.0, 70.0, 38.0, 40.0, 24.0, 37.0, 37.0, 35.0, 20.0, 22.0, 30.0, 26.0, 30.0, 10.0, 14.0, 17.0, 15.0, 8.0, 5.0, 10.0, 8.0, 9.0, 6.0, 8.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.5234375, -13.0721435546875, -12.620849609375, -12.1695556640625, -11.71826171875, -11.2669677734375, -10.815673828125, -10.3643798828125, -9.9130859375, -9.4617919921875, -9.010498046875, -8.5592041015625, -8.10791015625, -7.6566162109375, -7.205322265625, -6.7540283203125, -6.302734375, -5.8514404296875, -5.400146484375, -4.9488525390625, -4.49755859375, -4.0462646484375, -3.594970703125, -3.1436767578125, -2.6923828125, -2.2410888671875, -1.789794921875, -1.3385009765625, -0.88720703125, -0.4359130859375, 0.015380859375, 0.4666748046875, 0.91796875, 1.3692626953125, 1.820556640625, 2.2718505859375, 2.72314453125, 3.1744384765625, 3.625732421875, 4.0770263671875, 4.5283203125, 4.9796142578125, 5.430908203125, 5.8822021484375, 6.33349609375, 6.7847900390625, 7.236083984375, 7.6873779296875, 8.138671875, 8.5899658203125, 9.041259765625, 9.4925537109375, 9.94384765625, 10.3951416015625, 10.846435546875, 11.2977294921875, 11.7490234375, 12.2003173828125, 12.651611328125, 13.1029052734375, 13.55419921875, 14.0054931640625, 14.456787109375, 14.9080810546875, 15.359375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 8.0, 5.0, 8.0, 10.0, 21.0, 9.0, 13.0, 22.0, 37.0, 58.0, 53.0, 56.0, 85.0, 86.0, 134.0, 187.0, 243.0, 314.0, 452.0, 549.0, 925.0, 1230.0, 2029.0, 3146.0, 5644.0, 11103.0, 26132.0, 90925.0, 5932417.0, 149140.0, 35077.0, 13627.0, 6796.0, 3578.0, 2246.0, 1461.0, 954.0, 645.0, 514.0, 374.0, 264.0, 217.0, 121.0, 124.0, 97.0, 77.0, 63.0, 34.0, 24.0, 16.0, 23.0, 25.0, 15.0, 8.0, 7.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0], "bins": [-21.734375, -21.04736328125, -20.3603515625, -19.67333984375, -18.986328125, -18.29931640625, -17.6123046875, -16.92529296875, -16.23828125, -15.55126953125, -14.8642578125, -14.17724609375, -13.490234375, -12.80322265625, -12.1162109375, -11.42919921875, -10.7421875, -10.05517578125, -9.3681640625, -8.68115234375, -7.994140625, -7.30712890625, -6.6201171875, -5.93310546875, -5.24609375, -4.55908203125, -3.8720703125, -3.18505859375, -2.498046875, -1.81103515625, -1.1240234375, -0.43701171875, 0.25, 0.93701171875, 1.6240234375, 2.31103515625, 2.998046875, 3.68505859375, 4.3720703125, 5.05908203125, 5.74609375, 6.43310546875, 7.1201171875, 7.80712890625, 8.494140625, 9.18115234375, 9.8681640625, 10.55517578125, 11.2421875, 11.92919921875, 12.6162109375, 13.30322265625, 13.990234375, 14.67724609375, 15.3642578125, 16.05126953125, 16.73828125, 17.42529296875, 18.1123046875, 18.79931640625, 19.486328125, 20.17333984375, 20.8603515625, 21.54736328125, 22.234375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 6.0, 8.0, 13.0, 14.0, 9.0, 15.0, 17.0, 25.0, 24.0, 31.0, 32.0, 41.0, 41.0, 38.0, 43.0, 63.0, 101.0, 430.0, 512.0, 100.0, 74.0, 49.0, 41.0, 53.0, 36.0, 25.0, 35.0, 18.0, 22.0, 15.0, 17.0, 9.0, 14.0, 8.0, 10.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.484375, -11.10205078125, -10.7197265625, -10.33740234375, -9.955078125, -9.57275390625, -9.1904296875, -8.80810546875, -8.42578125, -8.04345703125, -7.6611328125, -7.27880859375, -6.896484375, -6.51416015625, -6.1318359375, -5.74951171875, -5.3671875, -4.98486328125, -4.6025390625, -4.22021484375, -3.837890625, -3.45556640625, -3.0732421875, -2.69091796875, -2.30859375, -1.92626953125, -1.5439453125, -1.16162109375, -0.779296875, -0.39697265625, -0.0146484375, 0.36767578125, 0.75, 1.13232421875, 1.5146484375, 1.89697265625, 2.279296875, 2.66162109375, 3.0439453125, 3.42626953125, 3.80859375, 4.19091796875, 4.5732421875, 4.95556640625, 5.337890625, 5.72021484375, 6.1025390625, 6.48486328125, 6.8671875, 7.24951171875, 7.6318359375, 8.01416015625, 8.396484375, 8.77880859375, 9.1611328125, 9.54345703125, 9.92578125, 10.30810546875, 10.6904296875, 11.07275390625, 11.455078125, 11.83740234375, 12.2197265625, 12.60205078125, 12.984375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 12.0, 14.0, 28.0, 31.0, 68.0, 111.0, 236.0, 211.0, 104.0, 57.0, 42.0, 19.0, 23.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.58287811279297, -27.763355255126953, -26.94383430480957, -26.124311447143555, -25.304790496826172, -24.485267639160156, -23.66574478149414, -22.846221923828125, -22.026700973510742, -21.207178115844727, -20.387657165527344, -19.568134307861328, -18.748611450195312, -17.92909049987793, -17.109567642211914, -16.29004669189453, -15.470523834228516, -14.651001930236816, -13.831480026245117, -13.011957168579102, -12.192435264587402, -11.372913360595703, -10.553390502929688, -9.733868598937988, -8.914346694946289, -8.09482479095459, -7.275302410125732, -6.455780029296875, -5.636258125305176, -4.816736221313477, -3.997213840484619, -3.1776914596557617, -2.3581714630126953, -1.538649320602417, -0.7191271781921387, 0.10039496421813965, 0.919917106628418, 1.7394390106201172, 2.5589613914489746, 3.378483772277832, 4.198005676269531, 5.0175275802612305, 5.837049961090088, 6.656572341918945, 7.4760942459106445, 8.295616149902344, 9.11513900756836, 9.934660911560059, 10.754182815551758, 11.573704719543457, 12.393226623535156, 13.212749481201172, 14.032271385192871, 14.85179328918457, 15.671316146850586, 16.49083709716797, 17.310359954833984, 18.1298828125, 18.949403762817383, 19.7689266204834, 20.58844757080078, 21.407970428466797, 22.227493286132812, 23.047016143798828, 23.86653709411621]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 7.0, 4.0, 7.0, 14.0, 7.0, 13.0, 23.0, 17.0, 27.0, 35.0, 26.0, 31.0, 29.0, 29.0, 23.0, 35.0, 48.0, 47.0, 33.0, 49.0, 31.0, 40.0, 38.0, 35.0, 39.0, 29.0, 37.0, 27.0, 25.0, 22.0, 24.0, 24.0, 20.0, 16.0, 11.0, 13.0, 10.0, 17.0, 6.0, 2.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-14.916242599487305, -14.425434112548828, -13.934626579284668, -13.443818092346191, -12.953009605407715, -12.462202072143555, -11.971393585205078, -11.480585098266602, -10.989777565002441, -10.498969078063965, -10.008161544799805, -9.517353057861328, -9.026544570922852, -8.535737037658691, -8.044928550720215, -7.5541205406188965, -7.06331205368042, -6.572504043579102, -6.081695556640625, -5.590887546539307, -5.100079536437988, -4.609271049499512, -4.118463039398193, -3.627655029296875, -3.1368467807769775, -2.64603853225708, -2.1552305221557617, -1.6644222736358643, -1.1736141443252563, -0.6828060150146484, -0.19199776649475098, 0.2988102436065674, 0.7896184921264648, 1.2804266214370728, 1.7712347507476807, 2.262042999267578, 2.7528510093688965, 3.243659257888794, 3.7344675064086914, 4.22527551651001, 4.716083526611328, 5.2068915367126465, 5.697700023651123, 6.188508033752441, 6.67931604385376, 7.170124053955078, 7.660932540893555, 8.151741027832031, 8.642549514770508, 9.133358001708984, 9.624165534973145, 10.114974021911621, 10.605782508850098, 11.096590042114258, 11.587398529052734, 12.078207015991211, 12.569014549255371, 13.059823036193848, 13.550630569458008, 14.041439056396484, 14.532247543334961, 15.023055076599121, 15.513863563537598, 16.004671096801758, 16.495479583740234]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 6.0, 12.0, 18.0, 18.0, 18.0, 49.0, 62.0, 89.0, 131.0, 214.0, 390.0, 661.0, 1272.0, 2878.0, 7560.0, 27698.0, 252570.0, 3851638.0, 33363.0, 8457.0, 3403.0, 1570.0, 807.0, 465.0, 284.0, 182.0, 124.0, 92.0, 63.0, 47.0, 35.0, 23.0, 17.0, 14.0, 10.0, 8.0, 4.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1685791015625, -0.16258811950683594, -0.15659713745117188, -0.1506061553955078, -0.14461517333984375, -0.1386241912841797, -0.13263320922851562, -0.12664222717285156, -0.1206512451171875, -0.11466026306152344, -0.10866928100585938, -0.10267829895019531, -0.09668731689453125, -0.09069633483886719, -0.08470535278320312, -0.07871437072753906, -0.072723388671875, -0.06673240661621094, -0.060741424560546875, -0.05475044250488281, -0.04875946044921875, -0.04276847839355469, -0.036777496337890625, -0.030786514282226562, -0.0247955322265625, -0.018804550170898438, -0.012813568115234375, -0.0068225860595703125, -0.00083160400390625, 0.0051593780517578125, 0.011150360107421875, 0.017141342163085938, 0.02313232421875, 0.029123306274414062, 0.035114288330078125, 0.04110527038574219, 0.04709625244140625, 0.05308723449707031, 0.059078216552734375, 0.06506919860839844, 0.0710601806640625, 0.07705116271972656, 0.08304214477539062, 0.08903312683105469, 0.09502410888671875, 0.10101509094238281, 0.10700607299804688, 0.11299705505371094, 0.118988037109375, 0.12497901916503906, 0.13097000122070312, 0.1369609832763672, 0.14295196533203125, 0.1489429473876953, 0.15493392944335938, 0.16092491149902344, 0.1669158935546875, 0.17290687561035156, 0.17889785766601562, 0.1848888397216797, 0.19087982177734375, 0.1968708038330078, 0.20286178588867188, 0.20885276794433594, 0.21484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 2.0, 2.0, 5.0, 6.0, 10.0, 9.0, 7.0, 15.0, 15.0, 14.0, 22.0, 168.0, 635.0, 14.0, 14.0, 13.0, 4.0, 5.0, 5.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.028411865234375, -0.027395248413085938, -0.026378631591796875, -0.025362014770507812, -0.02434539794921875, -0.023328781127929688, -0.022312164306640625, -0.021295547485351562, -0.0202789306640625, -0.019262313842773438, -0.018245697021484375, -0.017229080200195312, -0.01621246337890625, -0.015195846557617188, -0.014179229736328125, -0.013162612915039062, -0.01214599609375, -0.011129379272460938, -0.010112762451171875, -0.009096145629882812, -0.00807952880859375, -0.0070629119873046875, -0.006046295166015625, -0.0050296783447265625, -0.0040130615234375, -0.0029964447021484375, -0.001979827880859375, -0.0009632110595703125, 5.340576171875e-05, 0.0010700225830078125, 0.002086639404296875, 0.0031032562255859375, 0.004119873046875, 0.0051364898681640625, 0.006153106689453125, 0.0071697235107421875, 0.00818634033203125, 0.009202957153320312, 0.010219573974609375, 0.011236190795898438, 0.0122528076171875, 0.013269424438476562, 0.014286041259765625, 0.015302658081054688, 0.01631927490234375, 0.017335891723632812, 0.018352508544921875, 0.019369125366210938, 0.0203857421875, 0.021402359008789062, 0.022418975830078125, 0.023435592651367188, 0.02445220947265625, 0.025468826293945312, 0.026485443115234375, 0.027502059936523438, 0.0285186767578125, 0.029535293579101562, 0.030551910400390625, 0.03156852722167969, 0.03258514404296875, 0.03360176086425781, 0.034618377685546875, 0.03563499450683594, 0.036651611328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 10.0, 11.0, 11.0, 18.0, 19.0, 33.0, 40.0, 70.0, 96.0, 145.0, 267.0, 463.0, 904.0, 1678.0, 3659.0, 9210.0, 28289.0, 129571.0, 1991598.0, 1850386.0, 128888.0, 29697.0, 10271.0, 4305.0, 2065.0, 1033.0, 568.0, 348.0, 201.0, 122.0, 81.0, 53.0, 34.0, 37.0, 19.0, 20.0, 16.0, 11.0, 6.0, 5.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1207275390625, -0.11695384979248047, -0.11318016052246094, -0.1094064712524414, -0.10563278198242188, -0.10185909271240234, -0.09808540344238281, -0.09431171417236328, -0.09053802490234375, -0.08676433563232422, -0.08299064636230469, -0.07921695709228516, -0.07544326782226562, -0.0716695785522461, -0.06789588928222656, -0.06412220001220703, -0.0603485107421875, -0.05657482147216797, -0.05280113220214844, -0.049027442932128906, -0.045253753662109375, -0.041480064392089844, -0.03770637512207031, -0.03393268585205078, -0.03015899658203125, -0.02638530731201172, -0.022611618041992188, -0.018837928771972656, -0.015064239501953125, -0.011290550231933594, -0.0075168609619140625, -0.0037431716918945312, 3.0517578125e-05, 0.0038042068481445312, 0.0075778961181640625, 0.011351585388183594, 0.015125274658203125, 0.018898963928222656, 0.022672653198242188, 0.02644634246826172, 0.03022003173828125, 0.03399372100830078, 0.03776741027832031, 0.041541099548339844, 0.045314788818359375, 0.049088478088378906, 0.05286216735839844, 0.05663585662841797, 0.0604095458984375, 0.06418323516845703, 0.06795692443847656, 0.0717306137084961, 0.07550430297851562, 0.07927799224853516, 0.08305168151855469, 0.08682537078857422, 0.09059906005859375, 0.09437274932861328, 0.09814643859863281, 0.10192012786865234, 0.10569381713867188, 0.1094675064086914, 0.11324119567871094, 0.11701488494873047, 0.12078857421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 0.0, 2.0, 8.0, 7.0, 14.0, 16.0, 22.0, 20.0, 33.0, 40.0, 70.0, 116.0, 125.0, 219.0, 343.0, 704.0, 929.0, 463.0, 293.0, 175.0, 122.0, 73.0, 75.0, 46.0, 29.0, 22.0, 25.0, 23.0, 8.0, 8.0, 7.0, 5.0, 4.0, 6.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037109375, -0.0357975959777832, -0.034485816955566406, -0.03317403793334961, -0.03186225891113281, -0.030550479888916016, -0.02923870086669922, -0.027926921844482422, -0.026615142822265625, -0.025303363800048828, -0.02399158477783203, -0.022679805755615234, -0.021368026733398438, -0.02005624771118164, -0.018744468688964844, -0.017432689666748047, -0.01612091064453125, -0.014809131622314453, -0.013497352600097656, -0.01218557357788086, -0.010873794555664062, -0.009562015533447266, -0.008250236511230469, -0.006938457489013672, -0.005626678466796875, -0.004314899444580078, -0.0030031204223632812, -0.0016913414001464844, -0.0003795623779296875, 0.0009322166442871094, 0.0022439956665039062, 0.003555774688720703, 0.0048675537109375, 0.006179332733154297, 0.007491111755371094, 0.00880289077758789, 0.010114669799804688, 0.011426448822021484, 0.012738227844238281, 0.014050006866455078, 0.015361785888671875, 0.016673564910888672, 0.01798534393310547, 0.019297122955322266, 0.020608901977539062, 0.02192068099975586, 0.023232460021972656, 0.024544239044189453, 0.02585601806640625, 0.027167797088623047, 0.028479576110839844, 0.02979135513305664, 0.031103134155273438, 0.032414913177490234, 0.03372669219970703, 0.03503847122192383, 0.036350250244140625, 0.03766202926635742, 0.03897380828857422, 0.040285587310791016, 0.04159736633300781, 0.04290914535522461, 0.044220924377441406, 0.0455327033996582, 0.046844482421875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 30.0, 230.0, 490.0, 160.0, 49.0, 25.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3138902187347412, -0.2860272526741028, -0.25816428661346436, -0.23030132055282593, -0.2024383544921875, -0.17457537353038788, -0.14671240746974945, -0.11884944140911102, -0.0909864753484726, -0.06312350928783417, -0.03526053950190544, -0.007397569715976715, 0.020465396344661713, 0.04832836985588074, 0.07619133591651917, 0.10405430197715759, 0.13191726803779602, 0.15978023409843445, 0.18764320015907288, 0.2155061662197113, 0.24336913228034973, 0.27123212814331055, 0.299095094203949, 0.3269580602645874, 0.35482102632522583, 0.38268399238586426, 0.4105469584465027, 0.4384099245071411, 0.46627289056777954, 0.49413585662841797, 0.5219988226890564, 0.5498617887496948, 0.5777247548103333, 0.6055877208709717, 0.6334506869316101, 0.6613136529922485, 0.689176619052887, 0.7170395851135254, 0.7449025511741638, 0.7727655172348022, 0.8006284832954407, 0.8284914493560791, 0.8563544154167175, 0.884217381477356, 0.9120803475379944, 0.9399433135986328, 0.9678062796592712, 0.9956692457199097, 1.0235322713851929, 1.051395297050476, 1.0792582035064697, 1.107121229171753, 1.1349841356277466, 1.1628471612930298, 1.1907100677490234, 1.2185730934143066, 1.2464359998703003, 1.2742990255355835, 1.3021619319915771, 1.3300249576568604, 1.357887864112854, 1.3857508897781372, 1.4136137962341309, 1.441476821899414, 1.4693397283554077]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 11.0, 19.0, 18.0, 27.0, 33.0, 36.0, 45.0, 48.0, 54.0, 62.0, 82.0, 73.0, 68.0, 60.0, 44.0, 61.0, 58.0, 41.0, 40.0, 26.0, 20.0, 16.0, 11.0, 13.0, 10.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21157985925674438, -0.20223669707775116, -0.19289351999759674, -0.18355035781860352, -0.1742071807384491, -0.16486401855945587, -0.15552085638046265, -0.14617767930030823, -0.1368345022201538, -0.12749134004116058, -0.11814816296100616, -0.10880500078201294, -0.09946182370185852, -0.0901186615228653, -0.08077549189329147, -0.07143232226371765, -0.062089160084724426, -0.052745990455150604, -0.04340282082557678, -0.03405965492129326, -0.024716485291719437, -0.015373315662145615, -0.006030149757862091, 0.003313019871711731, 0.012656189501285553, 0.021999359130859375, 0.0313425287604332, 0.04068569466471672, 0.05002886429429054, 0.059372033923864365, 0.06871519982814789, 0.07805836945772171, 0.08740153908729553, 0.09674470871686935, 0.10608787834644318, 0.1154310405254364, 0.12477421760559082, 0.13411737978458405, 0.14346054196357727, 0.1528037190437317, 0.1621468961238861, 0.17149005830287933, 0.18083323538303375, 0.19017639756202698, 0.1995195746421814, 0.20886273682117462, 0.21820589900016785, 0.22754907608032227, 0.2368922382593155, 0.24623540043830872, 0.25557857751846313, 0.26492175459861755, 0.2742649018764496, 0.283608078956604, 0.2929512560367584, 0.30229443311691284, 0.3116375803947449, 0.3209807574748993, 0.3303239047527313, 0.33966708183288574, 0.34901025891304016, 0.3583534359931946, 0.3676965832710266, 0.37703976035118103, 0.38638293743133545]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 9.0, 14.0, 6.0, 11.0, 30.0, 34.0, 49.0, 55.0, 82.0, 124.0, 169.0, 243.0, 324.0, 502.0, 781.0, 1316.0, 2054.0, 3669.0, 6930.0, 14176.0, 49149.0, 894346.0, 45156.0, 13615.0, 6365.0, 3448.0, 2107.0, 1266.0, 817.0, 550.0, 336.0, 257.0, 160.0, 114.0, 77.0, 49.0, 40.0, 36.0, 25.0, 18.0, 14.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.17138671875, -0.16576385498046875, -0.1601409912109375, -0.15451812744140625, -0.148895263671875, -0.14327239990234375, -0.1376495361328125, -0.13202667236328125, -0.12640380859375, -0.12078094482421875, -0.1151580810546875, -0.10953521728515625, -0.103912353515625, -0.09828948974609375, -0.0926666259765625, -0.08704376220703125, -0.0814208984375, -0.07579803466796875, -0.0701751708984375, -0.06455230712890625, -0.058929443359375, -0.05330657958984375, -0.0476837158203125, -0.04206085205078125, -0.03643798828125, -0.03081512451171875, -0.0251922607421875, -0.01956939697265625, -0.013946533203125, -0.00832366943359375, -0.0027008056640625, 0.00292205810546875, 0.008544921875, 0.01416778564453125, 0.0197906494140625, 0.02541351318359375, 0.031036376953125, 0.03665924072265625, 0.0422821044921875, 0.04790496826171875, 0.05352783203125, 0.05915069580078125, 0.0647735595703125, 0.07039642333984375, 0.076019287109375, 0.08164215087890625, 0.0872650146484375, 0.09288787841796875, 0.0985107421875, 0.10413360595703125, 0.1097564697265625, 0.11537933349609375, 0.121002197265625, 0.12662506103515625, 0.1322479248046875, 0.13787078857421875, 0.14349365234375, 0.14911651611328125, 0.1547393798828125, 0.16036224365234375, 0.165985107421875, 0.17160797119140625, 0.1772308349609375, 0.18285369873046875, 0.1884765625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 1.0, 5.0, 7.0, 5.0, 5.0, 12.0, 11.0, 15.0, 12.0, 24.0, 117.0, 395.0, 269.0, 47.0, 11.0, 11.0, 5.0, 5.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025848388671875, -0.02487659454345703, -0.023904800415039062, -0.022933006286621094, -0.021961212158203125, -0.020989418029785156, -0.020017623901367188, -0.01904582977294922, -0.01807403564453125, -0.01710224151611328, -0.016130447387695312, -0.015158653259277344, -0.014186859130859375, -0.013215065002441406, -0.012243270874023438, -0.011271476745605469, -0.0102996826171875, -0.009327888488769531, -0.008356094360351562, -0.007384300231933594, -0.006412506103515625, -0.005440711975097656, -0.0044689178466796875, -0.0034971237182617188, -0.00252532958984375, -0.0015535354614257812, -0.0005817413330078125, 0.00039005279541015625, 0.001361846923828125, 0.0023336410522460938, 0.0033054351806640625, 0.004277229309082031, 0.0052490234375, 0.006220817565917969, 0.0071926116943359375, 0.008164405822753906, 0.009136199951171875, 0.010107994079589844, 0.011079788208007812, 0.012051582336425781, 0.01302337646484375, 0.013995170593261719, 0.014966964721679688, 0.015938758850097656, 0.016910552978515625, 0.017882347106933594, 0.018854141235351562, 0.01982593536376953, 0.0207977294921875, 0.02176952362060547, 0.022741317749023438, 0.023713111877441406, 0.024684906005859375, 0.025656700134277344, 0.026628494262695312, 0.02760028839111328, 0.02857208251953125, 0.02954387664794922, 0.030515670776367188, 0.031487464904785156, 0.032459259033203125, 0.033431053161621094, 0.03440284729003906, 0.03537464141845703, 0.036346435546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 6.0, 17.0, 23.0, 28.0, 35.0, 39.0, 64.0, 81.0, 104.0, 153.0, 243.0, 371.0, 553.0, 863.0, 1597.0, 3241.0, 7641.0, 26772.0, 222886.0, 706731.0, 55273.0, 12102.0, 4424.0, 2136.0, 1113.0, 688.0, 385.0, 282.0, 168.0, 138.0, 103.0, 67.0, 43.0, 38.0, 34.0, 22.0, 20.0, 14.0, 13.0, 11.0, 6.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.2315673828125, -0.22390174865722656, -0.21623611450195312, -0.2085704803466797, -0.20090484619140625, -0.1932392120361328, -0.18557357788085938, -0.17790794372558594, -0.1702423095703125, -0.16257667541503906, -0.15491104125976562, -0.1472454071044922, -0.13957977294921875, -0.1319141387939453, -0.12424850463867188, -0.11658287048339844, -0.108917236328125, -0.10125160217285156, -0.09358596801757812, -0.08592033386230469, -0.07825469970703125, -0.07058906555175781, -0.06292343139648438, -0.05525779724121094, -0.0475921630859375, -0.03992652893066406, -0.032260894775390625, -0.024595260620117188, -0.01692962646484375, -0.009263992309570312, -0.001598358154296875, 0.0060672760009765625, 0.01373291015625, 0.021398544311523438, 0.029064178466796875, 0.03672981262207031, 0.04439544677734375, 0.05206108093261719, 0.059726715087890625, 0.06739234924316406, 0.0750579833984375, 0.08272361755371094, 0.09038925170898438, 0.09805488586425781, 0.10572052001953125, 0.11338615417480469, 0.12105178833007812, 0.12871742248535156, 0.136383056640625, 0.14404869079589844, 0.15171432495117188, 0.1593799591064453, 0.16704559326171875, 0.1747112274169922, 0.18237686157226562, 0.19004249572753906, 0.1977081298828125, 0.20537376403808594, 0.21303939819335938, 0.2207050323486328, 0.22837066650390625, 0.2360363006591797, 0.24370193481445312, 0.25136756896972656, 0.259033203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 8.0, 9.0, 3.0, 5.0, 19.0, 9.0, 9.0, 15.0, 12.0, 13.0, 24.0, 22.0, 26.0, 35.0, 32.0, 23.0, 38.0, 22.0, 33.0, 33.0, 32.0, 40.0, 30.0, 37.0, 33.0, 48.0, 30.0, 39.0, 33.0, 39.0, 29.0, 28.0, 32.0, 11.0, 27.0, 17.0, 16.0, 14.0, 16.0, 14.0, 7.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0], "bins": [-0.12493896484375, -0.12144184112548828, -0.11794471740722656, -0.11444759368896484, -0.11095046997070312, -0.1074533462524414, -0.10395622253417969, -0.10045909881591797, -0.09696197509765625, -0.09346485137939453, -0.08996772766113281, -0.0864706039428711, -0.08297348022460938, -0.07947635650634766, -0.07597923278808594, -0.07248210906982422, -0.0689849853515625, -0.06548786163330078, -0.06199073791503906, -0.058493614196777344, -0.054996490478515625, -0.051499366760253906, -0.04800224304199219, -0.04450511932373047, -0.04100799560546875, -0.03751087188720703, -0.03401374816894531, -0.030516624450683594, -0.027019500732421875, -0.023522377014160156, -0.020025253295898438, -0.01652812957763672, -0.013031005859375, -0.009533882141113281, -0.0060367584228515625, -0.0025396347045898438, 0.000957489013671875, 0.004454612731933594, 0.007951736450195312, 0.011448860168457031, 0.01494598388671875, 0.01844310760498047, 0.021940231323242188, 0.025437355041503906, 0.028934478759765625, 0.032431602478027344, 0.03592872619628906, 0.03942584991455078, 0.0429229736328125, 0.04642009735107422, 0.04991722106933594, 0.053414344787597656, 0.056911468505859375, 0.060408592224121094, 0.06390571594238281, 0.06740283966064453, 0.07089996337890625, 0.07439708709716797, 0.07789421081542969, 0.0813913345336914, 0.08488845825195312, 0.08838558197021484, 0.09188270568847656, 0.09537982940673828, 0.098876953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 11.0, 5.0, 12.0, 12.0, 19.0, 45.0, 60.0, 74.0, 147.0, 275.0, 507.0, 1217.0, 3640.0, 21157.0, 977027.0, 36970.0, 4645.0, 1322.0, 631.0, 312.0, 163.0, 99.0, 60.0, 41.0, 30.0, 14.0, 10.0, 9.0, 9.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49169921875, -0.4745025634765625, -0.457305908203125, -0.4401092529296875, -0.42291259765625, -0.4057159423828125, -0.388519287109375, -0.3713226318359375, -0.3541259765625, -0.3369293212890625, -0.319732666015625, -0.3025360107421875, -0.28533935546875, -0.2681427001953125, -0.250946044921875, -0.2337493896484375, -0.216552734375, -0.1993560791015625, -0.182159423828125, -0.1649627685546875, -0.14776611328125, -0.1305694580078125, -0.113372802734375, -0.0961761474609375, -0.0789794921875, -0.0617828369140625, -0.044586181640625, -0.0273895263671875, -0.01019287109375, 0.0070037841796875, 0.024200439453125, 0.0413970947265625, 0.05859375, 0.0757904052734375, 0.092987060546875, 0.1101837158203125, 0.12738037109375, 0.1445770263671875, 0.161773681640625, 0.1789703369140625, 0.1961669921875, 0.2133636474609375, 0.230560302734375, 0.2477569580078125, 0.26495361328125, 0.2821502685546875, 0.299346923828125, 0.3165435791015625, 0.333740234375, 0.3509368896484375, 0.368133544921875, 0.3853302001953125, 0.40252685546875, 0.4197235107421875, 0.436920166015625, 0.4541168212890625, 0.4713134765625, 0.4885101318359375, 0.505706787109375, 0.5229034423828125, 0.54010009765625, 0.5572967529296875, 0.574493408203125, 0.5916900634765625, 0.60888671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 4.0, 9.0, 12.0, 13.0, 11.0, 21.0, 18.0, 39.0, 36.0, 55.0, 65.0, 84.0, 124.0, 103.0, 89.0, 58.0, 61.0, 35.0, 28.0, 27.0, 21.0, 16.0, 11.0, 6.0, 10.0, 9.0, 4.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006322860717773438, -0.0006068795919418335, -0.0005814731121063232, -0.000556066632270813, -0.0005306601524353027, -0.0005052536725997925, -0.0004798471927642822, -0.00045444071292877197, -0.0004290342330932617, -0.00040362775325775146, -0.0003782212734222412, -0.00035281479358673096, -0.0003274083137512207, -0.00030200183391571045, -0.0002765953540802002, -0.00025118887424468994, -0.0002257823944091797, -0.00020037591457366943, -0.00017496943473815918, -0.00014956295490264893, -0.00012415647506713867, -9.874999523162842e-05, -7.334351539611816e-05, -4.793703556060791e-05, -2.2530555725097656e-05, 2.8759241104125977e-06, 2.828240394592285e-05, 5.3688883781433105e-05, 7.909536361694336e-05, 0.00010450184345245361, 0.00012990832328796387, 0.00015531480312347412, 0.00018072128295898438, 0.00020612776279449463, 0.00023153424263000488, 0.00025694072246551514, 0.0002823472023010254, 0.00030775368213653564, 0.0003331601619720459, 0.00035856664180755615, 0.0003839731216430664, 0.00040937960147857666, 0.0004347860813140869, 0.00046019256114959717, 0.0004855990409851074, 0.0005110055208206177, 0.0005364120006561279, 0.0005618184804916382, 0.0005872249603271484, 0.0006126314401626587, 0.0006380379199981689, 0.0006634443998336792, 0.0006888508796691895, 0.0007142573595046997, 0.00073966383934021, 0.0007650703191757202, 0.0007904767990112305, 0.0008158832788467407, 0.000841289758682251, 0.0008666962385177612, 0.0008921027183532715, 0.0009175091981887817, 0.000942915678024292, 0.0009683221578598022, 0.0009937286376953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 4.0, 3.0, 12.0, 8.0, 6.0, 5.0, 11.0, 29.0, 30.0, 46.0, 71.0, 98.0, 202.0, 255.0, 406.0, 700.0, 1251.0, 2577.0, 5516.0, 14444.0, 57111.0, 810276.0, 119377.0, 21412.0, 7687.0, 3240.0, 1601.0, 880.0, 489.0, 274.0, 182.0, 106.0, 69.0, 49.0, 35.0, 11.0, 17.0, 13.0, 17.0, 13.0, 7.0, 2.0, 3.0, 2.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.26806640625, -0.2596015930175781, -0.25113677978515625, -0.24267196655273438, -0.2342071533203125, -0.22574234008789062, -0.21727752685546875, -0.20881271362304688, -0.200347900390625, -0.19188308715820312, -0.18341827392578125, -0.17495346069335938, -0.1664886474609375, -0.15802383422851562, -0.14955902099609375, -0.14109420776367188, -0.13262939453125, -0.12416458129882812, -0.11569976806640625, -0.10723495483398438, -0.0987701416015625, -0.09030532836914062, -0.08184051513671875, -0.07337570190429688, -0.064910888671875, -0.056446075439453125, -0.04798126220703125, -0.039516448974609375, -0.0310516357421875, -0.022586822509765625, -0.01412200927734375, -0.005657196044921875, 0.0028076171875, 0.011272430419921875, 0.01973724365234375, 0.028202056884765625, 0.0366668701171875, 0.045131683349609375, 0.05359649658203125, 0.062061309814453125, 0.070526123046875, 0.07899093627929688, 0.08745574951171875, 0.09592056274414062, 0.1043853759765625, 0.11285018920898438, 0.12131500244140625, 0.12977981567382812, 0.13824462890625, 0.14670944213867188, 0.15517425537109375, 0.16363906860351562, 0.1721038818359375, 0.18056869506835938, 0.18903350830078125, 0.19749832153320312, 0.205963134765625, 0.21442794799804688, 0.22289276123046875, 0.23135757446289062, 0.2398223876953125, 0.24828720092773438, 0.25675201416015625, 0.2652168273925781, 0.273681640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 8.0, 10.0, 7.0, 15.0, 8.0, 20.0, 19.0, 26.0, 43.0, 62.0, 105.0, 195.0, 152.0, 82.0, 47.0, 45.0, 34.0, 18.0, 19.0, 8.0, 10.0, 9.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.265625, -0.257537841796875, -0.24945068359375, -0.241363525390625, -0.2332763671875, -0.225189208984375, -0.21710205078125, -0.209014892578125, -0.200927734375, -0.192840576171875, -0.18475341796875, -0.176666259765625, -0.1685791015625, -0.160491943359375, -0.15240478515625, -0.144317626953125, -0.13623046875, -0.128143310546875, -0.12005615234375, -0.111968994140625, -0.1038818359375, -0.095794677734375, -0.08770751953125, -0.079620361328125, -0.071533203125, -0.063446044921875, -0.05535888671875, -0.047271728515625, -0.0391845703125, -0.031097412109375, -0.02301025390625, -0.014923095703125, -0.0068359375, 0.001251220703125, 0.00933837890625, 0.017425537109375, 0.0255126953125, 0.033599853515625, 0.04168701171875, 0.049774169921875, 0.057861328125, 0.065948486328125, 0.07403564453125, 0.082122802734375, 0.0902099609375, 0.098297119140625, 0.10638427734375, 0.114471435546875, 0.12255859375, 0.130645751953125, 0.13873291015625, 0.146820068359375, 0.1549072265625, 0.162994384765625, 0.17108154296875, 0.179168701171875, 0.187255859375, 0.195343017578125, 0.20343017578125, 0.211517333984375, 0.2196044921875, 0.227691650390625, 0.23577880859375, 0.243865966796875, 0.251953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 17.0, 33.0, 111.0, 550.0, 203.0, 42.0, 14.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9412035942077637, -3.8085577487945557, -3.6759119033813477, -3.5432660579681396, -3.4106202125549316, -3.2779746055603027, -3.1453287601470947, -3.0126829147338867, -2.8800370693206787, -2.7473912239074707, -2.6147453784942627, -2.4820995330810547, -2.349453926086426, -2.2168078422546387, -2.0841622352600098, -1.9515163898468018, -1.8188705444335938, -1.6862246990203857, -1.5535788536071777, -1.4209331274032593, -1.2882872819900513, -1.1556414365768433, -1.0229957103729248, -0.8903498649597168, -0.7577040195465088, -0.6250581741333008, -0.49241238832473755, -0.35976657271385193, -0.2271207571029663, -0.0944749116897583, 0.03817087411880493, 0.17081665992736816, 0.30346250534057617, 0.4361083209514618, 0.5687541365623474, 0.7013999223709106, 0.8340457677841187, 0.9666916131973267, 1.0993373394012451, 1.2319831848144531, 1.3646290302276611, 1.4972748756408691, 1.6299207210540771, 1.7625664472579956, 1.8952122926712036, 2.027858257293701, 2.16050386428833, 2.293149709701538, 2.425795555114746, 2.558441400527954, 2.691087245941162, 2.82373309135437, 2.956378936767578, 3.089024543762207, 3.221670389175415, 3.354316234588623, 3.486962080001831, 3.619607925415039, 3.752253770828247, 3.884899616241455, 4.017545223236084, 4.150191307067871, 4.2828369140625, 4.415482521057129, 4.548128604888916]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 5.0, 8.0, 4.0, 6.0, 5.0, 14.0, 32.0, 46.0, 72.0, 87.0, 136.0, 155.0, 119.0, 108.0, 55.0, 43.0, 30.0, 16.0, 3.0, 8.0, 12.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.2524478435516357, -3.168166160583496, -3.0838844776153564, -2.999602794647217, -2.915320873260498, -2.8310391902923584, -2.7467575073242188, -2.662475824356079, -2.5781941413879395, -2.4939124584198, -2.40963077545166, -2.3253488540649414, -2.2410671710968018, -2.156785488128662, -2.0725038051605225, -1.9882221221923828, -1.903940200805664, -1.8196585178375244, -1.7353767156600952, -1.6510950326919556, -1.5668132305145264, -1.4825315475463867, -1.398249864578247, -1.3139681816101074, -1.2296863794326782, -1.1454046964645386, -1.0611228942871094, -0.9768412113189697, -0.8925594687461853, -0.8082777261734009, -0.7239960432052612, -0.6397143006324768, -0.5554323196411133, -0.47115057706832886, -0.3868688642978668, -0.3025871515274048, -0.21830540895462036, -0.13402366638183594, -0.04974198341369629, 0.034539759159088135, 0.11882150173187256, 0.2031032294034958, 0.287384957075119, 0.37166666984558105, 0.4559484124183655, 0.5402301549911499, 0.6245118379592896, 0.708793580532074, 0.7930753231048584, 0.8773570656776428, 0.9616388082504272, 1.045920491218567, 1.130202293395996, 1.2144839763641357, 1.2987656593322754, 1.383047342300415, 1.4673291444778442, 1.5516108274459839, 1.635892629623413, 1.7201743125915527, 1.8044559955596924, 1.8887377977371216, 1.9730194807052612, 2.0573012828826904, 2.14158296585083]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 2.0, 6.0, 1.0, 9.0, 5.0, 14.0, 12.0, 13.0, 23.0, 19.0, 34.0, 46.0, 112.0, 780.0, 24096.0, 4158305.0, 10194.0, 389.0, 77.0, 27.0, 25.0, 16.0, 13.0, 12.0, 8.0, 7.0, 5.0, 9.0, 3.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.365234375, -3.275299072265625, -3.18536376953125, -3.095428466796875, -3.0054931640625, -2.915557861328125, -2.82562255859375, -2.735687255859375, -2.645751953125, -2.555816650390625, -2.46588134765625, -2.375946044921875, -2.2860107421875, -2.196075439453125, -2.10614013671875, -2.016204833984375, -1.92626953125, -1.836334228515625, -1.74639892578125, -1.656463623046875, -1.5665283203125, -1.476593017578125, -1.38665771484375, -1.296722412109375, -1.206787109375, -1.116851806640625, -1.02691650390625, -0.936981201171875, -0.8470458984375, -0.757110595703125, -0.66717529296875, -0.577239990234375, -0.4873046875, -0.397369384765625, -0.30743408203125, -0.217498779296875, -0.1275634765625, -0.037628173828125, 0.05230712890625, 0.142242431640625, 0.232177734375, 0.322113037109375, 0.41204833984375, 0.501983642578125, 0.5919189453125, 0.681854248046875, 0.77178955078125, 0.861724853515625, 0.95166015625, 1.041595458984375, 1.13153076171875, 1.221466064453125, 1.3114013671875, 1.401336669921875, 1.49127197265625, 1.581207275390625, 1.671142578125, 1.761077880859375, 1.85101318359375, 1.940948486328125, 2.0308837890625, 2.120819091796875, 2.21075439453125, 2.300689697265625, 2.390625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 9.0, 7.0, 8.0, 10.0, 12.0, 13.0, 24.0, 43.0, 94.0, 149.0, 211.0, 167.0, 95.0, 44.0, 23.0, 17.0, 8.0, 11.0, 12.0, 4.0, 2.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175628662109375, -0.0169217586517334, -0.016280651092529297, -0.015639543533325195, -0.014998435974121094, -0.014357328414916992, -0.01371622085571289, -0.013075113296508789, -0.012434005737304688, -0.011792898178100586, -0.011151790618896484, -0.010510683059692383, -0.009869575500488281, -0.00922846794128418, -0.008587360382080078, -0.007946252822875977, -0.007305145263671875, -0.0066640377044677734, -0.006022930145263672, -0.00538182258605957, -0.004740715026855469, -0.004099607467651367, -0.0034584999084472656, -0.002817392349243164, -0.0021762847900390625, -0.001535177230834961, -0.0008940696716308594, -0.0002529621124267578, 0.00038814544677734375, 0.0010292530059814453, 0.0016703605651855469, 0.0023114681243896484, 0.00295257568359375, 0.0035936832427978516, 0.004234790802001953, 0.004875898361206055, 0.005517005920410156, 0.006158113479614258, 0.006799221038818359, 0.007440328598022461, 0.008081436157226562, 0.008722543716430664, 0.009363651275634766, 0.010004758834838867, 0.010645866394042969, 0.01128697395324707, 0.011928081512451172, 0.012569189071655273, 0.013210296630859375, 0.013851404190063477, 0.014492511749267578, 0.01513361930847168, 0.01577472686767578, 0.016415834426879883, 0.017056941986083984, 0.017698049545288086, 0.018339157104492188, 0.01898026466369629, 0.01962137222290039, 0.020262479782104492, 0.020903587341308594, 0.021544694900512695, 0.022185802459716797, 0.0228269100189209, 0.023468017578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 7.0, 11.0, 11.0, 10.0, 15.0, 22.0, 30.0, 39.0, 59.0, 55.0, 81.0, 127.0, 210.0, 490.0, 1640.0, 12268.0, 2921411.0, 1244959.0, 10084.0, 1524.0, 458.0, 245.0, 144.0, 86.0, 74.0, 62.0, 32.0, 25.0, 21.0, 19.0, 11.0, 12.0, 9.0, 9.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.470947265625, -0.4541053771972656, -0.43726348876953125, -0.4204216003417969, -0.4035797119140625, -0.3867378234863281, -0.36989593505859375, -0.3530540466308594, -0.336212158203125, -0.3193702697753906, -0.30252838134765625, -0.2856864929199219, -0.2688446044921875, -0.2520027160644531, -0.23516082763671875, -0.21831893920898438, -0.20147705078125, -0.18463516235351562, -0.16779327392578125, -0.15095138549804688, -0.1341094970703125, -0.11726760864257812, -0.10042572021484375, -0.08358383178710938, -0.066741943359375, -0.049900054931640625, -0.03305816650390625, -0.016216278076171875, 0.0006256103515625, 0.017467498779296875, 0.03430938720703125, 0.051151275634765625, 0.0679931640625, 0.08483505249023438, 0.10167694091796875, 0.11851882934570312, 0.1353607177734375, 0.15220260620117188, 0.16904449462890625, 0.18588638305664062, 0.202728271484375, 0.21957015991210938, 0.23641204833984375, 0.2532539367675781, 0.2700958251953125, 0.2869377136230469, 0.30377960205078125, 0.3206214904785156, 0.33746337890625, 0.3543052673339844, 0.37114715576171875, 0.3879890441894531, 0.4048309326171875, 0.4216728210449219, 0.43851470947265625, 0.4553565979003906, 0.472198486328125, 0.4890403747558594, 0.5058822631835938, 0.5227241516113281, 0.5395660400390625, 0.5564079284667969, 0.5732498168945312, 0.5900917053222656, 0.60693359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 10.0, 15.0, 18.0, 18.0, 36.0, 64.0, 133.0, 371.0, 948.0, 1438.0, 581.0, 193.0, 92.0, 39.0, 28.0, 25.0, 15.0, 11.0, 9.0, 5.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044281005859375, -0.0430607795715332, -0.041840553283691406, -0.04062032699584961, -0.03940010070800781, -0.038179874420166016, -0.03695964813232422, -0.03573942184448242, -0.034519195556640625, -0.03329896926879883, -0.03207874298095703, -0.030858516693115234, -0.029638290405273438, -0.02841806411743164, -0.027197837829589844, -0.025977611541748047, -0.02475738525390625, -0.023537158966064453, -0.022316932678222656, -0.02109670639038086, -0.019876480102539062, -0.018656253814697266, -0.01743602752685547, -0.016215801239013672, -0.014995574951171875, -0.013775348663330078, -0.012555122375488281, -0.011334896087646484, -0.010114669799804688, -0.00889444351196289, -0.007674217224121094, -0.006453990936279297, -0.0052337646484375, -0.004013538360595703, -0.0027933120727539062, -0.0015730857849121094, -0.0003528594970703125, 0.0008673667907714844, 0.0020875930786132812, 0.003307819366455078, 0.004528045654296875, 0.005748271942138672, 0.006968498229980469, 0.008188724517822266, 0.009408950805664062, 0.01062917709350586, 0.011849403381347656, 0.013069629669189453, 0.01428985595703125, 0.015510082244873047, 0.016730308532714844, 0.01795053482055664, 0.019170761108398438, 0.020390987396240234, 0.02161121368408203, 0.022831439971923828, 0.024051666259765625, 0.025271892547607422, 0.02649211883544922, 0.027712345123291016, 0.028932571411132812, 0.03015279769897461, 0.031373023986816406, 0.0325932502746582, 0.0338134765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 18.0, 117.0, 674.0, 162.0, 18.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41194289922714233, -0.37945497035980225, -0.34696701169013977, -0.3144790530204773, -0.2819911241531372, -0.24950318038463593, -0.21701523661613464, -0.18452729284763336, -0.15203934907913208, -0.1195514053106308, -0.08706346154212952, -0.054575517773628235, -0.022087574005126953, 0.010400369763374329, 0.04288831353187561, 0.07537625730037689, 0.10786420106887817, 0.14035214483737946, 0.17284008860588074, 0.20532803237438202, 0.2378159761428833, 0.2703039050102234, 0.30279186367988586, 0.33527982234954834, 0.3677677512168884, 0.4002556800842285, 0.432743638753891, 0.46523159742355347, 0.49771952629089355, 0.5302074551582336, 0.5626953840255737, 0.5951833724975586, 0.6276713609695435, 0.6601592898368835, 0.6926472187042236, 0.7251352071762085, 0.7576231360435486, 0.7901110649108887, 0.8225990533828735, 0.8550869822502136, 0.8875749111175537, 0.9200628399848938, 0.9525507688522339, 0.9850387573242188, 1.017526626586914, 1.050014615058899, 1.0825026035308838, 1.114990472793579, 1.147478461265564, 1.1799664497375488, 1.2124543190002441, 1.244942307472229, 1.2774302959442139, 1.3099181652069092, 1.342406153678894, 1.3748940229415894, 1.4073820114135742, 1.439869999885559, 1.4723578691482544, 1.5048458576202393, 1.5373337268829346, 1.5698217153549194, 1.6023097038269043, 1.6347975730895996, 1.6672855615615845]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 1.0, 10.0, 6.0, 7.0, 14.0, 21.0, 15.0, 18.0, 20.0, 20.0, 32.0, 38.0, 34.0, 32.0, 37.0, 39.0, 52.0, 49.0, 56.0, 61.0, 45.0, 42.0, 47.0, 52.0, 32.0, 30.0, 26.0, 25.0, 30.0, 17.0, 15.0, 14.0, 19.0, 10.0, 11.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12242555618286133, -0.11850714683532715, -0.11458873748779297, -0.11067032814025879, -0.10675191879272461, -0.10283350944519043, -0.09891509264707565, -0.09499668329954147, -0.0910782739520073, -0.08715986460447311, -0.08324145525693893, -0.07932304590940475, -0.07540462911128998, -0.0714862197637558, -0.06756781041622162, -0.06364940106868744, -0.05973099172115326, -0.05581258237361908, -0.0518941730260849, -0.04797575995326042, -0.04405735060572624, -0.04013894125819206, -0.036220528185367584, -0.032302118837833405, -0.028383709490299225, -0.024465300142765045, -0.020546888932585716, -0.016628477722406387, -0.012710068374872208, -0.008791659027338028, -0.004873247817158699, -0.0009548366069793701, 0.0029635727405548096, 0.006881983019411564, 0.010800393298268318, 0.014718803577125072, 0.018637213855981827, 0.022555623203516006, 0.026474034413695335, 0.030392445623874664, 0.034310854971408844, 0.038229264318943024, 0.0421476736664772, 0.04606608673930168, 0.04998449608683586, 0.05390290543437004, 0.05782131850719452, 0.0617397278547287, 0.06565813720226288, 0.06957654654979706, 0.07349495589733124, 0.07741336524486542, 0.0813317745923996, 0.08525018393993378, 0.08916860073804855, 0.09308701008558273, 0.09700541943311691, 0.10092382878065109, 0.10484223812818527, 0.10876064747571945, 0.11267906427383423, 0.11659747362136841, 0.12051588296890259, 0.12443429231643677, 0.12835270166397095]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 20.0, 18.0, 24.0, 35.0, 55.0, 80.0, 101.0, 185.0, 254.0, 422.0, 607.0, 1023.0, 1788.0, 3444.0, 7717.0, 23070.0, 189102.0, 757972.0, 40953.0, 11094.0, 4765.0, 2283.0, 1320.0, 767.0, 454.0, 338.0, 190.0, 151.0, 105.0, 63.0, 32.0, 29.0, 24.0, 18.0, 8.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2587890625, -0.2504920959472656, -0.24219512939453125, -0.23389816284179688, -0.2256011962890625, -0.21730422973632812, -0.20900726318359375, -0.20071029663085938, -0.192413330078125, -0.18411636352539062, -0.17581939697265625, -0.16752243041992188, -0.1592254638671875, -0.15092849731445312, -0.14263153076171875, -0.13433456420898438, -0.12603759765625, -0.11774063110351562, -0.10944366455078125, -0.10114669799804688, -0.0928497314453125, -0.08455276489257812, -0.07625579833984375, -0.06795883178710938, -0.059661865234375, -0.051364898681640625, -0.04306793212890625, -0.034770965576171875, -0.0264739990234375, -0.018177032470703125, -0.00988006591796875, -0.001583099365234375, 0.0067138671875, 0.015010833740234375, 0.02330780029296875, 0.031604766845703125, 0.0399017333984375, 0.048198699951171875, 0.05649566650390625, 0.06479263305664062, 0.073089599609375, 0.08138656616210938, 0.08968353271484375, 0.09798049926757812, 0.1062774658203125, 0.11457443237304688, 0.12287139892578125, 0.13116836547851562, 0.13946533203125, 0.14776229858398438, 0.15605926513671875, 0.16435623168945312, 0.1726531982421875, 0.18095016479492188, 0.18924713134765625, 0.19754409790039062, 0.205841064453125, 0.21413803100585938, 0.22243499755859375, 0.23073196411132812, 0.2390289306640625, 0.24732589721679688, 0.25562286376953125, 0.2639198303222656, 0.272216796875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 5.0, 8.0, 8.0, 13.0, 9.0, 15.0, 13.0, 26.0, 52.0, 122.0, 152.0, 176.0, 126.0, 102.0, 55.0, 35.0, 19.0, 9.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01629638671875, -0.015737295150756836, -0.015178203582763672, -0.014619112014770508, -0.014060020446777344, -0.01350092887878418, -0.012941837310791016, -0.012382745742797852, -0.011823654174804688, -0.011264562606811523, -0.01070547103881836, -0.010146379470825195, -0.009587287902832031, -0.009028196334838867, -0.008469104766845703, -0.007910013198852539, -0.007350921630859375, -0.006791830062866211, -0.006232738494873047, -0.005673646926879883, -0.005114555358886719, -0.004555463790893555, -0.003996372222900391, -0.0034372806549072266, -0.0028781890869140625, -0.0023190975189208984, -0.0017600059509277344, -0.0012009143829345703, -0.0006418228149414062, -8.273124694824219e-05, 0.0004763603210449219, 0.001035451889038086, 0.00159454345703125, 0.002153635025024414, 0.002712726593017578, 0.003271818161010742, 0.0038309097290039062, 0.00439000129699707, 0.004949092864990234, 0.0055081844329833984, 0.0060672760009765625, 0.0066263675689697266, 0.007185459136962891, 0.007744550704956055, 0.008303642272949219, 0.008862733840942383, 0.009421825408935547, 0.009980916976928711, 0.010540008544921875, 0.011099100112915039, 0.011658191680908203, 0.012217283248901367, 0.012776374816894531, 0.013335466384887695, 0.01389455795288086, 0.014453649520874023, 0.015012741088867188, 0.015571832656860352, 0.016130924224853516, 0.01669001579284668, 0.017249107360839844, 0.017808198928833008, 0.018367290496826172, 0.018926382064819336, 0.0194854736328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 2.0, 4.0, 18.0, 18.0, 13.0, 32.0, 40.0, 69.0, 99.0, 144.0, 233.0, 344.0, 622.0, 1116.0, 2320.0, 6053.0, 25088.0, 427772.0, 547233.0, 26329.0, 6049.0, 2361.0, 1116.0, 551.0, 321.0, 203.0, 129.0, 90.0, 43.0, 37.0, 30.0, 10.0, 13.0, 14.0, 12.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2481689453125, -0.24042129516601562, -0.23267364501953125, -0.22492599487304688, -0.2171783447265625, -0.20943069458007812, -0.20168304443359375, -0.19393539428710938, -0.186187744140625, -0.17844009399414062, -0.17069244384765625, -0.16294479370117188, -0.1551971435546875, -0.14744949340820312, -0.13970184326171875, -0.13195419311523438, -0.12420654296875, -0.11645889282226562, -0.10871124267578125, -0.10096359252929688, -0.0932159423828125, -0.08546829223632812, -0.07772064208984375, -0.06997299194335938, -0.062225341796875, -0.054477691650390625, -0.04673004150390625, -0.038982391357421875, -0.0312347412109375, -0.023487091064453125, -0.01573944091796875, -0.007991790771484375, -0.000244140625, 0.007503509521484375, 0.01525115966796875, 0.022998809814453125, 0.0307464599609375, 0.038494110107421875, 0.04624176025390625, 0.053989410400390625, 0.061737060546875, 0.06948471069335938, 0.07723236083984375, 0.08498001098632812, 0.0927276611328125, 0.10047531127929688, 0.10822296142578125, 0.11597061157226562, 0.12371826171875, 0.13146591186523438, 0.13921356201171875, 0.14696121215820312, 0.1547088623046875, 0.16245651245117188, 0.17020416259765625, 0.17795181274414062, 0.185699462890625, 0.19344711303710938, 0.20119476318359375, 0.20894241333007812, 0.2166900634765625, 0.22443771362304688, 0.23218536376953125, 0.23993301391601562, 0.2476806640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 9.0, 13.0, 29.0, 12.0, 22.0, 21.0, 18.0, 29.0, 30.0, 28.0, 40.0, 46.0, 46.0, 49.0, 44.0, 57.0, 47.0, 53.0, 41.0, 48.0, 41.0, 38.0, 36.0, 47.0, 38.0, 17.0, 10.0, 15.0, 12.0, 11.0, 8.0, 8.0, 3.0, 6.0, 5.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0777587890625, -0.0754852294921875, -0.073211669921875, -0.0709381103515625, -0.06866455078125, -0.0663909912109375, -0.064117431640625, -0.0618438720703125, -0.0595703125, -0.0572967529296875, -0.055023193359375, -0.0527496337890625, -0.05047607421875, -0.0482025146484375, -0.045928955078125, -0.0436553955078125, -0.0413818359375, -0.0391082763671875, -0.036834716796875, -0.0345611572265625, -0.03228759765625, -0.0300140380859375, -0.027740478515625, -0.0254669189453125, -0.023193359375, -0.0209197998046875, -0.018646240234375, -0.0163726806640625, -0.01409912109375, -0.0118255615234375, -0.009552001953125, -0.0072784423828125, -0.0050048828125, -0.0027313232421875, -0.000457763671875, 0.0018157958984375, 0.00408935546875, 0.0063629150390625, 0.008636474609375, 0.0109100341796875, 0.01318359375, 0.0154571533203125, 0.017730712890625, 0.0200042724609375, 0.02227783203125, 0.0245513916015625, 0.026824951171875, 0.0290985107421875, 0.0313720703125, 0.0336456298828125, 0.035919189453125, 0.0381927490234375, 0.04046630859375, 0.0427398681640625, 0.045013427734375, 0.0472869873046875, 0.049560546875, 0.0518341064453125, 0.054107666015625, 0.0563812255859375, 0.05865478515625, 0.0609283447265625, 0.063201904296875, 0.0654754638671875, 0.0677490234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 6.0, 11.0, 19.0, 14.0, 34.0, 33.0, 48.0, 64.0, 109.0, 198.0, 357.0, 650.0, 1293.0, 3104.0, 10418.0, 130575.0, 867419.0, 25122.0, 5166.0, 1874.0, 866.0, 435.0, 259.0, 138.0, 83.0, 62.0, 40.0, 39.0, 28.0, 18.0, 18.0, 13.0, 12.0, 5.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24853515625, -0.23868560791015625, -0.2288360595703125, -0.21898651123046875, -0.209136962890625, -0.19928741455078125, -0.1894378662109375, -0.17958831787109375, -0.16973876953125, -0.15988922119140625, -0.1500396728515625, -0.14019012451171875, -0.130340576171875, -0.12049102783203125, -0.1106414794921875, -0.10079193115234375, -0.0909423828125, -0.08109283447265625, -0.0712432861328125, -0.06139373779296875, -0.051544189453125, -0.04169464111328125, -0.0318450927734375, -0.02199554443359375, -0.01214599609375, -0.00229644775390625, 0.0075531005859375, 0.01740264892578125, 0.027252197265625, 0.03710174560546875, 0.0469512939453125, 0.05680084228515625, 0.066650390625, 0.07649993896484375, 0.0863494873046875, 0.09619903564453125, 0.106048583984375, 0.11589813232421875, 0.1257476806640625, 0.13559722900390625, 0.14544677734375, 0.15529632568359375, 0.1651458740234375, 0.17499542236328125, 0.184844970703125, 0.19469451904296875, 0.2045440673828125, 0.21439361572265625, 0.2242431640625, 0.23409271240234375, 0.2439422607421875, 0.25379180908203125, 0.263641357421875, 0.27349090576171875, 0.2833404541015625, 0.29319000244140625, 0.30303955078125, 0.31288909912109375, 0.3227386474609375, 0.33258819580078125, 0.342437744140625, 0.35228729248046875, 0.3621368408203125, 0.37198638916015625, 0.3818359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 2.0, 4.0, 6.0, 7.0, 14.0, 10.0, 30.0, 44.0, 63.0, 135.0, 344.0, 116.0, 74.0, 46.0, 28.0, 10.0, 6.0, 4.0, 8.0, 5.0, 8.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009541511535644531, -0.0009218230843544006, -0.0008894950151443481, -0.0008571669459342957, -0.0008248388767242432, -0.0007925108075141907, -0.0007601827383041382, -0.0007278546690940857, -0.0006955265998840332, -0.0006631985306739807, -0.0006308704614639282, -0.0005985423922538757, -0.0005662143230438232, -0.0005338862538337708, -0.0005015581846237183, -0.00046923011541366577, -0.0004369020462036133, -0.0004045739769935608, -0.0003722459077835083, -0.0003399178385734558, -0.0003075897693634033, -0.00027526170015335083, -0.00024293363094329834, -0.00021060556173324585, -0.00017827749252319336, -0.00014594942331314087, -0.00011362135410308838, -8.129328489303589e-05, -4.89652156829834e-05, -1.6637146472930908e-05, 1.5690922737121582e-05, 4.801899194717407e-05, 8.034706115722656e-05, 0.00011267513036727905, 0.00014500319957733154, 0.00017733126878738403, 0.00020965933799743652, 0.00024198740720748901, 0.0002743154764175415, 0.000306643545627594, 0.0003389716148376465, 0.000371299684047699, 0.00040362775325775146, 0.00043595582246780396, 0.00046828389167785645, 0.0005006119608879089, 0.0005329400300979614, 0.0005652680993080139, 0.0005975961685180664, 0.0006299242377281189, 0.0006622523069381714, 0.0006945803761482239, 0.0007269084453582764, 0.0007592365145683289, 0.0007915645837783813, 0.0008238926529884338, 0.0008562207221984863, 0.0008885487914085388, 0.0009208768606185913, 0.0009532049298286438, 0.0009855329990386963, 0.0010178610682487488, 0.0010501891374588013, 0.0010825172066688538, 0.0011148452758789062]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 10.0, 11.0, 34.0, 40.0, 75.0, 135.0, 314.0, 641.0, 1580.0, 5200.0, 22395.0, 251763.0, 702763.0, 49726.0, 9158.0, 2764.0, 1022.0, 426.0, 211.0, 107.0, 68.0, 36.0, 19.0, 16.0, 7.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19482421875, -0.18877410888671875, -0.1827239990234375, -0.17667388916015625, -0.170623779296875, -0.16457366943359375, -0.1585235595703125, -0.15247344970703125, -0.14642333984375, -0.14037322998046875, -0.1343231201171875, -0.12827301025390625, -0.122222900390625, -0.11617279052734375, -0.1101226806640625, -0.10407257080078125, -0.0980224609375, -0.09197235107421875, -0.0859222412109375, -0.07987213134765625, -0.073822021484375, -0.06777191162109375, -0.0617218017578125, -0.05567169189453125, -0.04962158203125, -0.04357147216796875, -0.0375213623046875, -0.03147125244140625, -0.025421142578125, -0.01937103271484375, -0.0133209228515625, -0.00727081298828125, -0.001220703125, 0.00482940673828125, 0.0108795166015625, 0.01692962646484375, 0.022979736328125, 0.02902984619140625, 0.0350799560546875, 0.04113006591796875, 0.04718017578125, 0.05323028564453125, 0.0592803955078125, 0.06533050537109375, 0.071380615234375, 0.07743072509765625, 0.0834808349609375, 0.08953094482421875, 0.0955810546875, 0.10163116455078125, 0.1076812744140625, 0.11373138427734375, 0.119781494140625, 0.12583160400390625, 0.1318817138671875, 0.13793182373046875, 0.14398193359375, 0.15003204345703125, 0.1560821533203125, 0.16213226318359375, 0.168182373046875, 0.17423248291015625, 0.1802825927734375, 0.18633270263671875, 0.1923828125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 9.0, 7.0, 8.0, 13.0, 14.0, 32.0, 49.0, 50.0, 79.0, 110.0, 121.0, 135.0, 85.0, 77.0, 53.0, 36.0, 27.0, 21.0, 11.0, 7.0, 12.0, 7.0, 3.0, 3.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1357421875, -0.13149452209472656, -0.12724685668945312, -0.12299919128417969, -0.11875152587890625, -0.11450386047363281, -0.11025619506835938, -0.10600852966308594, -0.1017608642578125, -0.09751319885253906, -0.09326553344726562, -0.08901786804199219, -0.08477020263671875, -0.08052253723144531, -0.07627487182617188, -0.07202720642089844, -0.067779541015625, -0.06353187561035156, -0.059284210205078125, -0.05503654479980469, -0.05078887939453125, -0.04654121398925781, -0.042293548583984375, -0.03804588317871094, -0.0337982177734375, -0.029550552368164062, -0.025302886962890625, -0.021055221557617188, -0.01680755615234375, -0.012559890747070312, -0.008312225341796875, -0.0040645599365234375, 0.00018310546875, 0.0044307708740234375, 0.008678436279296875, 0.012926101684570312, 0.01717376708984375, 0.021421432495117188, 0.025669097900390625, 0.029916763305664062, 0.0341644287109375, 0.03841209411621094, 0.042659759521484375, 0.04690742492675781, 0.05115509033203125, 0.05540275573730469, 0.059650421142578125, 0.06389808654785156, 0.068145751953125, 0.07239341735839844, 0.07664108276367188, 0.08088874816894531, 0.08513641357421875, 0.08938407897949219, 0.09363174438476562, 0.09787940979003906, 0.1021270751953125, 0.10637474060058594, 0.11062240600585938, 0.11487007141113281, 0.11911773681640625, 0.12336540222167969, 0.12761306762695312, 0.13186073303222656, 0.1361083984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 11.0, 21.0, 60.0, 215.0, 377.0, 160.0, 61.0, 33.0, 11.0, 12.0, 5.0, 6.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1713391542434692, -1.1339681148529053, -1.0965971946716309, -1.059226155281067, -1.021855115890503, -0.9844841361045837, -0.9471131563186646, -0.9097421169281006, -0.8723711371421814, -0.8350001573562622, -0.7976291179656982, -0.760258138179779, -0.7228871583938599, -0.6855161190032959, -0.6481451392173767, -0.6107741594314575, -0.5734031200408936, -0.5360321402549744, -0.4986611008644104, -0.4612901210784912, -0.42391911149024963, -0.38654810190200806, -0.34917712211608887, -0.3118061125278473, -0.2744351029396057, -0.23706409335136414, -0.19969309866428375, -0.16232210397720337, -0.12495109438896179, -0.08758008480072021, -0.05020909011363983, -0.012838095426559448, 0.02453303337097168, 0.06190403550863266, 0.09927503764629364, 0.13664603233337402, 0.1740170419216156, 0.21138805150985718, 0.24875904619693756, 0.28613004088401794, 0.3235010504722595, 0.3608720600605011, 0.3982430696487427, 0.43561404943466187, 0.47298505902290344, 0.510356068611145, 0.5477270483970642, 0.5850980281829834, 0.6224690675735474, 0.6598400473594666, 0.6972110867500305, 0.7345820665359497, 0.7719531059265137, 0.8093240857124329, 0.846695065498352, 0.884066104888916, 0.9214370846748352, 0.9588080644607544, 0.9961791038513184, 1.0335501432418823, 1.0709210634231567, 1.1082921028137207, 1.1456631422042847, 1.183034062385559, 1.220405101776123]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 6.0, 11.0, 7.0, 14.0, 8.0, 18.0, 23.0, 27.0, 22.0, 53.0, 56.0, 81.0, 63.0, 84.0, 57.0, 94.0, 54.0, 58.0, 60.0, 42.0, 25.0, 19.0, 15.0, 19.0, 13.0, 10.0, 5.0, 3.0, 4.0, 6.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6412411332130432, -0.6204051971435547, -0.5995692014694214, -0.5787332653999329, -0.5578973293304443, -0.537061333656311, -0.5162253975868225, -0.4953894317150116, -0.4745534658432007, -0.45371749997138977, -0.43288153409957886, -0.41204559803009033, -0.3912096321582794, -0.3703736662864685, -0.34953773021698, -0.32870176434516907, -0.30786579847335815, -0.28702983260154724, -0.26619386672973633, -0.2453579306602478, -0.2245219647884369, -0.20368599891662598, -0.18285004794597626, -0.16201409697532654, -0.14117813110351562, -0.12034217268228531, -0.09950621426105499, -0.07867025583982468, -0.05783429741859436, -0.036998338997364044, -0.016162380576133728, 0.004673570394515991, 0.02550959587097168, 0.046345554292201996, 0.06718151271343231, 0.08801747113466263, 0.10885342955589294, 0.12968939542770386, 0.15052534639835358, 0.1713612973690033, 0.1921972632408142, 0.21303322911262512, 0.23386918008327484, 0.25470513105392456, 0.2755410969257355, 0.2963770627975464, 0.3172129988670349, 0.3380489647388458, 0.35888493061065674, 0.37972089648246765, 0.40055686235427856, 0.4213927984237671, 0.442228764295578, 0.4630647301673889, 0.48390066623687744, 0.5047366619110107, 0.5255725979804993, 0.5464085340499878, 0.5672445297241211, 0.5880804657936096, 0.6089164018630981, 0.6297523975372314, 0.65058833360672, 0.6714242696762085, 0.6922602653503418]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 5.0, 5.0, 2.0, 3.0, 6.0, 7.0, 6.0, 4.0, 13.0, 21.0, 7.0, 10.0, 26.0, 17.0, 33.0, 39.0, 257.0, 2377.0, 516777.0, 3672083.0, 2167.0, 226.0, 45.0, 25.0, 25.0, 5.0, 11.0, 7.0, 12.0, 13.0, 8.0, 2.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-1.7744140625, -1.7251739501953125, -1.675933837890625, -1.6266937255859375, -1.57745361328125, -1.5282135009765625, -1.478973388671875, -1.4297332763671875, -1.3804931640625, -1.3312530517578125, -1.282012939453125, -1.2327728271484375, -1.18353271484375, -1.1342926025390625, -1.085052490234375, -1.0358123779296875, -0.986572265625, -0.9373321533203125, -0.888092041015625, -0.8388519287109375, -0.78961181640625, -0.7403717041015625, -0.691131591796875, -0.6418914794921875, -0.5926513671875, -0.5434112548828125, -0.494171142578125, -0.4449310302734375, -0.39569091796875, -0.3464508056640625, -0.297210693359375, -0.2479705810546875, -0.19873046875, -0.1494903564453125, -0.100250244140625, -0.0510101318359375, -0.00177001953125, 0.0474700927734375, 0.096710205078125, 0.1459503173828125, 0.1951904296875, 0.2444305419921875, 0.293670654296875, 0.3429107666015625, 0.39215087890625, 0.4413909912109375, 0.490631103515625, 0.5398712158203125, 0.589111328125, 0.6383514404296875, 0.687591552734375, 0.7368316650390625, 0.78607177734375, 0.8353118896484375, 0.884552001953125, 0.9337921142578125, 0.9830322265625, 1.0322723388671875, 1.081512451171875, 1.1307525634765625, 1.17999267578125, 1.2292327880859375, 1.278472900390625, 1.3277130126953125, 1.376953125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 6.0, 2.0, 7.0, 5.0, 5.0, 7.0, 3.0, 6.0, 7.0, 21.0, 29.0, 36.0, 33.0, 70.0, 116.0, 139.0, 133.0, 102.0, 92.0, 61.0, 35.0, 22.0, 10.0, 8.0, 10.0, 9.0, 7.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0153350830078125, -0.014882326126098633, -0.014429569244384766, -0.013976812362670898, -0.013524055480957031, -0.013071298599243164, -0.012618541717529297, -0.01216578483581543, -0.011713027954101562, -0.011260271072387695, -0.010807514190673828, -0.010354757308959961, -0.009902000427246094, -0.009449243545532227, -0.00899648666381836, -0.008543729782104492, -0.008090972900390625, -0.007638216018676758, -0.007185459136962891, -0.0067327022552490234, -0.006279945373535156, -0.005827188491821289, -0.005374431610107422, -0.004921674728393555, -0.0044689178466796875, -0.00401616096496582, -0.003563404083251953, -0.003110647201538086, -0.0026578903198242188, -0.0022051334381103516, -0.0017523765563964844, -0.0012996196746826172, -0.00084686279296875, -0.0003941059112548828, 5.8650970458984375e-05, 0.0005114078521728516, 0.0009641647338867188, 0.001416921615600586, 0.0018696784973144531, 0.0023224353790283203, 0.0027751922607421875, 0.0032279491424560547, 0.003680706024169922, 0.004133462905883789, 0.004586219787597656, 0.0050389766693115234, 0.005491733551025391, 0.005944490432739258, 0.006397247314453125, 0.006850004196166992, 0.007302761077880859, 0.0077555179595947266, 0.008208274841308594, 0.008661031723022461, 0.009113788604736328, 0.009566545486450195, 0.010019302368164062, 0.01047205924987793, 0.010924816131591797, 0.011377573013305664, 0.011830329895019531, 0.012283086776733398, 0.012735843658447266, 0.013188600540161133, 0.013641357421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 0.0, 2.0, 3.0, 5.0, 5.0, 9.0, 13.0, 16.0, 34.0, 46.0, 79.0, 194.0, 483.0, 3398.0, 1238347.0, 2946328.0, 4358.0, 533.0, 191.0, 99.0, 48.0, 37.0, 17.0, 15.0, 5.0, 7.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.87353515625, -0.85369873046875, -0.8338623046875, -0.81402587890625, -0.794189453125, -0.77435302734375, -0.7545166015625, -0.73468017578125, -0.71484375, -0.69500732421875, -0.6751708984375, -0.65533447265625, -0.635498046875, -0.61566162109375, -0.5958251953125, -0.57598876953125, -0.55615234375, -0.53631591796875, -0.5164794921875, -0.49664306640625, -0.476806640625, -0.45697021484375, -0.4371337890625, -0.41729736328125, -0.3974609375, -0.37762451171875, -0.3577880859375, -0.33795166015625, -0.318115234375, -0.29827880859375, -0.2784423828125, -0.25860595703125, -0.23876953125, -0.21893310546875, -0.1990966796875, -0.17926025390625, -0.159423828125, -0.13958740234375, -0.1197509765625, -0.09991455078125, -0.080078125, -0.06024169921875, -0.0404052734375, -0.02056884765625, -0.000732421875, 0.01910400390625, 0.0389404296875, 0.05877685546875, 0.07861328125, 0.09844970703125, 0.1182861328125, 0.13812255859375, 0.157958984375, 0.17779541015625, 0.1976318359375, 0.21746826171875, 0.2373046875, 0.25714111328125, 0.2769775390625, 0.29681396484375, 0.316650390625, 0.33648681640625, 0.3563232421875, 0.37615966796875, 0.39599609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 7.0, 8.0, 11.0, 13.0, 25.0, 29.0, 34.0, 72.0, 131.0, 249.0, 457.0, 858.0, 969.0, 556.0, 283.0, 134.0, 76.0, 45.0, 29.0, 16.0, 16.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.030792236328125, -0.02988886833190918, -0.02898550033569336, -0.02808213233947754, -0.02717876434326172, -0.0262753963470459, -0.025372028350830078, -0.024468660354614258, -0.023565292358398438, -0.022661924362182617, -0.021758556365966797, -0.020855188369750977, -0.019951820373535156, -0.019048452377319336, -0.018145084381103516, -0.017241716384887695, -0.016338348388671875, -0.015434980392456055, -0.014531612396240234, -0.013628244400024414, -0.012724876403808594, -0.011821508407592773, -0.010918140411376953, -0.010014772415161133, -0.009111404418945312, -0.008208036422729492, -0.007304668426513672, -0.0064013004302978516, -0.005497932434082031, -0.004594564437866211, -0.0036911964416503906, -0.0027878284454345703, -0.00188446044921875, -0.0009810924530029297, -7.772445678710938e-05, 0.0008256435394287109, 0.0017290115356445312, 0.0026323795318603516, 0.003535747528076172, 0.004439115524291992, 0.0053424835205078125, 0.006245851516723633, 0.007149219512939453, 0.008052587509155273, 0.008955955505371094, 0.009859323501586914, 0.010762691497802734, 0.011666059494018555, 0.012569427490234375, 0.013472795486450195, 0.014376163482666016, 0.015279531478881836, 0.016182899475097656, 0.017086267471313477, 0.017989635467529297, 0.018893003463745117, 0.019796371459960938, 0.020699739456176758, 0.021603107452392578, 0.0225064754486084, 0.02340984344482422, 0.02431321144104004, 0.02521657943725586, 0.02611994743347168, 0.0270233154296875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 98.0, 881.0, 27.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1009111404418945, -2.0615293979644775, -2.0221476554870605, -1.9827659130096436, -1.943384051322937, -1.90400230884552, -1.864620566368103, -1.825238823890686, -1.785857081413269, -1.746475338935852, -1.707093596458435, -1.6677117347717285, -1.6283299922943115, -1.5889482498168945, -1.5495665073394775, -1.5101847648620605, -1.4708030223846436, -1.4314212799072266, -1.3920395374298096, -1.3526577949523926, -1.313275933265686, -1.273894190788269, -1.234512448310852, -1.195130705833435, -1.1557488441467285, -1.1163671016693115, -1.0769853591918945, -1.0376036167144775, -0.9982218146324158, -0.958840012550354, -0.919458270072937, -0.88007652759552, -0.840694785118103, -0.801313042640686, -0.7619312405586243, -0.7225494980812073, -0.6831677556037903, -0.6437859535217285, -0.6044042110443115, -0.5650224685668945, -0.5256407260894775, -0.48625895380973816, -0.44687721133232117, -0.4074954390525818, -0.3681136965751648, -0.3287319242954254, -0.28935015201568604, -0.24996840953826904, -0.21058663725852966, -0.17120487987995148, -0.1318231225013733, -0.09244135022163391, -0.053059592843055725, -0.013677835464477539, 0.02570393681526184, 0.06508567929267883, 0.10446745157241821, 0.1438492089509964, 0.18323096632957458, 0.22261273860931396, 0.26199448108673096, 0.30137625336647034, 0.3407580256462097, 0.3801397681236267, 0.4195215404033661]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 5.0, 9.0, 14.0, 12.0, 23.0, 40.0, 46.0, 71.0, 72.0, 84.0, 92.0, 104.0, 109.0, 88.0, 68.0, 44.0, 35.0, 27.0, 18.0, 8.0, 9.0, 5.0, 3.0, 5.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.23314106464385986, -0.22759222984313965, -0.22204339504241943, -0.21649456024169922, -0.210945725440979, -0.2053968906402588, -0.19984805583953857, -0.19429922103881836, -0.18875038623809814, -0.18320155143737793, -0.17765271663665771, -0.1721038818359375, -0.16655504703521729, -0.16100621223449707, -0.15545737743377686, -0.14990854263305664, -0.14435970783233643, -0.1388108730316162, -0.133262038230896, -0.12771320343017578, -0.12216436862945557, -0.11661553382873535, -0.11106669902801514, -0.10551786422729492, -0.09996902942657471, -0.09442019462585449, -0.08887135982513428, -0.08332252502441406, -0.07777369022369385, -0.07222485542297363, -0.06667602062225342, -0.0611271858215332, -0.05557835102081299, -0.05002951622009277, -0.04448068141937256, -0.038931846618652344, -0.03338301181793213, -0.027834177017211914, -0.0222853422164917, -0.016736507415771484, -0.01118767261505127, -0.005638837814331055, -9.000301361083984e-05, 0.005458831787109375, 0.01100766658782959, 0.016556501388549805, 0.02210533618927002, 0.027654170989990234, 0.03320300579071045, 0.038751840591430664, 0.04430067539215088, 0.049849510192871094, 0.05539834499359131, 0.06094717979431152, 0.06649601459503174, 0.07204484939575195, 0.07759368419647217, 0.08314251899719238, 0.0886913537979126, 0.09424018859863281, 0.09978902339935303, 0.10533785820007324, 0.11088669300079346, 0.11643552780151367, 0.12198436260223389]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 14.0, 27.0, 32.0, 39.0, 64.0, 120.0, 220.0, 598.0, 2081.0, 12187.0, 207273.0, 786294.0, 33623.0, 4310.0, 946.0, 333.0, 130.0, 80.0, 35.0, 34.0, 31.0, 8.0, 8.0, 13.0, 2.0, 2.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.235107421875, -0.2291126251220703, -0.22311782836914062, -0.21712303161621094, -0.21112823486328125, -0.20513343811035156, -0.19913864135742188, -0.1931438446044922, -0.1871490478515625, -0.1811542510986328, -0.17515945434570312, -0.16916465759277344, -0.16316986083984375, -0.15717506408691406, -0.15118026733398438, -0.1451854705810547, -0.139190673828125, -0.1331958770751953, -0.12720108032226562, -0.12120628356933594, -0.11521148681640625, -0.10921669006347656, -0.10322189331054688, -0.09722709655761719, -0.0912322998046875, -0.08523750305175781, -0.07924270629882812, -0.07324790954589844, -0.06725311279296875, -0.06125831604003906, -0.055263519287109375, -0.04926872253417969, -0.04327392578125, -0.03727912902832031, -0.031284332275390625, -0.025289535522460938, -0.01929473876953125, -0.013299942016601562, -0.007305145263671875, -0.0013103485107421875, 0.0046844482421875, 0.010679244995117188, 0.016674041748046875, 0.022668838500976562, 0.02866363525390625, 0.03465843200683594, 0.040653228759765625, 0.04664802551269531, 0.052642822265625, 0.05863761901855469, 0.06463241577148438, 0.07062721252441406, 0.07662200927734375, 0.08261680603027344, 0.08861160278320312, 0.09460639953613281, 0.1006011962890625, 0.10659599304199219, 0.11259078979492188, 0.11858558654785156, 0.12458038330078125, 0.13057518005371094, 0.13656997680664062, 0.1425647735595703, 0.1485595703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 4.0, 12.0, 14.0, 18.0, 50.0, 87.0, 165.0, 192.0, 197.0, 127.0, 70.0, 25.0, 18.0, 11.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.039520263671875, -0.038755059242248535, -0.03798985481262207, -0.037224650382995605, -0.03645944595336914, -0.035694241523742676, -0.03492903709411621, -0.034163832664489746, -0.03339862823486328, -0.032633423805236816, -0.03186821937561035, -0.031103014945983887, -0.030337810516357422, -0.029572606086730957, -0.028807401657104492, -0.028042197227478027, -0.027276992797851562, -0.026511788368225098, -0.025746583938598633, -0.024981379508972168, -0.024216175079345703, -0.02345097064971924, -0.022685766220092773, -0.02192056179046631, -0.021155357360839844, -0.02039015293121338, -0.019624948501586914, -0.01885974407196045, -0.018094539642333984, -0.01732933521270752, -0.016564130783081055, -0.01579892635345459, -0.015033721923828125, -0.01426851749420166, -0.013503313064575195, -0.01273810863494873, -0.011972904205322266, -0.0112076997756958, -0.010442495346069336, -0.009677290916442871, -0.008912086486816406, -0.008146882057189941, -0.0073816776275634766, -0.006616473197937012, -0.005851268768310547, -0.005086064338684082, -0.004320859909057617, -0.0035556554794311523, -0.0027904510498046875, -0.0020252466201782227, -0.0012600421905517578, -0.000494837760925293, 0.0002703666687011719, 0.0010355710983276367, 0.0018007755279541016, 0.0025659799575805664, 0.0033311843872070312, 0.004096388816833496, 0.004861593246459961, 0.005626797676086426, 0.006392002105712891, 0.0071572065353393555, 0.00792241096496582, 0.008687615394592285, 0.00945281982421875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 5.0, 11.0, 7.0, 9.0, 14.0, 25.0, 24.0, 43.0, 57.0, 58.0, 98.0, 149.0, 214.0, 354.0, 584.0, 1357.0, 4676.0, 24786.0, 170707.0, 627161.0, 183645.0, 26392.0, 4955.0, 1498.0, 624.0, 341.0, 191.0, 132.0, 107.0, 78.0, 59.0, 40.0, 33.0, 16.0, 17.0, 18.0, 10.0, 6.0, 7.0, 9.0, 5.0, 5.0, 3.0, 1.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.08367919921875, -0.081024169921875, -0.078369140625, -0.075714111328125, -0.07305908203125, -0.070404052734375, -0.0677490234375, -0.065093994140625, -0.06243896484375, -0.059783935546875, -0.05712890625, -0.054473876953125, -0.05181884765625, -0.049163818359375, -0.0465087890625, -0.043853759765625, -0.04119873046875, -0.038543701171875, -0.035888671875, -0.033233642578125, -0.03057861328125, -0.027923583984375, -0.0252685546875, -0.022613525390625, -0.01995849609375, -0.017303466796875, -0.0146484375, -0.011993408203125, -0.00933837890625, -0.006683349609375, -0.0040283203125, -0.001373291015625, 0.00128173828125, 0.003936767578125, 0.006591796875, 0.009246826171875, 0.01190185546875, 0.014556884765625, 0.0172119140625, 0.019866943359375, 0.02252197265625, 0.025177001953125, 0.02783203125, 0.030487060546875, 0.03314208984375, 0.035797119140625, 0.0384521484375, 0.041107177734375, 0.04376220703125, 0.046417236328125, 0.049072265625, 0.051727294921875, 0.05438232421875, 0.057037353515625, 0.0596923828125, 0.062347412109375, 0.06500244140625, 0.067657470703125, 0.0703125, 0.072967529296875, 0.07562255859375, 0.078277587890625, 0.0809326171875, 0.083587646484375, 0.08624267578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 16.0, 15.0, 17.0, 12.0, 16.0, 22.0, 29.0, 28.0, 20.0, 35.0, 38.0, 35.0, 39.0, 51.0, 48.0, 46.0, 41.0, 49.0, 38.0, 38.0, 31.0, 35.0, 34.0, 35.0, 31.0, 28.0, 22.0, 23.0, 19.0, 15.0, 11.0, 10.0, 11.0, 4.0, 5.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04315185546875, -0.041769981384277344, -0.04038810729980469, -0.03900623321533203, -0.037624359130859375, -0.03624248504638672, -0.03486061096191406, -0.033478736877441406, -0.03209686279296875, -0.030714988708496094, -0.029333114624023438, -0.02795124053955078, -0.026569366455078125, -0.02518749237060547, -0.023805618286132812, -0.022423744201660156, -0.0210418701171875, -0.019659996032714844, -0.018278121948242188, -0.01689624786376953, -0.015514373779296875, -0.014132499694824219, -0.012750625610351562, -0.011368751525878906, -0.00998687744140625, -0.008605003356933594, -0.0072231292724609375, -0.005841255187988281, -0.004459381103515625, -0.0030775070190429688, -0.0016956329345703125, -0.00031375885009765625, 0.001068115234375, 0.0024499893188476562, 0.0038318634033203125, 0.005213737487792969, 0.006595611572265625, 0.007977485656738281, 0.009359359741210938, 0.010741233825683594, 0.01212310791015625, 0.013504981994628906, 0.014886856079101562, 0.01626873016357422, 0.017650604248046875, 0.01903247833251953, 0.020414352416992188, 0.021796226501464844, 0.0231781005859375, 0.024559974670410156, 0.025941848754882812, 0.02732372283935547, 0.028705596923828125, 0.03008747100830078, 0.03146934509277344, 0.032851219177246094, 0.03423309326171875, 0.035614967346191406, 0.03699684143066406, 0.03837871551513672, 0.039760589599609375, 0.04114246368408203, 0.04252433776855469, 0.043906211853027344, 0.0452880859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 3.0, 5.0, 5.0, 5.0, 6.0, 12.0, 13.0, 20.0, 30.0, 50.0, 71.0, 152.0, 399.0, 1496.0, 12060.0, 546656.0, 474697.0, 10768.0, 1400.0, 354.0, 138.0, 73.0, 30.0, 24.0, 27.0, 13.0, 7.0, 9.0, 5.0, 7.0, 5.0, 3.0, 1.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18707656860351562, -0.18103790283203125, -0.17499923706054688, -0.1689605712890625, -0.16292190551757812, -0.15688323974609375, -0.15084457397460938, -0.144805908203125, -0.13876724243164062, -0.13272857666015625, -0.12668991088867188, -0.1206512451171875, -0.11461257934570312, -0.10857391357421875, -0.10253524780273438, -0.09649658203125, -0.09045791625976562, -0.08441925048828125, -0.07838058471679688, -0.0723419189453125, -0.06630325317382812, -0.06026458740234375, -0.054225921630859375, -0.048187255859375, -0.042148590087890625, -0.03610992431640625, -0.030071258544921875, -0.0240325927734375, -0.017993927001953125, -0.01195526123046875, -0.005916595458984375, 0.0001220703125, 0.006160736083984375, 0.01219940185546875, 0.018238067626953125, 0.0242767333984375, 0.030315399169921875, 0.03635406494140625, 0.042392730712890625, 0.048431396484375, 0.054470062255859375, 0.06050872802734375, 0.06654739379882812, 0.0725860595703125, 0.07862472534179688, 0.08466339111328125, 0.09070205688476562, 0.09674072265625, 0.10277938842773438, 0.10881805419921875, 0.11485671997070312, 0.1208953857421875, 0.12693405151367188, 0.13297271728515625, 0.13901138305664062, 0.145050048828125, 0.15108871459960938, 0.15712738037109375, 0.16316604614257812, 0.1692047119140625, 0.17524337768554688, 0.18128204345703125, 0.18732070922851562, 0.193359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 6.0, 12.0, 12.0, 10.0, 22.0, 27.0, 38.0, 53.0, 112.0, 272.0, 155.0, 64.0, 43.0, 43.0, 28.0, 24.0, 12.0, 17.0, 8.0, 4.0, 5.0, 1.0, 4.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006566047668457031, -0.0006337538361549377, -0.0006109029054641724, -0.000588051974773407, -0.0005652010440826416, -0.0005423501133918762, -0.0005194991827011108, -0.0004966482520103455, -0.0004737973213195801, -0.0004509463906288147, -0.0004280954599380493, -0.00040524452924728394, -0.00038239359855651855, -0.0003595426678657532, -0.0003366917371749878, -0.0003138408064842224, -0.00029098987579345703, -0.00026813894510269165, -0.00024528801441192627, -0.0002224370837211609, -0.0001995861530303955, -0.00017673522233963013, -0.00015388429164886475, -0.00013103336095809937, -0.00010818243026733398, -8.53314995765686e-05, -6.248056888580322e-05, -3.962963819503784e-05, -1.677870750427246e-05, 6.07222318649292e-06, 2.89231538772583e-05, 5.177408456802368e-05, 7.462501525878906e-05, 9.747594594955444e-05, 0.00012032687664031982, 0.0001431778073310852, 0.00016602873802185059, 0.00018887966871261597, 0.00021173059940338135, 0.00023458153009414673, 0.0002574324607849121, 0.0002802833914756775, 0.00030313432216644287, 0.00032598525285720825, 0.00034883618354797363, 0.000371687114238739, 0.0003945380449295044, 0.0004173889756202698, 0.00044023990631103516, 0.00046309083700180054, 0.0004859417676925659, 0.0005087926983833313, 0.0005316436290740967, 0.0005544945597648621, 0.0005773454904556274, 0.0006001964211463928, 0.0006230473518371582, 0.0006458982825279236, 0.000668749213218689, 0.0006916001439094543, 0.0007144510746002197, 0.0007373020052909851, 0.0007601529359817505, 0.0007830038666725159, 0.0008058547973632812]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 7.0, 7.0, 18.0, 17.0, 28.0, 54.0, 99.0, 217.0, 495.0, 1675.0, 7513.0, 76427.0, 872219.0, 79084.0, 7883.0, 1767.0, 542.0, 216.0, 100.0, 53.0, 35.0, 21.0, 14.0, 8.0, 7.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.185791015625, -0.1804065704345703, -0.17502212524414062, -0.16963768005371094, -0.16425323486328125, -0.15886878967285156, -0.15348434448242188, -0.1480998992919922, -0.1427154541015625, -0.1373310089111328, -0.13194656372070312, -0.12656211853027344, -0.12117767333984375, -0.11579322814941406, -0.11040878295898438, -0.10502433776855469, -0.099639892578125, -0.09425544738769531, -0.08887100219726562, -0.08348655700683594, -0.07810211181640625, -0.07271766662597656, -0.06733322143554688, -0.06194877624511719, -0.0565643310546875, -0.05117988586425781, -0.045795440673828125, -0.04041099548339844, -0.03502655029296875, -0.029642105102539062, -0.024257659912109375, -0.018873214721679688, -0.01348876953125, -0.008104324340820312, -0.002719879150390625, 0.0026645660400390625, 0.00804901123046875, 0.013433456420898438, 0.018817901611328125, 0.024202346801757812, 0.0295867919921875, 0.03497123718261719, 0.040355682373046875, 0.04574012756347656, 0.05112457275390625, 0.05650901794433594, 0.061893463134765625, 0.06727790832519531, 0.072662353515625, 0.07804679870605469, 0.08343124389648438, 0.08881568908691406, 0.09420013427734375, 0.09958457946777344, 0.10496902465820312, 0.11035346984863281, 0.1157379150390625, 0.12112236022949219, 0.12650680541992188, 0.13189125061035156, 0.13727569580078125, 0.14266014099121094, 0.14804458618164062, 0.1534290313720703, 0.1588134765625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 6.0, 3.0, 5.0, 7.0, 10.0, 16.0, 24.0, 61.0, 108.0, 183.0, 204.0, 158.0, 80.0, 44.0, 27.0, 16.0, 7.0, 3.0, 5.0, 1.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.088134765625, -0.08512687683105469, -0.08211898803710938, -0.07911109924316406, -0.07610321044921875, -0.07309532165527344, -0.07008743286132812, -0.06707954406738281, -0.0640716552734375, -0.06106376647949219, -0.058055877685546875, -0.05504798889160156, -0.05204010009765625, -0.04903221130371094, -0.046024322509765625, -0.04301643371582031, -0.040008544921875, -0.03700065612792969, -0.033992767333984375, -0.030984878540039062, -0.02797698974609375, -0.024969100952148438, -0.021961212158203125, -0.018953323364257812, -0.0159454345703125, -0.012937545776367188, -0.009929656982421875, -0.0069217681884765625, -0.00391387939453125, -0.0009059906005859375, 0.002101898193359375, 0.0051097869873046875, 0.00811767578125, 0.011125564575195312, 0.014133453369140625, 0.017141342163085938, 0.02014923095703125, 0.023157119750976562, 0.026165008544921875, 0.029172897338867188, 0.0321807861328125, 0.03518867492675781, 0.038196563720703125, 0.04120445251464844, 0.04421234130859375, 0.04722023010253906, 0.050228118896484375, 0.05323600769042969, 0.056243896484375, 0.05925178527832031, 0.062259674072265625, 0.06526756286621094, 0.06827545166015625, 0.07128334045410156, 0.07429122924804688, 0.07729911804199219, 0.0803070068359375, 0.08331489562988281, 0.08632278442382812, 0.08933067321777344, 0.09233856201171875, 0.09534645080566406, 0.09835433959960938, 0.10136222839355469, 0.1043701171875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 464.0, 543.0, 6.0], "bins": [-15.131683349609375, -14.887587547302246, -14.643492698669434, -14.399396896362305, -14.155301094055176, -13.911205291748047, -13.667110443115234, -13.423014640808105, -13.178918838500977, -12.934823036193848, -12.690728187561035, -12.446632385253906, -12.202536582946777, -11.958440780639648, -11.714345932006836, -11.470250129699707, -11.226155281066895, -10.982059478759766, -10.737964630126953, -10.493868827819824, -10.249773025512695, -10.005678176879883, -9.761582374572754, -9.517486572265625, -9.273390769958496, -9.029294967651367, -8.785200119018555, -8.541104316711426, -8.297008514404297, -8.052913665771484, -7.8088178634643555, -7.564722061157227, -7.320626735687256, -7.076531410217285, -6.832435607910156, -6.5883402824401855, -6.344244480133057, -6.100149154663086, -5.856053352355957, -5.611958026885986, -5.367862701416016, -5.123767375946045, -4.879671573638916, -4.635576248168945, -4.391480445861816, -4.147385120391846, -3.903289556503296, -3.659193992614746, -3.4150984287261963, -3.1710028648376465, -2.9269073009490967, -2.682811737060547, -2.438716411590576, -2.1946208477020264, -1.9505252838134766, -1.7064298391342163, -1.4623342752456665, -1.2182387113571167, -0.9741432666778564, -0.7300477027893066, -0.4859521985054016, -0.24185669422149658, 0.0022388696670532227, 0.24633431434631348, 0.49042990803718567]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 12.0, 15.0, 21.0, 29.0, 35.0, 64.0, 45.0, 97.0, 129.0, 121.0, 116.0, 96.0, 66.0, 61.0, 39.0, 28.0, 17.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1898953914642334, -1.1650880575180054, -1.1402807235717773, -1.1154735088348389, -1.0906661748886108, -1.0658588409423828, -1.0410515069961548, -1.0162441730499268, -0.9914369583129883, -0.9666296243667603, -0.941822350025177, -0.917015016078949, -0.8922077417373657, -0.8674004077911377, -0.8425930738449097, -0.8177857995033264, -0.7929784655570984, -0.7681711316108704, -0.7433638572692871, -0.7185565233230591, -0.6937492489814758, -0.6689419150352478, -0.6441346406936646, -0.6193273067474365, -0.5945199728012085, -0.5697126388549805, -0.5449053645133972, -0.5200980305671692, -0.49529075622558594, -0.4704834222793579, -0.44567611813545227, -0.42086881399154663, -0.39606159925460815, -0.3712542951107025, -0.3464469909667969, -0.32163965702056885, -0.2968323826789856, -0.27202504873275757, -0.24721774458885193, -0.2224104404449463, -0.19760313630104065, -0.172795832157135, -0.14798852801322937, -0.12318120896816254, -0.0983739048242569, -0.07356660068035126, -0.048759281635284424, -0.023951977491378784, 0.0008553266525268555, 0.025662634521722794, 0.05046994239091873, 0.07527725398540497, 0.10008455812931061, 0.12489186227321625, 0.14969918131828308, 0.17450648546218872, 0.19931378960609436, 0.22412109375, 0.24892839789390564, 0.2737357020378113, 0.2985430359840393, 0.32335031032562256, 0.3481576442718506, 0.3729649484157562, 0.39777225255966187]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 14.0, 19.0, 27.0, 68.0, 155.0, 393.0, 2212.0, 1263633.0, 2925797.0, 1610.0, 203.0, 61.0, 31.0, 18.0, 15.0, 7.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0], "bins": [-1.34375, -1.3168830871582031, -1.2900161743164062, -1.2631492614746094, -1.2362823486328125, -1.2094154357910156, -1.1825485229492188, -1.1556816101074219, -1.128814697265625, -1.1019477844238281, -1.0750808715820312, -1.0482139587402344, -1.0213470458984375, -0.9944801330566406, -0.9676132202148438, -0.9407463073730469, -0.91387939453125, -0.8870124816894531, -0.8601455688476562, -0.8332786560058594, -0.8064117431640625, -0.7795448303222656, -0.7526779174804688, -0.7258110046386719, -0.698944091796875, -0.6720771789550781, -0.6452102661132812, -0.6183433532714844, -0.5914764404296875, -0.5646095275878906, -0.5377426147460938, -0.5108757019042969, -0.4840087890625, -0.4571418762207031, -0.43027496337890625, -0.4034080505371094, -0.3765411376953125, -0.3496742248535156, -0.32280731201171875, -0.2959403991699219, -0.269073486328125, -0.24220657348632812, -0.21533966064453125, -0.18847274780273438, -0.1616058349609375, -0.13473892211914062, -0.10787200927734375, -0.08100509643554688, -0.05413818359375, -0.027271270751953125, -0.00040435791015625, 0.026462554931640625, 0.0533294677734375, 0.08019638061523438, 0.10706329345703125, 0.13393020629882812, 0.160797119140625, 0.18766403198242188, 0.21453094482421875, 0.24139785766601562, 0.2682647705078125, 0.2951316833496094, 0.32199859619140625, 0.3488655090332031, 0.375732421875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 7.0, 10.0, 7.0, 22.0, 55.0, 80.0, 142.0, 176.0, 202.0, 149.0, 72.0, 40.0, 17.0, 19.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.047271728515625, -0.04636061191558838, -0.04544949531555176, -0.04453837871551514, -0.043627262115478516, -0.042716145515441895, -0.04180502891540527, -0.04089391231536865, -0.03998279571533203, -0.03907167911529541, -0.03816056251525879, -0.03724944591522217, -0.03633832931518555, -0.035427212715148926, -0.034516096115112305, -0.033604979515075684, -0.03269386291503906, -0.03178274631500244, -0.03087162971496582, -0.0299605131149292, -0.029049396514892578, -0.028138279914855957, -0.027227163314819336, -0.026316046714782715, -0.025404930114746094, -0.024493813514709473, -0.02358269691467285, -0.02267158031463623, -0.02176046371459961, -0.02084934711456299, -0.019938230514526367, -0.019027113914489746, -0.018115997314453125, -0.017204880714416504, -0.016293764114379883, -0.015382647514343262, -0.01447153091430664, -0.01356041431427002, -0.012649297714233398, -0.011738181114196777, -0.010827064514160156, -0.009915947914123535, -0.009004831314086914, -0.008093714714050293, -0.007182598114013672, -0.006271481513977051, -0.00536036491394043, -0.004449248313903809, -0.0035381317138671875, -0.0026270151138305664, -0.0017158985137939453, -0.0008047819137573242, 0.00010633468627929688, 0.001017451286315918, 0.001928567886352539, 0.00283968448638916, 0.0037508010864257812, 0.004661917686462402, 0.0055730342864990234, 0.0064841508865356445, 0.007395267486572266, 0.008306384086608887, 0.009217500686645508, 0.010128617286682129, 0.01103973388671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 16.0, 33.0, 80.0, 139.0, 229.0, 316.0, 2862.0, 4189219.0, 954.0, 226.0, 114.0, 42.0, 34.0, 16.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.2890625, -2.2426986694335938, -2.1963348388671875, -2.1499710083007812, -2.103607177734375, -2.0572433471679688, -2.0108795166015625, -1.9645156860351562, -1.91815185546875, -1.8717880249023438, -1.8254241943359375, -1.7790603637695312, -1.732696533203125, -1.6863327026367188, -1.6399688720703125, -1.5936050415039062, -1.5472412109375, -1.5008773803710938, -1.4545135498046875, -1.4081497192382812, -1.361785888671875, -1.3154220581054688, -1.2690582275390625, -1.2226943969726562, -1.17633056640625, -1.1299667358398438, -1.0836029052734375, -1.0372390747070312, -0.990875244140625, -0.9445114135742188, -0.8981475830078125, -0.8517837524414062, -0.805419921875, -0.7590560913085938, -0.7126922607421875, -0.6663284301757812, -0.619964599609375, -0.5736007690429688, -0.5272369384765625, -0.48087310791015625, -0.43450927734375, -0.38814544677734375, -0.3417816162109375, -0.29541778564453125, -0.249053955078125, -0.20269012451171875, -0.1563262939453125, -0.10996246337890625, -0.0635986328125, -0.01723480224609375, 0.0291290283203125, 0.07549285888671875, 0.121856689453125, 0.16822052001953125, 0.2145843505859375, 0.26094818115234375, 0.30731201171875, 0.35367584228515625, 0.4000396728515625, 0.44640350341796875, 0.492767333984375, 0.5391311645507812, 0.5854949951171875, 0.6318588256835938, 0.67822265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 25.0, 442.0, 3374.0, 199.0, 26.0, 14.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291748046875, -0.28606414794921875, -0.2803802490234375, -0.27469635009765625, -0.269012451171875, -0.26332855224609375, -0.2576446533203125, -0.25196075439453125, -0.24627685546875, -0.24059295654296875, -0.2349090576171875, -0.22922515869140625, -0.223541259765625, -0.21785736083984375, -0.2121734619140625, -0.20648956298828125, -0.2008056640625, -0.19512176513671875, -0.1894378662109375, -0.18375396728515625, -0.178070068359375, -0.17238616943359375, -0.1667022705078125, -0.16101837158203125, -0.15533447265625, -0.14965057373046875, -0.1439666748046875, -0.13828277587890625, -0.132598876953125, -0.12691497802734375, -0.1212310791015625, -0.11554718017578125, -0.10986328125, -0.10417938232421875, -0.0984954833984375, -0.09281158447265625, -0.087127685546875, -0.08144378662109375, -0.0757598876953125, -0.07007598876953125, -0.06439208984375, -0.05870819091796875, -0.0530242919921875, -0.04734039306640625, -0.041656494140625, -0.03597259521484375, -0.0302886962890625, -0.02460479736328125, -0.0189208984375, -0.01323699951171875, -0.0075531005859375, -0.00186920166015625, 0.003814697265625, 0.00949859619140625, 0.0151824951171875, 0.02086639404296875, 0.02655029296875, 0.03223419189453125, 0.0379180908203125, 0.04360198974609375, 0.049285888671875, 0.05496978759765625, 0.0606536865234375, 0.06633758544921875, 0.072021484375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 17.0, 102.0, 752.0, 118.0, 14.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.599658489227295, -2.5511059761047363, -2.5025534629821777, -2.454000949859619, -2.4054486751556396, -2.356896162033081, -2.3083436489105225, -2.259791135787964, -2.2112386226654053, -2.1626861095428467, -2.114133596420288, -2.0655810832977295, -2.01702880859375, -1.9684761762619019, -1.9199237823486328, -1.8713712692260742, -1.8228187561035156, -1.774266242980957, -1.725713849067688, -1.6771613359451294, -1.6286088228225708, -1.5800563097000122, -1.5315039157867432, -1.4829514026641846, -1.4343990087509155, -1.385846495628357, -1.337294101715088, -1.2887415885925293, -1.2401890754699707, -1.191636562347412, -1.143084168434143, -1.0945316553115845, -1.0459792613983154, -0.9974268078804016, -0.948874294757843, -0.9003218412399292, -0.8517693281173706, -0.8032168745994568, -0.754664421081543, -0.7061119079589844, -0.6575593948364258, -0.609006941318512, -0.5604544281959534, -0.5119019746780396, -0.46334946155548096, -0.41479700803756714, -0.36624452471733093, -0.3176920413970947, -0.26913952827453613, -0.22058704495429993, -0.17203456163406372, -0.12348209321498871, -0.0749296098947525, -0.026377126574516296, 0.022175341844558716, 0.07072782516479492, 0.11928030848503113, 0.16783279180526733, 0.21638527512550354, 0.26493775844573975, 0.31349021196365356, 0.36204272508621216, 0.410595178604126, 0.4591476619243622, 0.5077001452445984]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 26.0, 29.0, 65.0, 88.0, 152.0, 169.0, 157.0, 112.0, 89.0, 52.0, 28.0, 13.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9455681443214417, -0.915765643119812, -0.8859630823135376, -0.856160581111908, -0.8263580203056335, -0.7965555191040039, -0.7667529582977295, -0.7369504570960999, -0.7071479558944702, -0.6773454546928406, -0.6475428938865662, -0.6177403926849365, -0.5879378318786621, -0.5581353306770325, -0.5283328294754028, -0.4985302686691284, -0.468727707862854, -0.438925176858902, -0.40912264585494995, -0.3793201446533203, -0.3495175838470459, -0.31971508264541626, -0.28991255164146423, -0.2601100206375122, -0.23030748963356018, -0.20050495862960815, -0.17070242762565613, -0.1408999115228653, -0.11109738051891327, -0.08129484951496124, -0.05149233341217041, -0.021689802408218384, 0.008112728595733643, 0.03791525587439537, 0.0677177831530571, 0.09752030670642853, 0.12732283771038055, 0.15712536871433258, 0.1869278848171234, 0.21673041582107544, 0.24653294682502747, 0.2763354778289795, 0.3061380088329315, 0.33594053983688354, 0.3657430410385132, 0.3955456018447876, 0.42534810304641724, 0.45515063405036926, 0.4849531650543213, 0.5147556662559509, 0.5445582270622253, 0.574360728263855, 0.6041632890701294, 0.633965790271759, 0.6637682914733887, 0.6935708522796631, 0.7233734130859375, 0.7531759142875671, 0.7829784750938416, 0.8127809762954712, 0.8425835371017456, 0.8723860383033752, 0.9021885395050049, 0.9319911003112793, 0.9617936015129089]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 11.0, 9.0, 16.0, 13.0, 36.0, 34.0, 62.0, 82.0, 179.0, 420.0, 1314.0, 5734.0, 135560.0, 880894.0, 20335.0, 2555.0, 747.0, 252.0, 108.0, 67.0, 51.0, 18.0, 19.0, 15.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.347412109375, -0.33629608154296875, -0.3251800537109375, -0.31406402587890625, -0.302947998046875, -0.29183197021484375, -0.2807159423828125, -0.26959991455078125, -0.25848388671875, -0.24736785888671875, -0.2362518310546875, -0.22513580322265625, -0.214019775390625, -0.20290374755859375, -0.1917877197265625, -0.18067169189453125, -0.1695556640625, -0.15843963623046875, -0.1473236083984375, -0.13620758056640625, -0.125091552734375, -0.11397552490234375, -0.1028594970703125, -0.09174346923828125, -0.08062744140625, -0.06951141357421875, -0.0583953857421875, -0.04727935791015625, -0.036163330078125, -0.02504730224609375, -0.0139312744140625, -0.00281524658203125, 0.00830078125, 0.01941680908203125, 0.0305328369140625, 0.04164886474609375, 0.052764892578125, 0.06388092041015625, 0.0749969482421875, 0.08611297607421875, 0.09722900390625, 0.10834503173828125, 0.1194610595703125, 0.13057708740234375, 0.141693115234375, 0.15280914306640625, 0.1639251708984375, 0.17504119873046875, 0.1861572265625, 0.19727325439453125, 0.2083892822265625, 0.21950531005859375, 0.230621337890625, 0.24173736572265625, 0.2528533935546875, 0.26396942138671875, 0.27508544921875, 0.28620147705078125, 0.2973175048828125, 0.30843353271484375, 0.319549560546875, 0.33066558837890625, 0.3417816162109375, 0.35289764404296875, 0.364013671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 38.0, 60.0, 91.0, 117.0, 151.0, 165.0, 142.0, 92.0, 67.0, 33.0, 13.0, 13.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.07330322265625, -0.0717768669128418, -0.0702505111694336, -0.06872415542602539, -0.06719779968261719, -0.06567144393920898, -0.06414508819580078, -0.06261873245239258, -0.061092376708984375, -0.05956602096557617, -0.05803966522216797, -0.056513309478759766, -0.05498695373535156, -0.05346059799194336, -0.051934242248535156, -0.05040788650512695, -0.04888153076171875, -0.04735517501831055, -0.045828819274902344, -0.04430246353149414, -0.04277610778808594, -0.041249752044677734, -0.03972339630126953, -0.03819704055786133, -0.036670684814453125, -0.03514432907104492, -0.03361797332763672, -0.032091617584228516, -0.030565261840820312, -0.02903890609741211, -0.027512550354003906, -0.025986194610595703, -0.0244598388671875, -0.022933483123779297, -0.021407127380371094, -0.01988077163696289, -0.018354415893554688, -0.016828060150146484, -0.015301704406738281, -0.013775348663330078, -0.012248992919921875, -0.010722637176513672, -0.009196281433105469, -0.007669925689697266, -0.0061435699462890625, -0.004617214202880859, -0.0030908584594726562, -0.0015645027160644531, -3.814697265625e-05, 0.0014882087707519531, 0.0030145645141601562, 0.004540920257568359, 0.0060672760009765625, 0.007593631744384766, 0.009119987487792969, 0.010646343231201172, 0.012172698974609375, 0.013699054718017578, 0.015225410461425781, 0.016751766204833984, 0.018278121948242188, 0.01980447769165039, 0.021330833435058594, 0.022857189178466797, 0.024383544921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 6.0, 12.0, 23.0, 21.0, 30.0, 33.0, 37.0, 61.0, 87.0, 211.0, 533.0, 2422.0, 23597.0, 564878.0, 435275.0, 18270.0, 2000.0, 481.0, 191.0, 102.0, 60.0, 50.0, 42.0, 15.0, 19.0, 9.0, 15.0, 13.0, 8.0, 8.0, 4.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1685791015625, -0.16275596618652344, -0.15693283081054688, -0.1511096954345703, -0.14528656005859375, -0.1394634246826172, -0.13364028930664062, -0.12781715393066406, -0.1219940185546875, -0.11617088317871094, -0.11034774780273438, -0.10452461242675781, -0.09870147705078125, -0.09287834167480469, -0.08705520629882812, -0.08123207092285156, -0.075408935546875, -0.06958580017089844, -0.06376266479492188, -0.05793952941894531, -0.05211639404296875, -0.04629325866699219, -0.040470123291015625, -0.03464698791503906, -0.0288238525390625, -0.023000717163085938, -0.017177581787109375, -0.011354446411132812, -0.00553131103515625, 0.0002918243408203125, 0.006114959716796875, 0.011938095092773438, 0.01776123046875, 0.023584365844726562, 0.029407501220703125, 0.03523063659667969, 0.04105377197265625, 0.04687690734863281, 0.052700042724609375, 0.05852317810058594, 0.0643463134765625, 0.07016944885253906, 0.07599258422851562, 0.08181571960449219, 0.08763885498046875, 0.09346199035644531, 0.09928512573242188, 0.10510826110839844, 0.110931396484375, 0.11675453186035156, 0.12257766723632812, 0.1284008026123047, 0.13422393798828125, 0.1400470733642578, 0.14587020874023438, 0.15169334411621094, 0.1575164794921875, 0.16333961486816406, 0.16916275024414062, 0.1749858856201172, 0.18080902099609375, 0.1866321563720703, 0.19245529174804688, 0.19827842712402344, 0.2041015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 5.0, 5.0, 8.0, 11.0, 15.0, 17.0, 20.0, 32.0, 16.0, 27.0, 29.0, 57.0, 40.0, 38.0, 40.0, 56.0, 41.0, 54.0, 65.0, 46.0, 40.0, 37.0, 41.0, 47.0, 29.0, 24.0, 26.0, 24.0, 18.0, 21.0, 10.0, 14.0, 12.0, 5.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07828044891357422, -0.07568931579589844, -0.07309818267822266, -0.07050704956054688, -0.0679159164428711, -0.06532478332519531, -0.06273365020751953, -0.06014251708984375, -0.05755138397216797, -0.05496025085449219, -0.052369117736816406, -0.049777984619140625, -0.047186851501464844, -0.04459571838378906, -0.04200458526611328, -0.0394134521484375, -0.03682231903076172, -0.03423118591308594, -0.031640052795410156, -0.029048919677734375, -0.026457786560058594, -0.023866653442382812, -0.02127552032470703, -0.01868438720703125, -0.01609325408935547, -0.013502120971679688, -0.010910987854003906, -0.008319854736328125, -0.005728721618652344, -0.0031375885009765625, -0.0005464553833007812, 0.002044677734375, 0.004635810852050781, 0.0072269439697265625, 0.009818077087402344, 0.012409210205078125, 0.015000343322753906, 0.017591476440429688, 0.02018260955810547, 0.02277374267578125, 0.02536487579345703, 0.027956008911132812, 0.030547142028808594, 0.033138275146484375, 0.035729408264160156, 0.03832054138183594, 0.04091167449951172, 0.0435028076171875, 0.04609394073486328, 0.04868507385253906, 0.051276206970214844, 0.053867340087890625, 0.056458473205566406, 0.05904960632324219, 0.06164073944091797, 0.06423187255859375, 0.06682300567626953, 0.06941413879394531, 0.0720052719116211, 0.07459640502929688, 0.07718753814697266, 0.07977867126464844, 0.08236980438232422, 0.0849609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 10.0, 9.0, 13.0, 14.0, 29.0, 53.0, 82.0, 146.0, 261.0, 549.0, 1172.0, 3538.0, 14433.0, 131085.0, 696585.0, 176219.0, 17810.0, 3974.0, 1362.0, 559.0, 265.0, 137.0, 77.0, 39.0, 40.0, 18.0, 14.0, 13.0, 8.0, 5.0, 7.0, 7.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0792236328125, -0.07644939422607422, -0.07367515563964844, -0.07090091705322266, -0.06812667846679688, -0.0653524398803711, -0.06257820129394531, -0.05980396270751953, -0.05702972412109375, -0.05425548553466797, -0.05148124694824219, -0.048707008361816406, -0.045932769775390625, -0.043158531188964844, -0.04038429260253906, -0.03761005401611328, -0.0348358154296875, -0.03206157684326172, -0.029287338256835938, -0.026513099670410156, -0.023738861083984375, -0.020964622497558594, -0.018190383911132812, -0.015416145324707031, -0.01264190673828125, -0.009867668151855469, -0.0070934295654296875, -0.004319190979003906, -0.001544952392578125, 0.0012292861938476562, 0.0040035247802734375, 0.006777763366699219, 0.009552001953125, 0.012326240539550781, 0.015100479125976562, 0.017874717712402344, 0.020648956298828125, 0.023423194885253906, 0.026197433471679688, 0.02897167205810547, 0.03174591064453125, 0.03452014923095703, 0.03729438781738281, 0.040068626403808594, 0.042842864990234375, 0.045617103576660156, 0.04839134216308594, 0.05116558074951172, 0.0539398193359375, 0.05671405792236328, 0.05948829650878906, 0.062262535095214844, 0.06503677368164062, 0.0678110122680664, 0.07058525085449219, 0.07335948944091797, 0.07613372802734375, 0.07890796661376953, 0.08168220520019531, 0.0844564437866211, 0.08723068237304688, 0.09000492095947266, 0.09277915954589844, 0.09555339813232422, 0.09832763671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 5.0, 7.0, 6.0, 11.0, 10.0, 18.0, 14.0, 18.0, 27.0, 39.0, 36.0, 52.0, 64.0, 96.0, 88.0, 90.0, 74.0, 63.0, 47.0, 40.0, 30.0, 18.0, 20.0, 26.0, 15.0, 19.0, 8.0, 3.0, 6.0, 4.0, 6.0, 3.0, 6.0, 4.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00020492076873779297, -0.00019802898168563843, -0.0001911371946334839, -0.00018424540758132935, -0.0001773536205291748, -0.00017046183347702026, -0.00016357004642486572, -0.00015667825937271118, -0.00014978647232055664, -0.0001428946852684021, -0.00013600289821624756, -0.00012911111116409302, -0.00012221932411193848, -0.00011532753705978394, -0.0001084357500076294, -0.00010154396295547485, -9.465217590332031e-05, -8.776038885116577e-05, -8.086860179901123e-05, -7.397681474685669e-05, -6.708502769470215e-05, -6.019324064254761e-05, -5.3301453590393066e-05, -4.6409666538238525e-05, -3.9517879486083984e-05, -3.262609243392944e-05, -2.5734305381774902e-05, -1.884251832962036e-05, -1.195073127746582e-05, -5.058944225311279e-06, 1.8328428268432617e-06, 8.724629878997803e-06, 1.5616416931152344e-05, 2.2508203983306885e-05, 2.9399991035461426e-05, 3.629177808761597e-05, 4.318356513977051e-05, 5.007535219192505e-05, 5.696713924407959e-05, 6.385892629623413e-05, 7.075071334838867e-05, 7.764250040054321e-05, 8.453428745269775e-05, 9.14260745048523e-05, 9.831786155700684e-05, 0.00010520964860916138, 0.00011210143566131592, 0.00011899322271347046, 0.000125885009765625, 0.00013277679681777954, 0.00013966858386993408, 0.00014656037092208862, 0.00015345215797424316, 0.0001603439450263977, 0.00016723573207855225, 0.0001741275191307068, 0.00018101930618286133, 0.00018791109323501587, 0.0001948028802871704, 0.00020169466733932495, 0.0002085864543914795, 0.00021547824144363403, 0.00022237002849578857, 0.00022926181554794312, 0.00023615360260009766]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 9.0, 10.0, 13.0, 24.0, 66.0, 142.0, 517.0, 2625.0, 49440.0, 946997.0, 45241.0, 2628.0, 567.0, 162.0, 58.0, 34.0, 9.0, 9.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1663818359375, -0.16092491149902344, -0.15546798706054688, -0.1500110626220703, -0.14455413818359375, -0.1390972137451172, -0.13364028930664062, -0.12818336486816406, -0.1227264404296875, -0.11726951599121094, -0.11181259155273438, -0.10635566711425781, -0.10089874267578125, -0.09544181823730469, -0.08998489379882812, -0.08452796936035156, -0.079071044921875, -0.07361412048339844, -0.06815719604492188, -0.06270027160644531, -0.05724334716796875, -0.05178642272949219, -0.046329498291015625, -0.04087257385253906, -0.0354156494140625, -0.029958724975585938, -0.024501800537109375, -0.019044876098632812, -0.01358795166015625, -0.008131027221679688, -0.002674102783203125, 0.0027828216552734375, 0.00823974609375, 0.013696670532226562, 0.019153594970703125, 0.024610519409179688, 0.03006744384765625, 0.03552436828613281, 0.040981292724609375, 0.04643821716308594, 0.0518951416015625, 0.05735206604003906, 0.06280899047851562, 0.06826591491699219, 0.07372283935546875, 0.07917976379394531, 0.08463668823242188, 0.09009361267089844, 0.095550537109375, 0.10100746154785156, 0.10646438598632812, 0.11192131042480469, 0.11737823486328125, 0.12283515930175781, 0.12829208374023438, 0.13374900817871094, 0.1392059326171875, 0.14466285705566406, 0.15011978149414062, 0.1555767059326172, 0.16103363037109375, 0.1664905548095703, 0.17194747924804688, 0.17740440368652344, 0.182861328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 14.0, 9.0, 22.0, 32.0, 49.0, 86.0, 129.0, 155.0, 173.0, 124.0, 89.0, 46.0, 37.0, 19.0, 11.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.06193828582763672, -0.05954551696777344, -0.057152748107910156, -0.054759979248046875, -0.052367210388183594, -0.04997444152832031, -0.04758167266845703, -0.04518890380859375, -0.04279613494873047, -0.04040336608886719, -0.038010597229003906, -0.035617828369140625, -0.033225059509277344, -0.030832290649414062, -0.02843952178955078, -0.0260467529296875, -0.02365398406982422, -0.021261215209960938, -0.018868446350097656, -0.016475677490234375, -0.014082908630371094, -0.011690139770507812, -0.009297370910644531, -0.00690460205078125, -0.004511833190917969, -0.0021190643310546875, 0.00027370452880859375, 0.002666473388671875, 0.005059242248535156, 0.0074520111083984375, 0.009844779968261719, 0.012237548828125, 0.014630317687988281, 0.017023086547851562, 0.019415855407714844, 0.021808624267578125, 0.024201393127441406, 0.026594161987304688, 0.02898693084716797, 0.03137969970703125, 0.03377246856689453, 0.03616523742675781, 0.038558006286621094, 0.040950775146484375, 0.043343544006347656, 0.04573631286621094, 0.04812908172607422, 0.0505218505859375, 0.05291461944580078, 0.05530738830566406, 0.057700157165527344, 0.060092926025390625, 0.062485694885253906, 0.06487846374511719, 0.06727123260498047, 0.06966400146484375, 0.07205677032470703, 0.07444953918457031, 0.0768423080444336, 0.07923507690429688, 0.08162784576416016, 0.08402061462402344, 0.08641338348388672, 0.08880615234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 30.0, 129.0, 399.0, 313.0, 86.0, 29.0, 12.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.047525405883789, -2.002643346786499, -1.9577611684799194, -1.9128791093826294, -1.8679970502853394, -1.8231148719787598, -1.7782328128814697, -1.7333507537841797, -1.6884686946868896, -1.6435866355895996, -1.59870445728302, -1.55382239818573, -1.50894033908844, -1.4640581607818604, -1.4191761016845703, -1.3742940425872803, -1.3294118642807007, -1.2845298051834106, -1.239647626876831, -1.194765567779541, -1.149883508682251, -1.105001449584961, -1.0601192712783813, -1.0152372121810913, -0.9703550934791565, -0.9254729747772217, -0.8805909156799316, -0.8357087969779968, -0.790826678276062, -0.745944619178772, -0.7010625004768372, -0.6561803817749023, -0.6112982034683228, -0.5664160847663879, -0.5215340256690979, -0.4766519069671631, -0.43176981806755066, -0.38688772916793823, -0.3420056104660034, -0.297123521566391, -0.25224143266677856, -0.20735934376716614, -0.16247723996639252, -0.1175951361656189, -0.07271304726600647, -0.027830958366394043, 0.01705116033554077, 0.0619332492351532, 0.10681533813476562, 0.15169742703437805, 0.19657953083515167, 0.2414616346359253, 0.2863437235355377, 0.33122581243515015, 0.37610793113708496, 0.4209900200366974, 0.4658721089363098, 0.5107542276382446, 0.5556362867355347, 0.6005184054374695, 0.6454005241394043, 0.6902825832366943, 0.7351647019386292, 0.780046820640564, 0.824928879737854]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 6.0, 11.0, 18.0, 15.0, 26.0, 33.0, 34.0, 45.0, 39.0, 55.0, 51.0, 47.0, 67.0, 44.0, 58.0, 46.0, 51.0, 55.0, 52.0, 48.0, 40.0, 29.0, 18.0, 22.0, 17.0, 14.0, 14.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49388551712036133, -0.4740165174007416, -0.4541475176811218, -0.4342785179615021, -0.4144095182418823, -0.3945405185222626, -0.3746715188026428, -0.35480254888534546, -0.3349335193634033, -0.31506451964378357, -0.2951955199241638, -0.27532652020454407, -0.2554575204849243, -0.23558852076530457, -0.215719535946846, -0.19585053622722626, -0.1759815514087677, -0.15611255168914795, -0.1362435519695282, -0.11637455970048904, -0.0965055599808693, -0.07663656026124954, -0.05676756799221039, -0.03689856827259064, -0.017029568552970886, 0.0028394293040037155, 0.022708427160978317, 0.04257742315530777, 0.06244642287492752, 0.08231542259454727, 0.10218441486358643, 0.12205341458320618, 0.14192241430282593, 0.16179141402244568, 0.18166041374206543, 0.20152941346168518, 0.22139841318130493, 0.24126741290092468, 0.26113641262054443, 0.2810053825378418, 0.30087441205978394, 0.3207434117794037, 0.34061241149902344, 0.3604814112186432, 0.38035041093826294, 0.4002194106578827, 0.42008841037750244, 0.4399573802947998, 0.45982638001441956, 0.4796953797340393, 0.49956437945365906, 0.5194333791732788, 0.5393023490905762, 0.5591713786125183, 0.5790403485298157, 0.5989093780517578, 0.6187783479690552, 0.6386473178863525, 0.6585163474082947, 0.678385317325592, 0.6982543468475342, 0.7181233167648315, 0.7379923462867737, 0.757861316204071, 0.7777303457260132]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 15.0, 15.0, 16.0, 25.0, 29.0, 44.0, 68.0, 71.0, 134.0, 188.0, 385.0, 832.0, 2252.0, 9804.0, 140696.0, 3960268.0, 70477.0, 6758.0, 1389.0, 475.0, 195.0, 74.0, 26.0, 13.0, 11.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.52978515625, -0.5190601348876953, -0.5083351135253906, -0.49761009216308594, -0.48688507080078125, -0.47616004943847656, -0.4654350280761719, -0.4547100067138672, -0.4439849853515625, -0.4332599639892578, -0.4225349426269531, -0.41180992126464844, -0.40108489990234375, -0.39035987854003906, -0.3796348571777344, -0.3689098358154297, -0.358184814453125, -0.3474597930908203, -0.3367347717285156, -0.32600975036621094, -0.31528472900390625, -0.30455970764160156, -0.2938346862792969, -0.2831096649169922, -0.2723846435546875, -0.2616596221923828, -0.2509346008300781, -0.24020957946777344, -0.22948455810546875, -0.21875953674316406, -0.20803451538085938, -0.1973094940185547, -0.18658447265625, -0.1758594512939453, -0.16513442993164062, -0.15440940856933594, -0.14368438720703125, -0.13295936584472656, -0.12223434448242188, -0.11150932312011719, -0.1007843017578125, -0.09005928039550781, -0.07933425903320312, -0.06860923767089844, -0.05788421630859375, -0.04715919494628906, -0.036434173583984375, -0.025709152221679688, -0.014984130859375, -0.0042591094970703125, 0.006465911865234375, 0.017190933227539062, 0.02791595458984375, 0.03864097595214844, 0.049365997314453125, 0.06009101867675781, 0.0708160400390625, 0.08154106140136719, 0.09226608276367188, 0.10299110412597656, 0.11371612548828125, 0.12444114685058594, 0.13516616821289062, 0.1458911895751953, 0.1566162109375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 8.0, 10.0, 27.0, 54.0, 98.0, 106.0, 155.0, 151.0, 130.0, 115.0, 56.0, 43.0, 28.0, 13.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07476806640625, -0.07321715354919434, -0.07166624069213867, -0.07011532783508301, -0.06856441497802734, -0.06701350212097168, -0.06546258926391602, -0.06391167640686035, -0.06236076354980469, -0.06080985069274902, -0.05925893783569336, -0.057708024978637695, -0.05615711212158203, -0.05460619926452637, -0.0530552864074707, -0.05150437355041504, -0.049953460693359375, -0.04840254783630371, -0.04685163497924805, -0.04530072212219238, -0.04374980926513672, -0.042198896408081055, -0.04064798355102539, -0.03909707069396973, -0.03754615783691406, -0.0359952449798584, -0.034444332122802734, -0.03289341926574707, -0.031342506408691406, -0.029791593551635742, -0.028240680694580078, -0.026689767837524414, -0.02513885498046875, -0.023587942123413086, -0.022037029266357422, -0.020486116409301758, -0.018935203552246094, -0.01738429069519043, -0.015833377838134766, -0.014282464981079102, -0.012731552124023438, -0.011180639266967773, -0.00962972640991211, -0.008078813552856445, -0.006527900695800781, -0.004976987838745117, -0.003426074981689453, -0.001875162124633789, -0.000324249267578125, 0.001226663589477539, 0.002777576446533203, 0.004328489303588867, 0.005879402160644531, 0.007430315017700195, 0.00898122787475586, 0.010532140731811523, 0.012083053588867188, 0.013633966445922852, 0.015184879302978516, 0.01673579216003418, 0.018286705017089844, 0.019837617874145508, 0.021388530731201172, 0.022939443588256836, 0.0244903564453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 22.0, 68.0, 125.0, 448.0, 5098.0, 4186552.0, 1630.0, 224.0, 78.0, 28.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.27734375, -2.2312393188476562, -2.1851348876953125, -2.1390304565429688, -2.092926025390625, -2.0468215942382812, -2.0007171630859375, -1.9546127319335938, -1.90850830078125, -1.8624038696289062, -1.8162994384765625, -1.7701950073242188, -1.724090576171875, -1.6779861450195312, -1.6318817138671875, -1.5857772827148438, -1.5396728515625, -1.4935684204101562, -1.4474639892578125, -1.4013595581054688, -1.355255126953125, -1.3091506958007812, -1.2630462646484375, -1.2169418334960938, -1.17083740234375, -1.1247329711914062, -1.0786285400390625, -1.0325241088867188, -0.986419677734375, -0.9403152465820312, -0.8942108154296875, -0.8481063842773438, -0.802001953125, -0.7558975219726562, -0.7097930908203125, -0.6636886596679688, -0.617584228515625, -0.5714797973632812, -0.5253753662109375, -0.47927093505859375, -0.43316650390625, -0.38706207275390625, -0.3409576416015625, -0.29485321044921875, -0.248748779296875, -0.20264434814453125, -0.1565399169921875, -0.11043548583984375, -0.0643310546875, -0.01822662353515625, 0.0278778076171875, 0.07398223876953125, 0.120086669921875, 0.16619110107421875, 0.2122955322265625, 0.25839996337890625, 0.30450439453125, 0.35060882568359375, 0.3967132568359375, 0.44281768798828125, 0.488922119140625, 0.5350265502929688, 0.5811309814453125, 0.6272354125976562, 0.67333984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 8.0, 14.0, 38.0, 207.0, 2491.0, 1110.0, 133.0, 53.0, 17.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.239990234375, -0.23544931411743164, -0.23090839385986328, -0.22636747360229492, -0.22182655334472656, -0.2172856330871582, -0.21274471282958984, -0.20820379257202148, -0.20366287231445312, -0.19912195205688477, -0.1945810317993164, -0.19004011154174805, -0.1854991912841797, -0.18095827102661133, -0.17641735076904297, -0.1718764305114746, -0.16733551025390625, -0.1627945899963379, -0.15825366973876953, -0.15371274948120117, -0.1491718292236328, -0.14463090896606445, -0.1400899887084961, -0.13554906845092773, -0.13100814819335938, -0.12646722793579102, -0.12192630767822266, -0.1173853874206543, -0.11284446716308594, -0.10830354690551758, -0.10376262664794922, -0.09922170639038086, -0.0946807861328125, -0.09013986587524414, -0.08559894561767578, -0.08105802536010742, -0.07651710510253906, -0.0719761848449707, -0.06743526458740234, -0.06289434432983398, -0.058353424072265625, -0.053812503814697266, -0.049271583557128906, -0.04473066329956055, -0.04018974304199219, -0.03564882278442383, -0.03110790252685547, -0.02656698226928711, -0.02202606201171875, -0.01748514175415039, -0.012944221496582031, -0.008403301239013672, -0.0038623809814453125, 0.0006785392761230469, 0.005219459533691406, 0.009760379791259766, 0.014301300048828125, 0.018842220306396484, 0.023383140563964844, 0.027924060821533203, 0.03246498107910156, 0.03700590133666992, 0.04154682159423828, 0.04608774185180664, 0.050628662109375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 14.0, 46.0, 408.0, 480.0, 53.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1380202770233154, -1.0960794687271118, -1.0541387796401978, -1.0121979713439941, -0.9702572226524353, -0.9283164739608765, -0.8863756656646729, -0.844434916973114, -0.8024941682815552, -0.7605534195899963, -0.7186126112937927, -0.6766718626022339, -0.634731113910675, -0.5927903652191162, -0.5508495569229126, -0.5089088082313538, -0.46696799993515015, -0.4250272214412689, -0.3830864727497101, -0.34114569425582886, -0.29920494556427, -0.2572641670703888, -0.21532338857650757, -0.17338263988494873, -0.1314418613910675, -0.08950109779834747, -0.047560326755046844, -0.005619555711746216, 0.036321207880973816, 0.07826197147369385, 0.12020274996757507, 0.1621434986591339, 0.20408427715301514, 0.24602504074573517, 0.2879658043384552, 0.3299065828323364, 0.37184733152389526, 0.4137881100177765, 0.4557288885116577, 0.49766963720321655, 0.5396103858947754, 0.5815511345863342, 0.6234919428825378, 0.6654326915740967, 0.7073734402656555, 0.7493141889572144, 0.791254997253418, 0.8331957459449768, 0.8751365542411804, 0.9170773029327393, 0.9590181112289429, 1.0009589195251465, 1.0428996086120605, 1.0848404169082642, 1.1267812252044678, 1.1687219142913818, 1.2106627225875854, 1.252603530883789, 1.2945442199707031, 1.3364850282669067, 1.3784258365631104, 1.4203665256500244, 1.462307333946228, 1.5042481422424316, 1.5461888313293457]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 9.0, 15.0, 30.0, 37.0, 59.0, 83.0, 94.0, 135.0, 111.0, 109.0, 91.0, 92.0, 58.0, 35.0, 22.0, 10.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7593380808830261, -0.738797664642334, -0.7182571887969971, -0.6977167725563049, -0.6771763563156128, -0.6566358804702759, -0.6360954642295837, -0.6155550479888916, -0.5950145721435547, -0.5744741559028625, -0.5539336800575256, -0.5333932638168335, -0.5128527879714966, -0.49231237173080444, -0.4717719554901123, -0.4512315094470978, -0.43069106340408325, -0.4101506173610687, -0.3896101713180542, -0.36906975507736206, -0.34852930903434753, -0.327988862991333, -0.30744844675064087, -0.28690800070762634, -0.2663675546646118, -0.2458271086215973, -0.22528667747974396, -0.20474624633789062, -0.1842058002948761, -0.16366535425186157, -0.14312492311000824, -0.12258449196815491, -0.10204410552978516, -0.08150366693735123, -0.0609632283449173, -0.04042278975248337, -0.01988235116004944, 0.000658087432384491, 0.02119852602481842, 0.04173895716667175, 0.06227940320968628, 0.08281984180212021, 0.10336028039455414, 0.12390071898698807, 0.144441157579422, 0.16498160362243652, 0.18552203476428986, 0.2060624659061432, 0.22660291194915771, 0.24714335799217224, 0.26768380403518677, 0.2882242202758789, 0.30876466631889343, 0.32930511236190796, 0.3498455286026001, 0.3703859746456146, 0.39092642068862915, 0.4114668667316437, 0.4320073127746582, 0.45254772901535034, 0.47308817505836487, 0.4936286211013794, 0.5141690373420715, 0.5347094535827637, 0.5552499294281006]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 1.0, 4.0, 8.0, 10.0, 19.0, 14.0, 37.0, 39.0, 55.0, 94.0, 100.0, 171.0, 251.0, 454.0, 801.0, 1759.0, 4886.0, 21134.0, 142491.0, 707587.0, 139121.0, 20772.0, 5004.0, 1726.0, 796.0, 409.0, 227.0, 169.0, 89.0, 83.0, 64.0, 44.0, 37.0, 20.0, 16.0, 14.0, 14.0, 11.0, 7.0, 4.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.164306640625, -0.15925025939941406, -0.15419387817382812, -0.1491374969482422, -0.14408111572265625, -0.1390247344970703, -0.13396835327148438, -0.12891197204589844, -0.1238555908203125, -0.11879920959472656, -0.11374282836914062, -0.10868644714355469, -0.10363006591796875, -0.09857368469238281, -0.09351730346679688, -0.08846092224121094, -0.083404541015625, -0.07834815979003906, -0.07329177856445312, -0.06823539733886719, -0.06317901611328125, -0.05812263488769531, -0.053066253662109375, -0.04800987243652344, -0.0429534912109375, -0.03789710998535156, -0.032840728759765625, -0.027784347534179688, -0.02272796630859375, -0.017671585083007812, -0.012615203857421875, -0.0075588226318359375, -0.00250244140625, 0.0025539398193359375, 0.007610321044921875, 0.012666702270507812, 0.01772308349609375, 0.022779464721679688, 0.027835845947265625, 0.03289222717285156, 0.0379486083984375, 0.04300498962402344, 0.048061370849609375, 0.05311775207519531, 0.05817413330078125, 0.06323051452636719, 0.06828689575195312, 0.07334327697753906, 0.078399658203125, 0.08345603942871094, 0.08851242065429688, 0.09356880187988281, 0.09862518310546875, 0.10368156433105469, 0.10873794555664062, 0.11379432678222656, 0.1188507080078125, 0.12390708923339844, 0.12896347045898438, 0.1340198516845703, 0.13907623291015625, 0.1441326141357422, 0.14918899536132812, 0.15424537658691406, 0.1593017578125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 18.0, 28.0, 52.0, 58.0, 89.0, 114.0, 116.0, 122.0, 118.0, 78.0, 85.0, 50.0, 22.0, 17.0, 14.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0777587890625, -0.07595348358154297, -0.07414817810058594, -0.0723428726196289, -0.07053756713867188, -0.06873226165771484, -0.06692695617675781, -0.06512165069580078, -0.06331634521484375, -0.06151103973388672, -0.05970573425292969, -0.057900428771972656, -0.056095123291015625, -0.054289817810058594, -0.05248451232910156, -0.05067920684814453, -0.0488739013671875, -0.04706859588623047, -0.04526329040527344, -0.043457984924316406, -0.041652679443359375, -0.039847373962402344, -0.03804206848144531, -0.03623676300048828, -0.03443145751953125, -0.03262615203857422, -0.030820846557617188, -0.029015541076660156, -0.027210235595703125, -0.025404930114746094, -0.023599624633789062, -0.02179431915283203, -0.019989013671875, -0.01818370819091797, -0.016378402709960938, -0.014573097229003906, -0.012767791748046875, -0.010962486267089844, -0.009157180786132812, -0.007351875305175781, -0.00554656982421875, -0.0037412643432617188, -0.0019359588623046875, -0.00013065338134765625, 0.001674652099609375, 0.0034799575805664062, 0.0052852630615234375, 0.007090568542480469, 0.0088958740234375, 0.010701179504394531, 0.012506484985351562, 0.014311790466308594, 0.016117095947265625, 0.017922401428222656, 0.019727706909179688, 0.02153301239013672, 0.02333831787109375, 0.02514362335205078, 0.026948928833007812, 0.028754234313964844, 0.030559539794921875, 0.032364845275878906, 0.03417015075683594, 0.03597545623779297, 0.03778076171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 2.0, 6.0, 10.0, 8.0, 15.0, 17.0, 17.0, 28.0, 46.0, 59.0, 96.0, 151.0, 263.0, 666.0, 2076.0, 9228.0, 62328.0, 651640.0, 287203.0, 27502.0, 4853.0, 1331.0, 428.0, 195.0, 108.0, 80.0, 53.0, 39.0, 34.0, 18.0, 14.0, 15.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1451416015625, -0.14010238647460938, -0.13506317138671875, -0.13002395629882812, -0.1249847412109375, -0.11994552612304688, -0.11490631103515625, -0.10986709594726562, -0.104827880859375, -0.09978866577148438, -0.09474945068359375, -0.08971023559570312, -0.0846710205078125, -0.07963180541992188, -0.07459259033203125, -0.06955337524414062, -0.06451416015625, -0.059474945068359375, -0.05443572998046875, -0.049396514892578125, -0.0443572998046875, -0.039318084716796875, -0.03427886962890625, -0.029239654541015625, -0.024200439453125, -0.019161224365234375, -0.01412200927734375, -0.009082794189453125, -0.0040435791015625, 0.000995635986328125, 0.00603485107421875, 0.011074066162109375, 0.01611328125, 0.021152496337890625, 0.02619171142578125, 0.031230926513671875, 0.0362701416015625, 0.041309356689453125, 0.04634857177734375, 0.051387786865234375, 0.056427001953125, 0.061466217041015625, 0.06650543212890625, 0.07154464721679688, 0.0765838623046875, 0.08162307739257812, 0.08666229248046875, 0.09170150756835938, 0.09674072265625, 0.10177993774414062, 0.10681915283203125, 0.11185836791992188, 0.1168975830078125, 0.12193679809570312, 0.12697601318359375, 0.13201522827148438, 0.137054443359375, 0.14209365844726562, 0.14713287353515625, 0.15217208862304688, 0.1572113037109375, 0.16225051879882812, 0.16728973388671875, 0.17232894897460938, 0.1773681640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 12.0, 8.0, 9.0, 18.0, 18.0, 17.0, 26.0, 31.0, 34.0, 29.0, 37.0, 43.0, 55.0, 48.0, 51.0, 55.0, 62.0, 61.0, 41.0, 56.0, 44.0, 33.0, 31.0, 26.0, 31.0, 21.0, 16.0, 20.0, 18.0, 8.0, 5.0, 2.0, 5.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10955810546875, -0.10583019256591797, -0.10210227966308594, -0.0983743667602539, -0.09464645385742188, -0.09091854095458984, -0.08719062805175781, -0.08346271514892578, -0.07973480224609375, -0.07600688934326172, -0.07227897644042969, -0.06855106353759766, -0.06482315063476562, -0.061095237731933594, -0.05736732482910156, -0.05363941192626953, -0.0499114990234375, -0.04618358612060547, -0.04245567321777344, -0.038727760314941406, -0.034999847412109375, -0.031271934509277344, -0.027544021606445312, -0.02381610870361328, -0.02008819580078125, -0.01636028289794922, -0.012632369995117188, -0.008904457092285156, -0.005176544189453125, -0.0014486312866210938, 0.0022792816162109375, 0.006007194519042969, 0.009735107421875, 0.013463020324707031, 0.017190933227539062, 0.020918846130371094, 0.024646759033203125, 0.028374671936035156, 0.03210258483886719, 0.03583049774169922, 0.03955841064453125, 0.04328632354736328, 0.04701423645019531, 0.050742149353027344, 0.054470062255859375, 0.058197975158691406, 0.06192588806152344, 0.06565380096435547, 0.0693817138671875, 0.07310962677001953, 0.07683753967285156, 0.0805654525756836, 0.08429336547851562, 0.08802127838134766, 0.09174919128417969, 0.09547710418701172, 0.09920501708984375, 0.10293292999267578, 0.10666084289550781, 0.11038875579833984, 0.11411666870117188, 0.1178445816040039, 0.12157249450683594, 0.12530040740966797, 0.1290283203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 13.0, 23.0, 31.0, 30.0, 68.0, 99.0, 149.0, 289.0, 470.0, 989.0, 2024.0, 4926.0, 14030.0, 49380.0, 204417.0, 465732.0, 226489.0, 54393.0, 15052.0, 5274.0, 2199.0, 1084.0, 593.0, 318.0, 173.0, 99.0, 80.0, 41.0, 23.0, 21.0, 14.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.042266845703125, -0.04100656509399414, -0.03974628448486328, -0.03848600387573242, -0.03722572326660156, -0.0359654426574707, -0.034705162048339844, -0.033444881439208984, -0.032184600830078125, -0.030924320220947266, -0.029664039611816406, -0.028403759002685547, -0.027143478393554688, -0.025883197784423828, -0.02462291717529297, -0.02336263656616211, -0.02210235595703125, -0.02084207534790039, -0.01958179473876953, -0.018321514129638672, -0.017061233520507812, -0.015800952911376953, -0.014540672302246094, -0.013280391693115234, -0.012020111083984375, -0.010759830474853516, -0.009499549865722656, -0.008239269256591797, -0.0069789886474609375, -0.005718708038330078, -0.004458427429199219, -0.0031981468200683594, -0.0019378662109375, -0.0006775856018066406, 0.0005826950073242188, 0.0018429756164550781, 0.0031032562255859375, 0.004363536834716797, 0.005623817443847656, 0.006884098052978516, 0.008144378662109375, 0.009404659271240234, 0.010664939880371094, 0.011925220489501953, 0.013185501098632812, 0.014445781707763672, 0.01570606231689453, 0.01696634292602539, 0.01822662353515625, 0.01948690414428711, 0.02074718475341797, 0.022007465362548828, 0.023267745971679688, 0.024528026580810547, 0.025788307189941406, 0.027048587799072266, 0.028308868408203125, 0.029569149017333984, 0.030829429626464844, 0.0320897102355957, 0.03334999084472656, 0.03461027145385742, 0.03587055206298828, 0.03713083267211914, 0.03839111328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 2.0, 13.0, 22.0, 37.0, 28.0, 45.0, 59.0, 85.0, 122.0, 109.0, 111.0, 92.0, 80.0, 51.0, 38.0, 40.0, 15.0, 17.0, 11.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00017833709716796875, -0.0001727379858493805, -0.00016713887453079224, -0.00016153976321220398, -0.00015594065189361572, -0.00015034154057502747, -0.0001447424292564392, -0.00013914331793785095, -0.0001335442066192627, -0.00012794509530067444, -0.00012234598398208618, -0.00011674687266349792, -0.00011114776134490967, -0.00010554865002632141, -9.994953870773315e-05, -9.43504273891449e-05, -8.875131607055664e-05, -8.315220475196838e-05, -7.755309343338013e-05, -7.195398211479187e-05, -6.635487079620361e-05, -6.0755759477615356e-05, -5.51566481590271e-05, -4.955753684043884e-05, -4.3958425521850586e-05, -3.835931420326233e-05, -3.276020288467407e-05, -2.7161091566085815e-05, -2.156198024749756e-05, -1.5962868928909302e-05, -1.0363757610321045e-05, -4.764646291732788e-06, 8.344650268554688e-07, 6.433576345443726e-06, 1.2032687664031982e-05, 1.763179898262024e-05, 2.3230910301208496e-05, 2.8830021619796753e-05, 3.442913293838501e-05, 4.0028244256973267e-05, 4.5627355575561523e-05, 5.122646689414978e-05, 5.682557821273804e-05, 6.24246895313263e-05, 6.802380084991455e-05, 7.362291216850281e-05, 7.922202348709106e-05, 8.482113480567932e-05, 9.042024612426758e-05, 9.601935744285583e-05, 0.00010161846876144409, 0.00010721758008003235, 0.0001128166913986206, 0.00011841580271720886, 0.00012401491403579712, 0.00012961402535438538, 0.00013521313667297363, 0.0001408122479915619, 0.00014641135931015015, 0.0001520104706287384, 0.00015760958194732666, 0.00016320869326591492, 0.00016880780458450317, 0.00017440691590309143, 0.0001800060272216797]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 8.0, 17.0, 8.0, 21.0, 38.0, 63.0, 115.0, 171.0, 407.0, 817.0, 2015.0, 5672.0, 23478.0, 159297.0, 610612.0, 205906.0, 29122.0, 6691.0, 2284.0, 904.0, 421.0, 200.0, 122.0, 63.0, 30.0, 26.0, 19.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0], "bins": [-0.07623291015625, -0.07444190979003906, -0.07265090942382812, -0.07085990905761719, -0.06906890869140625, -0.06727790832519531, -0.06548690795898438, -0.06369590759277344, -0.0619049072265625, -0.06011390686035156, -0.058322906494140625, -0.05653190612792969, -0.05474090576171875, -0.05294990539550781, -0.051158905029296875, -0.04936790466308594, -0.047576904296875, -0.04578590393066406, -0.043994903564453125, -0.04220390319824219, -0.04041290283203125, -0.03862190246582031, -0.036830902099609375, -0.03503990173339844, -0.0332489013671875, -0.03145790100097656, -0.029666900634765625, -0.027875900268554688, -0.02608489990234375, -0.024293899536132812, -0.022502899169921875, -0.020711898803710938, -0.0189208984375, -0.017129898071289062, -0.015338897705078125, -0.013547897338867188, -0.01175689697265625, -0.009965896606445312, -0.008174896240234375, -0.0063838958740234375, -0.0045928955078125, -0.0028018951416015625, -0.001010894775390625, 0.0007801055908203125, 0.00257110595703125, 0.0043621063232421875, 0.006153106689453125, 0.007944107055664062, 0.009735107421875, 0.011526107788085938, 0.013317108154296875, 0.015108108520507812, 0.01689910888671875, 0.018690109252929688, 0.020481109619140625, 0.022272109985351562, 0.0240631103515625, 0.025854110717773438, 0.027645111083984375, 0.029436111450195312, 0.03122711181640625, 0.03301811218261719, 0.034809112548828125, 0.03660011291503906, 0.03839111328125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 11.0, 7.0, 7.0, 12.0, 11.0, 20.0, 23.0, 40.0, 46.0, 38.0, 72.0, 87.0, 101.0, 86.0, 94.0, 76.0, 74.0, 55.0, 38.0, 32.0, 18.0, 13.0, 15.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035919189453125, -0.03465700149536133, -0.033394813537597656, -0.032132625579833984, -0.030870437622070312, -0.02960824966430664, -0.02834606170654297, -0.027083873748779297, -0.025821685791015625, -0.024559497833251953, -0.02329730987548828, -0.02203512191772461, -0.020772933959960938, -0.019510746002197266, -0.018248558044433594, -0.016986370086669922, -0.01572418212890625, -0.014461994171142578, -0.013199806213378906, -0.011937618255615234, -0.010675430297851562, -0.00941324234008789, -0.008151054382324219, -0.006888866424560547, -0.005626678466796875, -0.004364490509033203, -0.0031023025512695312, -0.0018401145935058594, -0.0005779266357421875, 0.0006842613220214844, 0.0019464492797851562, 0.003208637237548828, 0.0044708251953125, 0.005733013153076172, 0.006995201110839844, 0.008257389068603516, 0.009519577026367188, 0.01078176498413086, 0.012043952941894531, 0.013306140899658203, 0.014568328857421875, 0.015830516815185547, 0.01709270477294922, 0.01835489273071289, 0.019617080688476562, 0.020879268646240234, 0.022141456604003906, 0.023403644561767578, 0.02466583251953125, 0.025928020477294922, 0.027190208435058594, 0.028452396392822266, 0.029714584350585938, 0.03097677230834961, 0.03223896026611328, 0.03350114822387695, 0.034763336181640625, 0.0360255241394043, 0.03728771209716797, 0.03854990005493164, 0.03981208801269531, 0.041074275970458984, 0.042336463928222656, 0.04359865188598633, 0.04486083984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 39.0, 100.0, 426.0, 304.0, 76.0, 28.0, 12.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0597352981567383, -2.0105113983154297, -1.9612873792648315, -1.9120633602142334, -1.8628393411636353, -1.8136154413223267, -1.7643914222717285, -1.71516752243042, -1.6659435033798218, -1.6167194843292236, -1.567495584487915, -1.518271565437317, -1.4690475463867188, -1.4198236465454102, -1.370599627494812, -1.3213756084442139, -1.2721517086029053, -1.2229276895523071, -1.1737037897109985, -1.1244797706604004, -1.0752557516098022, -1.0260318517684937, -0.9768078327178955, -0.9275838732719421, -0.8783597946166992, -0.8291358351707458, -0.7799118161201477, -0.7306878566741943, -0.681463897228241, -0.6322399377822876, -0.5830159187316895, -0.5337919592857361, -0.4845679998397827, -0.43534401059150696, -0.3861200511455536, -0.33689606189727783, -0.28767210245132446, -0.2384481132030487, -0.18922412395477295, -0.14000016450881958, -0.09077617526054382, -0.04155219718813896, 0.0076717808842659, 0.05689576268196106, 0.10611973702907562, 0.15534371137619019, 0.20456770062446594, 0.2537916600704193, 0.30301564931869507, 0.3522396385669708, 0.4014635980129242, 0.45068758726119995, 0.4999115467071533, 0.5491355657577515, 0.5983595252037048, 0.6475834846496582, 0.6968075037002563, 0.7460314631462097, 0.7952554821968079, 0.8444794416427612, 0.8937034010887146, 0.942927360534668, 0.9921513795852661, 1.0413753986358643, 1.0905992984771729]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 10.0, 3.0, 8.0, 17.0, 11.0, 16.0, 18.0, 17.0, 24.0, 29.0, 25.0, 40.0, 41.0, 46.0, 58.0, 54.0, 71.0, 55.0, 56.0, 72.0, 52.0, 43.0, 35.0, 43.0, 35.0, 29.0, 21.0, 25.0, 11.0, 13.0, 12.0, 6.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6694530844688416, -0.6468819975852966, -0.6243109703063965, -0.6017398834228516, -0.5791688561439514, -0.5565977692604065, -0.5340267419815063, -0.5114556550979614, -0.4888845980167389, -0.46631354093551636, -0.4437424838542938, -0.4211714267730713, -0.39860033988952637, -0.3760293126106262, -0.3534582257270813, -0.33088716864585876, -0.30831611156463623, -0.2857450544834137, -0.26317399740219116, -0.24060292541980743, -0.2180318683385849, -0.19546081125736237, -0.17288973927497864, -0.1503186821937561, -0.12774762511253357, -0.10517656803131104, -0.0826055034995079, -0.06003443896770477, -0.03746338188648224, -0.014892324805259705, 0.0076787471771240234, 0.030249804258346558, 0.05282086133956909, 0.07539191842079163, 0.09796298295259476, 0.12053404748439789, 0.14310510456562042, 0.16567616164684296, 0.18824723362922668, 0.21081829071044922, 0.23338934779167175, 0.2559604048728943, 0.2785314619541168, 0.30110251903533936, 0.3236736059188843, 0.3462446331977844, 0.36881572008132935, 0.3913867771625519, 0.4139578342437744, 0.43652889132499695, 0.4590999484062195, 0.4816710352897644, 0.5042420625686646, 0.5268131494522095, 0.5493842363357544, 0.5719552636146545, 0.5945262908935547, 0.6170973777770996, 0.6396684050559998, 0.6622394919395447, 0.6848105192184448, 0.7073816061019897, 0.7299526929855347, 0.7525237202644348, 0.7750948071479797]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 0.0, 6.0, 8.0, 20.0, 10.0, 19.0, 28.0, 33.0, 67.0, 87.0, 122.0, 213.0, 387.0, 654.0, 1517.0, 5109.0, 32349.0, 3457852.0, 670663.0, 19459.0, 3632.0, 1122.0, 476.0, 220.0, 97.0, 55.0, 26.0, 15.0, 14.0, 8.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0], "bins": [-0.404052734375, -0.395050048828125, -0.38604736328125, -0.377044677734375, -0.3680419921875, -0.359039306640625, -0.35003662109375, -0.341033935546875, -0.33203125, -0.323028564453125, -0.31402587890625, -0.305023193359375, -0.2960205078125, -0.287017822265625, -0.27801513671875, -0.269012451171875, -0.260009765625, -0.251007080078125, -0.24200439453125, -0.233001708984375, -0.2239990234375, -0.214996337890625, -0.20599365234375, -0.196990966796875, -0.18798828125, -0.178985595703125, -0.16998291015625, -0.160980224609375, -0.1519775390625, -0.142974853515625, -0.13397216796875, -0.124969482421875, -0.115966796875, -0.106964111328125, -0.09796142578125, -0.088958740234375, -0.0799560546875, -0.070953369140625, -0.06195068359375, -0.052947998046875, -0.0439453125, -0.034942626953125, -0.02593994140625, -0.016937255859375, -0.0079345703125, 0.001068115234375, 0.01007080078125, 0.019073486328125, 0.028076171875, 0.037078857421875, 0.04608154296875, 0.055084228515625, 0.0640869140625, 0.073089599609375, 0.08209228515625, 0.091094970703125, 0.10009765625, 0.109100341796875, 0.11810302734375, 0.127105712890625, 0.1361083984375, 0.145111083984375, 0.15411376953125, 0.163116455078125, 0.172119140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 11.0, 17.0, 23.0, 41.0, 47.0, 76.0, 122.0, 108.0, 130.0, 110.0, 102.0, 77.0, 60.0, 30.0, 20.0, 8.0, 9.0, 9.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08282470703125, -0.08095884323120117, -0.07909297943115234, -0.07722711563110352, -0.07536125183105469, -0.07349538803100586, -0.07162952423095703, -0.0697636604309082, -0.06789779663085938, -0.06603193283081055, -0.06416606903076172, -0.06230020523071289, -0.06043434143066406, -0.058568477630615234, -0.056702613830566406, -0.05483675003051758, -0.05297088623046875, -0.05110502243041992, -0.049239158630371094, -0.047373294830322266, -0.04550743103027344, -0.04364156723022461, -0.04177570343017578, -0.03990983963012695, -0.038043975830078125, -0.0361781120300293, -0.03431224822998047, -0.03244638442993164, -0.030580520629882812, -0.028714656829833984, -0.026848793029785156, -0.024982929229736328, -0.0231170654296875, -0.021251201629638672, -0.019385337829589844, -0.017519474029541016, -0.015653610229492188, -0.01378774642944336, -0.011921882629394531, -0.010056018829345703, -0.008190155029296875, -0.006324291229248047, -0.004458427429199219, -0.0025925636291503906, -0.0007266998291015625, 0.0011391639709472656, 0.0030050277709960938, 0.004870891571044922, 0.00673675537109375, 0.008602619171142578, 0.010468482971191406, 0.012334346771240234, 0.014200210571289062, 0.01606607437133789, 0.01793193817138672, 0.019797801971435547, 0.021663665771484375, 0.023529529571533203, 0.02539539337158203, 0.02726125717163086, 0.029127120971679688, 0.030992984771728516, 0.032858848571777344, 0.03472471237182617, 0.036590576171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 16.0, 37.0, 83.0, 166.0, 295.0, 2258.0, 4189094.0, 1691.0, 303.0, 146.0, 83.0, 56.0, 30.0, 18.0, 9.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83642578125, -0.7992019653320312, -0.7619781494140625, -0.7247543334960938, -0.687530517578125, -0.6503067016601562, -0.6130828857421875, -0.5758590698242188, -0.53863525390625, -0.5014114379882812, -0.4641876220703125, -0.42696380615234375, -0.389739990234375, -0.35251617431640625, -0.3152923583984375, -0.27806854248046875, -0.2408447265625, -0.20362091064453125, -0.1663970947265625, -0.12917327880859375, -0.091949462890625, -0.05472564697265625, -0.0175018310546875, 0.01972198486328125, 0.05694580078125, 0.09416961669921875, 0.1313934326171875, 0.16861724853515625, 0.205841064453125, 0.24306488037109375, 0.2802886962890625, 0.31751251220703125, 0.354736328125, 0.39196014404296875, 0.4291839599609375, 0.46640777587890625, 0.503631591796875, 0.5408554077148438, 0.5780792236328125, 0.6153030395507812, 0.65252685546875, 0.6897506713867188, 0.7269744873046875, 0.7641983032226562, 0.801422119140625, 0.8386459350585938, 0.8758697509765625, 0.9130935668945312, 0.9503173828125, 0.9875411987304688, 1.0247650146484375, 1.0619888305664062, 1.099212646484375, 1.1364364624023438, 1.1736602783203125, 1.2108840942382812, 1.24810791015625, 1.2853317260742188, 1.3225555419921875, 1.3597793579101562, 1.397003173828125, 1.4342269897460938, 1.4714508056640625, 1.5086746215820312, 1.5458984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 13.0, 97.0, 2898.0, 1012.0, 58.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1959228515625, -0.18803977966308594, -0.18015670776367188, -0.1722736358642578, -0.16439056396484375, -0.1565074920654297, -0.14862442016601562, -0.14074134826660156, -0.1328582763671875, -0.12497520446777344, -0.11709213256835938, -0.10920906066894531, -0.10132598876953125, -0.09344291687011719, -0.08555984497070312, -0.07767677307128906, -0.069793701171875, -0.06191062927246094, -0.054027557373046875, -0.04614448547363281, -0.03826141357421875, -0.030378341674804688, -0.022495269775390625, -0.014612197875976562, -0.0067291259765625, 0.0011539459228515625, 0.009037017822265625, 0.016920089721679688, 0.02480316162109375, 0.03268623352050781, 0.040569305419921875, 0.04845237731933594, 0.05633544921875, 0.06421852111816406, 0.07210159301757812, 0.07998466491699219, 0.08786773681640625, 0.09575080871582031, 0.10363388061523438, 0.11151695251464844, 0.1194000244140625, 0.12728309631347656, 0.13516616821289062, 0.1430492401123047, 0.15093231201171875, 0.1588153839111328, 0.16669845581054688, 0.17458152770996094, 0.182464599609375, 0.19034767150878906, 0.19823074340820312, 0.2061138153076172, 0.21399688720703125, 0.2218799591064453, 0.22976303100585938, 0.23764610290527344, 0.2455291748046875, 0.25341224670410156, 0.2612953186035156, 0.2691783905029297, 0.27706146240234375, 0.2849445343017578, 0.2928276062011719, 0.30071067810058594, 0.30859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 19.0, 231.0, 747.0, 18.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3270034790039062, -2.2704896926879883, -2.2139759063720703, -2.1574618816375732, -2.1009480953216553, -2.0444343090057373, -1.9879204034805298, -1.9314064979553223, -1.8748927116394043, -1.8183789253234863, -1.7618650197982788, -1.7053511142730713, -1.6488373279571533, -1.5923235416412354, -1.5358096361160278, -1.4792957305908203, -1.4227819442749023, -1.3662681579589844, -1.3097542524337769, -1.2532403469085693, -1.1967265605926514, -1.1402127742767334, -1.0836988687515259, -1.0271849632263184, -0.9706711769104004, -0.9141573309898376, -0.8576434850692749, -0.8011296391487122, -0.7446157932281494, -0.6881019473075867, -0.6315881013870239, -0.5750742554664612, -0.518560528755188, -0.46204668283462524, -0.4055328369140625, -0.34901899099349976, -0.292505145072937, -0.23599129915237427, -0.17947745323181152, -0.12296360731124878, -0.06644976139068604, -0.009935915470123291, 0.04657793045043945, 0.1030917763710022, 0.15960562229156494, 0.21611946821212769, 0.27263331413269043, 0.3291471600532532, 0.3856610059738159, 0.44217485189437866, 0.4986886978149414, 0.5552025437355042, 0.6117163896560669, 0.6682302355766296, 0.7247440814971924, 0.7812579274177551, 0.8377717733383179, 0.8942856192588806, 0.9507994651794434, 1.0073132514953613, 1.0638271570205688, 1.1203410625457764, 1.1768548488616943, 1.2333686351776123, 1.2898825407028198]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 16.0, 37.0, 53.0, 71.0, 91.0, 128.0, 127.0, 137.0, 107.0, 82.0, 63.0, 41.0, 18.0, 13.0, 4.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5757104158401489, -0.5623830556869507, -0.5490556955337524, -0.5357283353805542, -0.5224009156227112, -0.5090735554695129, -0.4957461953163147, -0.48241883516311646, -0.4690914750099182, -0.45576411485671997, -0.44243672490119934, -0.4291093647480011, -0.41578200459480286, -0.4024546146392822, -0.389127254486084, -0.37579989433288574, -0.3624725341796875, -0.34914517402648926, -0.33581778407096863, -0.3224904239177704, -0.30916306376457214, -0.2958356738090515, -0.28250831365585327, -0.26918095350265503, -0.2558535635471344, -0.24252618849277496, -0.22919882833957672, -0.21587145328521729, -0.20254409313201904, -0.1892167180776596, -0.17588934302330017, -0.16256198287010193, -0.1492346227169037, -0.13590724766254425, -0.12257988750934601, -0.10925251245498657, -0.09592515230178833, -0.0825977772474289, -0.06927040964365005, -0.055943042039871216, -0.04261567443609238, -0.029288306832313538, -0.01596093736588955, -0.002633567899465561, 0.010693799704313278, 0.024021171033382416, 0.037348538637161255, 0.050675906240940094, 0.06400327384471893, 0.07733064144849777, 0.09065800905227661, 0.10398538410663605, 0.11731274425983429, 0.13064011931419373, 0.14396747946739197, 0.1572948545217514, 0.17062222957611084, 0.18394960463047028, 0.19727696478366852, 0.21060433983802795, 0.2239316999912262, 0.23725907504558563, 0.25058645009994507, 0.2639138102531433, 0.27724117040634155]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 9.0, 9.0, 8.0, 13.0, 21.0, 44.0, 36.0, 62.0, 87.0, 104.0, 196.0, 270.0, 501.0, 818.0, 1536.0, 3862.0, 10857.0, 38994.0, 191712.0, 567790.0, 177244.0, 36823.0, 10334.0, 3542.0, 1480.0, 810.0, 429.0, 288.0, 184.0, 127.0, 101.0, 80.0, 47.0, 42.0, 30.0, 11.0, 10.0, 10.0, 9.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11688232421875, -0.11339092254638672, -0.10989952087402344, -0.10640811920166016, -0.10291671752929688, -0.0994253158569336, -0.09593391418457031, -0.09244251251220703, -0.08895111083984375, -0.08545970916748047, -0.08196830749511719, -0.0784769058227539, -0.07498550415039062, -0.07149410247802734, -0.06800270080566406, -0.06451129913330078, -0.0610198974609375, -0.05752849578857422, -0.05403709411621094, -0.050545692443847656, -0.047054290771484375, -0.043562889099121094, -0.04007148742675781, -0.03658008575439453, -0.03308868408203125, -0.02959728240966797, -0.026105880737304688, -0.022614479064941406, -0.019123077392578125, -0.015631675720214844, -0.012140274047851562, -0.008648872375488281, -0.005157470703125, -0.0016660690307617188, 0.0018253326416015625, 0.005316734313964844, 0.008808135986328125, 0.012299537658691406, 0.015790939331054688, 0.01928234100341797, 0.02277374267578125, 0.02626514434814453, 0.029756546020507812, 0.033247947692871094, 0.036739349365234375, 0.040230751037597656, 0.04372215270996094, 0.04721355438232422, 0.0507049560546875, 0.05419635772705078, 0.05768775939941406, 0.061179161071777344, 0.06467056274414062, 0.0681619644165039, 0.07165336608886719, 0.07514476776123047, 0.07863616943359375, 0.08212757110595703, 0.08561897277832031, 0.0891103744506836, 0.09260177612304688, 0.09609317779541016, 0.09958457946777344, 0.10307598114013672, 0.1065673828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 9.0, 10.0, 23.0, 36.0, 50.0, 49.0, 70.0, 85.0, 88.0, 98.0, 92.0, 100.0, 83.0, 46.0, 38.0, 41.0, 26.0, 18.0, 11.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05792236328125, -0.05646181106567383, -0.055001258850097656, -0.053540706634521484, -0.05208015441894531, -0.05061960220336914, -0.04915904998779297, -0.0476984977722168, -0.046237945556640625, -0.04477739334106445, -0.04331684112548828, -0.04185628890991211, -0.04039573669433594, -0.038935184478759766, -0.037474632263183594, -0.03601408004760742, -0.03455352783203125, -0.03309297561645508, -0.031632423400878906, -0.030171871185302734, -0.028711318969726562, -0.02725076675415039, -0.02579021453857422, -0.024329662322998047, -0.022869110107421875, -0.021408557891845703, -0.01994800567626953, -0.01848745346069336, -0.017026901245117188, -0.015566349029541016, -0.014105796813964844, -0.012645244598388672, -0.0111846923828125, -0.009724140167236328, -0.008263587951660156, -0.006803035736083984, -0.0053424835205078125, -0.0038819313049316406, -0.0024213790893554688, -0.0009608268737792969, 0.000499725341796875, 0.001960277557373047, 0.0034208297729492188, 0.004881381988525391, 0.0063419342041015625, 0.007802486419677734, 0.009263038635253906, 0.010723590850830078, 0.01218414306640625, 0.013644695281982422, 0.015105247497558594, 0.016565799713134766, 0.018026351928710938, 0.01948690414428711, 0.02094745635986328, 0.022408008575439453, 0.023868560791015625, 0.025329113006591797, 0.02678966522216797, 0.02825021743774414, 0.029710769653320312, 0.031171321868896484, 0.032631874084472656, 0.03409242630004883, 0.035552978515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 10.0, 6.0, 10.0, 17.0, 23.0, 44.0, 52.0, 112.0, 202.0, 478.0, 1289.0, 4865.0, 32477.0, 652891.0, 331571.0, 19233.0, 3498.0, 999.0, 375.0, 152.0, 88.0, 52.0, 34.0, 24.0, 15.0, 7.0, 6.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.234619140625, -0.2284259796142578, -0.22223281860351562, -0.21603965759277344, -0.20984649658203125, -0.20365333557128906, -0.19746017456054688, -0.1912670135498047, -0.1850738525390625, -0.1788806915283203, -0.17268753051757812, -0.16649436950683594, -0.16030120849609375, -0.15410804748535156, -0.14791488647460938, -0.1417217254638672, -0.135528564453125, -0.1293354034423828, -0.12314224243164062, -0.11694908142089844, -0.11075592041015625, -0.10456275939941406, -0.09836959838867188, -0.09217643737792969, -0.0859832763671875, -0.07979011535644531, -0.07359695434570312, -0.06740379333496094, -0.06121063232421875, -0.05501747131347656, -0.048824310302734375, -0.04263114929199219, -0.03643798828125, -0.030244827270507812, -0.024051666259765625, -0.017858505249023438, -0.01166534423828125, -0.0054721832275390625, 0.000720977783203125, 0.0069141387939453125, 0.0131072998046875, 0.019300460815429688, 0.025493621826171875, 0.03168678283691406, 0.03787994384765625, 0.04407310485839844, 0.050266265869140625, 0.05645942687988281, 0.062652587890625, 0.06884574890136719, 0.07503890991210938, 0.08123207092285156, 0.08742523193359375, 0.09361839294433594, 0.09981155395507812, 0.10600471496582031, 0.1121978759765625, 0.11839103698730469, 0.12458419799804688, 0.13077735900878906, 0.13697052001953125, 0.14316368103027344, 0.14935684204101562, 0.1555500030517578, 0.1617431640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 10.0, 9.0, 18.0, 20.0, 27.0, 30.0, 39.0, 43.0, 66.0, 84.0, 85.0, 86.0, 96.0, 81.0, 66.0, 53.0, 41.0, 35.0, 24.0, 23.0, 14.0, 10.0, 9.0, 5.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.2198486328125, -0.21418380737304688, -0.20851898193359375, -0.20285415649414062, -0.1971893310546875, -0.19152450561523438, -0.18585968017578125, -0.18019485473632812, -0.174530029296875, -0.16886520385742188, -0.16320037841796875, -0.15753555297851562, -0.1518707275390625, -0.14620590209960938, -0.14054107666015625, -0.13487625122070312, -0.12921142578125, -0.12354660034179688, -0.11788177490234375, -0.11221694946289062, -0.1065521240234375, -0.10088729858398438, -0.09522247314453125, -0.08955764770507812, -0.083892822265625, -0.07822799682617188, -0.07256317138671875, -0.06689834594726562, -0.0612335205078125, -0.055568695068359375, -0.04990386962890625, -0.044239044189453125, -0.03857421875, -0.032909393310546875, -0.02724456787109375, -0.021579742431640625, -0.0159149169921875, -0.010250091552734375, -0.00458526611328125, 0.001079559326171875, 0.006744384765625, 0.012409210205078125, 0.01807403564453125, 0.023738861083984375, 0.0294036865234375, 0.035068511962890625, 0.04073333740234375, 0.046398162841796875, 0.05206298828125, 0.057727813720703125, 0.06339263916015625, 0.06905746459960938, 0.0747222900390625, 0.08038711547851562, 0.08605194091796875, 0.09171676635742188, 0.097381591796875, 0.10304641723632812, 0.10871124267578125, 0.11437606811523438, 0.1200408935546875, 0.12570571899414062, 0.13137054443359375, 0.13703536987304688, 0.1427001953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 12.0, 5.0, 17.0, 16.0, 32.0, 24.0, 50.0, 68.0, 117.0, 174.0, 306.0, 668.0, 1167.0, 2572.0, 6440.0, 19759.0, 82453.0, 381518.0, 421016.0, 97280.0, 22296.0, 6899.0, 2832.0, 1274.0, 650.0, 341.0, 200.0, 134.0, 76.0, 49.0, 33.0, 30.0, 12.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04425048828125, -0.042911529541015625, -0.04157257080078125, -0.040233612060546875, -0.0388946533203125, -0.037555694580078125, -0.03621673583984375, -0.034877777099609375, -0.033538818359375, -0.032199859619140625, -0.03086090087890625, -0.029521942138671875, -0.0281829833984375, -0.026844024658203125, -0.02550506591796875, -0.024166107177734375, -0.0228271484375, -0.021488189697265625, -0.02014923095703125, -0.018810272216796875, -0.0174713134765625, -0.016132354736328125, -0.01479339599609375, -0.013454437255859375, -0.012115478515625, -0.010776519775390625, -0.00943756103515625, -0.008098602294921875, -0.0067596435546875, -0.005420684814453125, -0.00408172607421875, -0.002742767333984375, -0.00140380859375, -6.4849853515625e-05, 0.00127410888671875, 0.002613067626953125, 0.0039520263671875, 0.005290985107421875, 0.00662994384765625, 0.007968902587890625, 0.009307861328125, 0.010646820068359375, 0.01198577880859375, 0.013324737548828125, 0.0146636962890625, 0.016002655029296875, 0.01734161376953125, 0.018680572509765625, 0.02001953125, 0.021358489990234375, 0.02269744873046875, 0.024036407470703125, 0.0253753662109375, 0.026714324951171875, 0.02805328369140625, 0.029392242431640625, 0.030731201171875, 0.032070159912109375, 0.03340911865234375, 0.034748077392578125, 0.0360870361328125, 0.037425994873046875, 0.03876495361328125, 0.040103912353515625, 0.04144287109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 3.0, 6.0, 19.0, 17.0, 26.0, 21.0, 47.0, 45.0, 64.0, 78.0, 102.0, 103.0, 97.0, 69.0, 61.0, 54.0, 34.0, 38.0, 31.0, 16.0, 12.0, 12.0, 8.0, 5.0, 8.0, 3.0, 2.0, 6.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011271238327026367, -0.00010887254029512405, -0.00010503269731998444, -0.00010119285434484482, -9.73530113697052e-05, -9.351316839456558e-05, -8.967332541942596e-05, -8.583348244428635e-05, -8.199363946914673e-05, -7.815379649400711e-05, -7.431395351886749e-05, -7.047411054372787e-05, -6.663426756858826e-05, -6.279442459344864e-05, -5.895458161830902e-05, -5.51147386431694e-05, -5.1274895668029785e-05, -4.743505269289017e-05, -4.359520971775055e-05, -3.975536674261093e-05, -3.5915523767471313e-05, -3.2075680792331696e-05, -2.8235837817192078e-05, -2.439599484205246e-05, -2.0556151866912842e-05, -1.6716308891773224e-05, -1.2876465916633606e-05, -9.036622941493988e-06, -5.19677996635437e-06, -1.3569369912147522e-06, 2.4829059839248657e-06, 6.322748959064484e-06, 1.0162591934204102e-05, 1.400243490934372e-05, 1.7842277884483337e-05, 2.1682120859622955e-05, 2.5521963834762573e-05, 2.936180680990219e-05, 3.320164978504181e-05, 3.704149276018143e-05, 4.0881335735321045e-05, 4.472117871046066e-05, 4.856102168560028e-05, 5.24008646607399e-05, 5.6240707635879517e-05, 6.0080550611019135e-05, 6.392039358615875e-05, 6.776023656129837e-05, 7.160007953643799e-05, 7.54399225115776e-05, 7.927976548671722e-05, 8.311960846185684e-05, 8.695945143699646e-05, 9.079929441213608e-05, 9.46391373872757e-05, 9.847898036241531e-05, 0.00010231882333755493, 0.00010615866631269455, 0.00010999850928783417, 0.00011383835226297379, 0.0001176781952381134, 0.00012151803821325302, 0.00012535788118839264, 0.00012919772416353226, 0.00013303756713867188]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 13.0, 21.0, 23.0, 27.0, 40.0, 82.0, 99.0, 179.0, 295.0, 464.0, 1007.0, 2082.0, 4724.0, 12739.0, 45858.0, 211858.0, 497104.0, 206146.0, 44554.0, 12319.0, 4552.0, 2083.0, 973.0, 486.0, 294.0, 188.0, 112.0, 71.0, 50.0, 26.0, 22.0, 13.0, 19.0, 8.0, 5.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04437255859375, -0.043122291564941406, -0.04187202453613281, -0.04062175750732422, -0.039371490478515625, -0.03812122344970703, -0.03687095642089844, -0.035620689392089844, -0.03437042236328125, -0.033120155334472656, -0.03186988830566406, -0.03061962127685547, -0.029369354248046875, -0.02811908721923828, -0.026868820190429688, -0.025618553161621094, -0.0243682861328125, -0.023118019104003906, -0.021867752075195312, -0.02061748504638672, -0.019367218017578125, -0.01811695098876953, -0.016866683959960938, -0.015616416931152344, -0.01436614990234375, -0.013115882873535156, -0.011865615844726562, -0.010615348815917969, -0.009365081787109375, -0.008114814758300781, -0.0068645477294921875, -0.005614280700683594, -0.004364013671875, -0.0031137466430664062, -0.0018634796142578125, -0.0006132125854492188, 0.000637054443359375, 0.0018873214721679688, 0.0031375885009765625, 0.004387855529785156, 0.00563812255859375, 0.006888389587402344, 0.008138656616210938, 0.009388923645019531, 0.010639190673828125, 0.011889457702636719, 0.013139724731445312, 0.014389991760253906, 0.0156402587890625, 0.016890525817871094, 0.018140792846679688, 0.01939105987548828, 0.020641326904296875, 0.02189159393310547, 0.023141860961914062, 0.024392127990722656, 0.02564239501953125, 0.026892662048339844, 0.028142929077148438, 0.02939319610595703, 0.030643463134765625, 0.03189373016357422, 0.03314399719238281, 0.034394264221191406, 0.03564453125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 9.0, 12.0, 9.0, 11.0, 20.0, 29.0, 33.0, 43.0, 80.0, 67.0, 103.0, 111.0, 120.0, 87.0, 68.0, 48.0, 39.0, 31.0, 21.0, 18.0, 11.0, 7.0, 5.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.043121337890625, -0.04190969467163086, -0.04069805145263672, -0.03948640823364258, -0.03827476501464844, -0.0370631217956543, -0.035851478576660156, -0.034639835357666016, -0.033428192138671875, -0.032216548919677734, -0.031004905700683594, -0.029793262481689453, -0.028581619262695312, -0.027369976043701172, -0.02615833282470703, -0.02494668960571289, -0.02373504638671875, -0.02252340316772461, -0.02131175994873047, -0.020100116729736328, -0.018888473510742188, -0.017676830291748047, -0.016465187072753906, -0.015253543853759766, -0.014041900634765625, -0.012830257415771484, -0.011618614196777344, -0.010406970977783203, -0.009195327758789062, -0.007983684539794922, -0.006772041320800781, -0.005560398101806641, -0.0043487548828125, -0.0031371116638183594, -0.0019254684448242188, -0.0007138252258300781, 0.0004978179931640625, 0.0017094612121582031, 0.0029211044311523438, 0.004132747650146484, 0.005344390869140625, 0.006556034088134766, 0.007767677307128906, 0.008979320526123047, 0.010190963745117188, 0.011402606964111328, 0.012614250183105469, 0.01382589340209961, 0.01503753662109375, 0.01624917984008789, 0.01746082305908203, 0.018672466278076172, 0.019884109497070312, 0.021095752716064453, 0.022307395935058594, 0.023519039154052734, 0.024730682373046875, 0.025942325592041016, 0.027153968811035156, 0.028365612030029297, 0.029577255249023438, 0.030788898468017578, 0.03200054168701172, 0.03321218490600586, 0.034423828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 19.0, 33.0, 80.0, 214.0, 299.0, 194.0, 89.0, 32.0, 13.0, 10.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3114013671875, -1.2755576372146606, -1.2397140264511108, -1.2038702964782715, -1.1680266857147217, -1.1321829557418823, -1.096339225769043, -1.0604956150054932, -1.0246518850326538, -0.9888082146644592, -0.9529645442962646, -0.9171208143234253, -0.8812771439552307, -0.8454334735870361, -0.8095898032188416, -0.773746132850647, -0.7379024624824524, -0.7020587921142578, -0.6662151217460632, -0.6303714513778687, -0.5945277214050293, -0.5586840510368347, -0.5228403806686401, -0.48699668049812317, -0.4511530101299286, -0.415309339761734, -0.37946563959121704, -0.34362196922302246, -0.3077782988548279, -0.2719345986843109, -0.23609092831611633, -0.20024722814559937, -0.16440361738204956, -0.1285599321126938, -0.09271625429391861, -0.05687257647514343, -0.02102889120578766, 0.014814794063568115, 0.050658464431762695, 0.08650216460227966, 0.12234583497047424, 0.15818952023983002, 0.1940332055091858, 0.22987687587738037, 0.26572054624557495, 0.3015642464160919, 0.3374079167842865, 0.37325161695480347, 0.40909528732299805, 0.4449389576911926, 0.4807826578617096, 0.5166263580322266, 0.5524700284004211, 0.5883136987686157, 0.6241573691368103, 0.6600010395050049, 0.6958447694778442, 0.7316884398460388, 0.7675321102142334, 0.8033758401870728, 0.8392195105552673, 0.8750631809234619, 0.9109068512916565, 0.9467505216598511, 0.9825941920280457]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 6.0, 15.0, 9.0, 28.0, 22.0, 21.0, 29.0, 39.0, 38.0, 56.0, 44.0, 66.0, 55.0, 49.0, 55.0, 56.0, 60.0, 47.0, 48.0, 38.0, 42.0, 40.0, 32.0, 20.0, 18.0, 10.0, 16.0, 12.0, 10.0, 4.0, 7.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7840007543563843, -0.759795069694519, -0.7355893850326538, -0.7113837003707886, -0.6871780157089233, -0.6629723906517029, -0.6387667059898376, -0.6145610213279724, -0.5903553366661072, -0.5661496520042419, -0.5419439673423767, -0.5177382826805115, -0.49353262782096863, -0.4693269431591034, -0.44512128829956055, -0.4209156036376953, -0.3967099189758301, -0.37250423431396484, -0.3482985496520996, -0.32409289479255676, -0.29988721013069153, -0.2756815254688263, -0.25147587060928345, -0.2272701859474182, -0.20306450128555298, -0.17885881662368774, -0.1546531468629837, -0.13044747710227966, -0.10624179244041443, -0.08203611522912979, -0.057830438017845154, -0.03362476825714111, -0.009419143199920654, 0.014786534011363983, 0.03899221122264862, 0.06319788843393326, 0.0874035656452179, 0.11160924285650253, 0.13581492006778717, 0.1600205898284912, 0.18422627449035645, 0.20843195915222168, 0.23263762891292572, 0.25684329867362976, 0.281048983335495, 0.30525466799736023, 0.3294603228569031, 0.3536660075187683, 0.37787169218063354, 0.4020773768424988, 0.426283061504364, 0.45048871636390686, 0.4746944010257721, 0.49890008568763733, 0.5231057405471802, 0.5473114252090454, 0.5715171098709106, 0.5957227945327759, 0.6199284791946411, 0.6441341638565063, 0.6683398485183716, 0.692545473575592, 0.7167511582374573, 0.7409568428993225, 0.7651625275611877]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 19.0, 20.0, 24.0, 50.0, 89.0, 127.0, 203.0, 382.0, 780.0, 1962.0, 6329.0, 49241.0, 3756744.0, 356029.0, 16803.0, 3418.0, 1112.0, 450.0, 218.0, 109.0, 56.0, 33.0, 26.0, 12.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.40673828125, -0.39765167236328125, -0.3885650634765625, -0.37947845458984375, -0.370391845703125, -0.36130523681640625, -0.3522186279296875, -0.34313201904296875, -0.33404541015625, -0.32495880126953125, -0.3158721923828125, -0.30678558349609375, -0.297698974609375, -0.28861236572265625, -0.2795257568359375, -0.27043914794921875, -0.2613525390625, -0.25226593017578125, -0.2431793212890625, -0.23409271240234375, -0.225006103515625, -0.21591949462890625, -0.2068328857421875, -0.19774627685546875, -0.18865966796875, -0.17957305908203125, -0.1704864501953125, -0.16139984130859375, -0.152313232421875, -0.14322662353515625, -0.1341400146484375, -0.12505340576171875, -0.115966796875, -0.10688018798828125, -0.0977935791015625, -0.08870697021484375, -0.079620361328125, -0.07053375244140625, -0.0614471435546875, -0.05236053466796875, -0.04327392578125, -0.03418731689453125, -0.0251007080078125, -0.01601409912109375, -0.006927490234375, 0.00215911865234375, 0.0112457275390625, 0.02033233642578125, 0.0294189453125, 0.03850555419921875, 0.0475921630859375, 0.05667877197265625, 0.065765380859375, 0.07485198974609375, 0.0839385986328125, 0.09302520751953125, 0.10211181640625, 0.11119842529296875, 0.1202850341796875, 0.12937164306640625, 0.138458251953125, 0.14754486083984375, 0.1566314697265625, 0.16571807861328125, 0.1748046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 11.0, 21.0, 29.0, 39.0, 66.0, 68.0, 87.0, 89.0, 110.0, 108.0, 87.0, 80.0, 43.0, 48.0, 37.0, 33.0, 13.0, 12.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.06988525390625, -0.06835556030273438, -0.06682586669921875, -0.06529617309570312, -0.0637664794921875, -0.062236785888671875, -0.06070709228515625, -0.059177398681640625, -0.057647705078125, -0.056118011474609375, -0.05458831787109375, -0.053058624267578125, -0.0515289306640625, -0.049999237060546875, -0.04846954345703125, -0.046939849853515625, -0.04541015625, -0.043880462646484375, -0.04235076904296875, -0.040821075439453125, -0.0392913818359375, -0.037761688232421875, -0.03623199462890625, -0.034702301025390625, -0.033172607421875, -0.031642913818359375, -0.03011322021484375, -0.028583526611328125, -0.0270538330078125, -0.025524139404296875, -0.02399444580078125, -0.022464752197265625, -0.02093505859375, -0.019405364990234375, -0.01787567138671875, -0.016345977783203125, -0.0148162841796875, -0.013286590576171875, -0.01175689697265625, -0.010227203369140625, -0.008697509765625, -0.007167816162109375, -0.00563812255859375, -0.004108428955078125, -0.0025787353515625, -0.001049041748046875, 0.00048065185546875, 0.002010345458984375, 0.0035400390625, 0.005069732666015625, 0.00659942626953125, 0.008129119873046875, 0.0096588134765625, 0.011188507080078125, 0.01271820068359375, 0.014247894287109375, 0.015777587890625, 0.017307281494140625, 0.01883697509765625, 0.020366668701171875, 0.0218963623046875, 0.023426055908203125, 0.02495574951171875, 0.026485443115234375, 0.02801513671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 2.0, 11.0, 10.0, 20.0, 32.0, 44.0, 68.0, 96.0, 209.0, 492.0, 1750.0, 9494.0, 2041139.0, 2129781.0, 8901.0, 1444.0, 431.0, 158.0, 84.0, 59.0, 20.0, 16.0, 4.0, 8.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59130859375, -0.5781688690185547, -0.5650291442871094, -0.5518894195556641, -0.5387496948242188, -0.5256099700927734, -0.5124702453613281, -0.4993305206298828, -0.4861907958984375, -0.4730510711669922, -0.4599113464355469, -0.44677162170410156, -0.43363189697265625, -0.42049217224121094, -0.4073524475097656, -0.3942127227783203, -0.381072998046875, -0.3679332733154297, -0.3547935485839844, -0.34165382385253906, -0.32851409912109375, -0.31537437438964844, -0.3022346496582031, -0.2890949249267578, -0.2759552001953125, -0.2628154754638672, -0.24967575073242188, -0.23653602600097656, -0.22339630126953125, -0.21025657653808594, -0.19711685180664062, -0.1839771270751953, -0.17083740234375, -0.1576976776123047, -0.14455795288085938, -0.13141822814941406, -0.11827850341796875, -0.10513877868652344, -0.09199905395507812, -0.07885932922363281, -0.0657196044921875, -0.05257987976074219, -0.039440155029296875, -0.026300430297851562, -0.01316070556640625, -2.09808349609375e-05, 0.013118743896484375, 0.026258468627929688, 0.039398193359375, 0.05253791809082031, 0.06567764282226562, 0.07881736755371094, 0.09195709228515625, 0.10509681701660156, 0.11823654174804688, 0.1313762664794922, 0.1445159912109375, 0.1576557159423828, 0.17079544067382812, 0.18393516540527344, 0.19707489013671875, 0.21021461486816406, 0.22335433959960938, 0.2364940643310547, 0.2496337890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 9.0, 10.0, 11.0, 32.0, 156.0, 1056.0, 2341.0, 344.0, 54.0, 22.0, 13.0, 10.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2281494140625, -0.2226123809814453, -0.21707534790039062, -0.21153831481933594, -0.20600128173828125, -0.20046424865722656, -0.19492721557617188, -0.1893901824951172, -0.1838531494140625, -0.1783161163330078, -0.17277908325195312, -0.16724205017089844, -0.16170501708984375, -0.15616798400878906, -0.15063095092773438, -0.1450939178466797, -0.139556884765625, -0.1340198516845703, -0.12848281860351562, -0.12294578552246094, -0.11740875244140625, -0.11187171936035156, -0.10633468627929688, -0.10079765319824219, -0.0952606201171875, -0.08972358703613281, -0.08418655395507812, -0.07864952087402344, -0.07311248779296875, -0.06757545471191406, -0.062038421630859375, -0.05650138854980469, -0.05096435546875, -0.04542732238769531, -0.039890289306640625, -0.03435325622558594, -0.02881622314453125, -0.023279190063476562, -0.017742156982421875, -0.012205123901367188, -0.0066680908203125, -0.0011310577392578125, 0.004405975341796875, 0.009943008422851562, 0.01548004150390625, 0.021017074584960938, 0.026554107666015625, 0.03209114074707031, 0.037628173828125, 0.04316520690917969, 0.048702239990234375, 0.05423927307128906, 0.05977630615234375, 0.06531333923339844, 0.07085037231445312, 0.07638740539550781, 0.0819244384765625, 0.08746147155761719, 0.09299850463867188, 0.09853553771972656, 0.10407257080078125, 0.10960960388183594, 0.11514663696289062, 0.12068367004394531, 0.126220703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 7.0, 6.0, 17.0, 148.0, 509.0, 266.0, 40.0, 15.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0064046382904053, -1.9675244092941284, -1.9286441802978516, -1.8897640705108643, -1.8508838415145874, -1.8120036125183105, -1.7731233835220337, -1.7342431545257568, -1.6953630447387695, -1.6564828157424927, -1.6176025867462158, -1.5787224769592285, -1.5398422479629517, -1.5009620189666748, -1.462081789970398, -1.423201560974121, -1.3843213319778442, -1.3454411029815674, -1.3065608739852905, -1.2676807641983032, -1.2288005352020264, -1.1899203062057495, -1.1510400772094727, -1.1121598482131958, -1.073279619216919, -1.034399390220642, -0.99551922082901, -0.9566389918327332, -0.9177588224411011, -0.8788785934448242, -0.8399983644485474, -0.8011181354522705, -0.762238085269928, -0.7233578562736511, -0.684477686882019, -0.6455974578857422, -0.6067172288894653, -0.5678370594978333, -0.5289568305015564, -0.49007663130760193, -0.45119643211364746, -0.412316232919693, -0.3734360337257385, -0.33455580472946167, -0.2956756055355072, -0.25679540634155273, -0.21791519224643707, -0.1790349781513214, -0.14015477895736694, -0.10127457231283188, -0.062394365668296814, -0.02351415902376175, 0.015366047620773315, 0.05424624681472778, 0.09312646090984344, 0.1320066750049591, 0.17088687419891357, 0.20976707339286804, 0.2486472874879837, 0.28752750158309937, 0.32640770077705383, 0.3652878999710083, 0.40416812896728516, 0.4430483281612396, 0.4819285273551941]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 10.0, 10.0, 21.0, 46.0, 34.0, 47.0, 87.0, 87.0, 100.0, 123.0, 97.0, 106.0, 73.0, 59.0, 38.0, 25.0, 15.0, 17.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4835076332092285, -0.46717312932014465, -0.4508385956287384, -0.43450409173965454, -0.4181695580482483, -0.40183505415916443, -0.38550055027008057, -0.3691660165786743, -0.35283151268959045, -0.3364970088005066, -0.32016247510910034, -0.3038279712200165, -0.2874934673309326, -0.27115893363952637, -0.2548244297504425, -0.23848991096019745, -0.2221553921699524, -0.20582087337970734, -0.18948635458946228, -0.17315185070037842, -0.15681733191013336, -0.1404828131198883, -0.12414830178022385, -0.10781379044055939, -0.09147927165031433, -0.07514475286006927, -0.058810241520404816, -0.04247572645545006, -0.0261412113904953, -0.009806692600250244, 0.006527818739414215, 0.022862330079078674, 0.039196908473968506, 0.055531423538923264, 0.07186593860387802, 0.08820044994354248, 0.10453496873378754, 0.12086948752403259, 0.13720399141311646, 0.1535385102033615, 0.16987302899360657, 0.18620754778385162, 0.20254206657409668, 0.21887657046318054, 0.2352110892534256, 0.25154560804367065, 0.2678801119327545, 0.2842146158218384, 0.30054914951324463, 0.3168836534023285, 0.33321818709373474, 0.3495526909828186, 0.36588722467422485, 0.3822217285633087, 0.3985562324523926, 0.41489076614379883, 0.4312252700328827, 0.44755977392196655, 0.4638943076133728, 0.48022881150245667, 0.4965633153915405, 0.5128978490829468, 0.529232382774353, 0.5455668568611145, 0.5619013905525208]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 11.0, 11.0, 20.0, 21.0, 18.0, 41.0, 48.0, 80.0, 111.0, 182.0, 338.0, 587.0, 1275.0, 3526.0, 12190.0, 75154.0, 644473.0, 271333.0, 28365.0, 6536.0, 2128.0, 942.0, 429.0, 239.0, 152.0, 109.0, 70.0, 38.0, 27.0, 24.0, 12.0, 11.0, 10.0, 11.0, 2.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1602783203125, -0.15538597106933594, -0.15049362182617188, -0.1456012725830078, -0.14070892333984375, -0.1358165740966797, -0.13092422485351562, -0.12603187561035156, -0.1211395263671875, -0.11624717712402344, -0.11135482788085938, -0.10646247863769531, -0.10157012939453125, -0.09667778015136719, -0.09178543090820312, -0.08689308166503906, -0.082000732421875, -0.07710838317871094, -0.07221603393554688, -0.06732368469238281, -0.06243133544921875, -0.05753898620605469, -0.052646636962890625, -0.04775428771972656, -0.0428619384765625, -0.03796958923339844, -0.033077239990234375, -0.028184890747070312, -0.02329254150390625, -0.018400192260742188, -0.013507843017578125, -0.008615493774414062, -0.00372314453125, 0.0011692047119140625, 0.006061553955078125, 0.010953903198242188, 0.01584625244140625, 0.020738601684570312, 0.025630950927734375, 0.030523300170898438, 0.0354156494140625, 0.04030799865722656, 0.045200347900390625, 0.05009269714355469, 0.05498504638671875, 0.05987739562988281, 0.06476974487304688, 0.06966209411621094, 0.074554443359375, 0.07944679260253906, 0.08433914184570312, 0.08923149108886719, 0.09412384033203125, 0.09901618957519531, 0.10390853881835938, 0.10880088806152344, 0.1136932373046875, 0.11858558654785156, 0.12347793579101562, 0.1283702850341797, 0.13326263427734375, 0.1381549835205078, 0.14304733276367188, 0.14793968200683594, 0.15283203125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 22.0, 44.0, 64.0, 83.0, 110.0, 146.0, 126.0, 114.0, 104.0, 58.0, 49.0, 33.0, 14.0, 11.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0733642578125, -0.07149171829223633, -0.06961917877197266, -0.06774663925170898, -0.06587409973144531, -0.06400156021118164, -0.06212902069091797, -0.0602564811706543, -0.058383941650390625, -0.05651140213012695, -0.05463886260986328, -0.05276632308959961, -0.05089378356933594, -0.049021244049072266, -0.047148704528808594, -0.04527616500854492, -0.04340362548828125, -0.04153108596801758, -0.039658546447753906, -0.037786006927490234, -0.03591346740722656, -0.03404092788696289, -0.03216838836669922, -0.030295848846435547, -0.028423309326171875, -0.026550769805908203, -0.02467823028564453, -0.02280569076538086, -0.020933151245117188, -0.019060611724853516, -0.017188072204589844, -0.015315532684326172, -0.0134429931640625, -0.011570453643798828, -0.009697914123535156, -0.007825374603271484, -0.0059528350830078125, -0.004080295562744141, -0.0022077560424804688, -0.0003352165222167969, 0.001537322998046875, 0.003409862518310547, 0.005282402038574219, 0.007154941558837891, 0.009027481079101562, 0.010900020599365234, 0.012772560119628906, 0.014645099639892578, 0.01651763916015625, 0.018390178680419922, 0.020262718200683594, 0.022135257720947266, 0.024007797241210938, 0.02588033676147461, 0.02775287628173828, 0.029625415802001953, 0.031497955322265625, 0.0333704948425293, 0.03524303436279297, 0.03711557388305664, 0.03898811340332031, 0.040860652923583984, 0.042733192443847656, 0.04460573196411133, 0.046478271484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 17.0, 24.0, 25.0, 45.0, 69.0, 119.0, 190.0, 382.0, 820.0, 2203.0, 6998.0, 30546.0, 199915.0, 610248.0, 162114.0, 25407.0, 5928.0, 1876.0, 765.0, 358.0, 210.0, 98.0, 66.0, 46.0, 28.0, 17.0, 7.0, 13.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07763671875, -0.07470130920410156, -0.07176589965820312, -0.06883049011230469, -0.06589508056640625, -0.06295967102050781, -0.060024261474609375, -0.05708885192871094, -0.0541534423828125, -0.05121803283691406, -0.048282623291015625, -0.04534721374511719, -0.04241180419921875, -0.03947639465332031, -0.036540985107421875, -0.03360557556152344, -0.030670166015625, -0.027734756469726562, -0.024799346923828125, -0.021863937377929688, -0.01892852783203125, -0.015993118286132812, -0.013057708740234375, -0.010122299194335938, -0.0071868896484375, -0.0042514801025390625, -0.001316070556640625, 0.0016193389892578125, 0.00455474853515625, 0.0074901580810546875, 0.010425567626953125, 0.013360977172851562, 0.01629638671875, 0.019231796264648438, 0.022167205810546875, 0.025102615356445312, 0.02803802490234375, 0.030973434448242188, 0.033908843994140625, 0.03684425354003906, 0.0397796630859375, 0.04271507263183594, 0.045650482177734375, 0.04858589172363281, 0.05152130126953125, 0.05445671081542969, 0.057392120361328125, 0.06032752990722656, 0.063262939453125, 0.06619834899902344, 0.06913375854492188, 0.07206916809082031, 0.07500457763671875, 0.07793998718261719, 0.08087539672851562, 0.08381080627441406, 0.0867462158203125, 0.08968162536621094, 0.09261703491210938, 0.09555244445800781, 0.09848785400390625, 0.10142326354980469, 0.10435867309570312, 0.10729408264160156, 0.1102294921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 7.0, 12.0, 8.0, 9.0, 20.0, 25.0, 29.0, 27.0, 46.0, 54.0, 47.0, 60.0, 54.0, 73.0, 59.0, 70.0, 60.0, 63.0, 59.0, 40.0, 49.0, 32.0, 33.0, 19.0, 17.0, 7.0, 9.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11090087890625, -0.10695743560791016, -0.10301399230957031, -0.09907054901123047, -0.09512710571289062, -0.09118366241455078, -0.08724021911621094, -0.0832967758178711, -0.07935333251953125, -0.0754098892211914, -0.07146644592285156, -0.06752300262451172, -0.06357955932617188, -0.05963611602783203, -0.05569267272949219, -0.051749229431152344, -0.0478057861328125, -0.043862342834472656, -0.03991889953613281, -0.03597545623779297, -0.032032012939453125, -0.02808856964111328, -0.024145126342773438, -0.020201683044433594, -0.01625823974609375, -0.012314796447753906, -0.008371353149414062, -0.004427909851074219, -0.000484466552734375, 0.0034589767456054688, 0.0074024200439453125, 0.011345863342285156, 0.015289306640625, 0.019232749938964844, 0.023176193237304688, 0.02711963653564453, 0.031063079833984375, 0.03500652313232422, 0.03894996643066406, 0.042893409729003906, 0.04683685302734375, 0.050780296325683594, 0.05472373962402344, 0.05866718292236328, 0.06261062622070312, 0.06655406951904297, 0.07049751281738281, 0.07444095611572266, 0.0783843994140625, 0.08232784271240234, 0.08627128601074219, 0.09021472930908203, 0.09415817260742188, 0.09810161590576172, 0.10204505920410156, 0.1059885025024414, 0.10993194580078125, 0.1138753890991211, 0.11781883239746094, 0.12176227569580078, 0.12570571899414062, 0.12964916229248047, 0.1335926055908203, 0.13753604888916016, 0.1414794921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 4.0, 12.0, 25.0, 29.0, 39.0, 58.0, 81.0, 114.0, 162.0, 252.0, 409.0, 708.0, 1314.0, 2670.0, 6784.0, 19892.0, 70386.0, 231300.0, 396186.0, 220958.0, 66160.0, 18751.0, 6388.0, 2679.0, 1244.0, 781.0, 389.0, 263.0, 167.0, 98.0, 69.0, 36.0, 31.0, 25.0, 23.0, 15.0, 5.0, 4.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0301055908203125, -0.029206275939941406, -0.028306961059570312, -0.02740764617919922, -0.026508331298828125, -0.02560901641845703, -0.024709701538085938, -0.023810386657714844, -0.02291107177734375, -0.022011756896972656, -0.021112442016601562, -0.02021312713623047, -0.019313812255859375, -0.01841449737548828, -0.017515182495117188, -0.016615867614746094, -0.015716552734375, -0.014817237854003906, -0.013917922973632812, -0.013018608093261719, -0.012119293212890625, -0.011219978332519531, -0.010320663452148438, -0.009421348571777344, -0.00852203369140625, -0.007622718811035156, -0.0067234039306640625, -0.005824089050292969, -0.004924774169921875, -0.004025459289550781, -0.0031261444091796875, -0.0022268295288085938, -0.0013275146484375, -0.00042819976806640625, 0.0004711151123046875, 0.0013704299926757812, 0.002269744873046875, 0.0031690597534179688, 0.0040683746337890625, 0.004967689514160156, 0.00586700439453125, 0.006766319274902344, 0.0076656341552734375, 0.008564949035644531, 0.009464263916015625, 0.010363578796386719, 0.011262893676757812, 0.012162208557128906, 0.0130615234375, 0.013960838317871094, 0.014860153198242188, 0.01575946807861328, 0.016658782958984375, 0.01755809783935547, 0.018457412719726562, 0.019356727600097656, 0.02025604248046875, 0.021155357360839844, 0.022054672241210938, 0.02295398712158203, 0.023853302001953125, 0.02475261688232422, 0.025651931762695312, 0.026551246643066406, 0.0274505615234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 13.0, 27.0, 22.0, 48.0, 105.0, 137.0, 156.0, 152.0, 102.0, 89.0, 59.0, 34.0, 24.0, 18.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0002598762512207031, -0.0002535395324230194, -0.0002472028136253357, -0.00024086609482765198, -0.00023452937602996826, -0.00022819265723228455, -0.00022185593843460083, -0.00021551921963691711, -0.0002091825008392334, -0.00020284578204154968, -0.00019650906324386597, -0.00019017234444618225, -0.00018383562564849854, -0.00017749890685081482, -0.0001711621880531311, -0.0001648254692554474, -0.00015848875045776367, -0.00015215203166007996, -0.00014581531286239624, -0.00013947859406471252, -0.0001331418752670288, -0.0001268051564693451, -0.00012046843767166138, -0.00011413171887397766, -0.00010779500007629395, -0.00010145828127861023, -9.512156248092651e-05, -8.87848436832428e-05, -8.244812488555908e-05, -7.611140608787537e-05, -6.977468729019165e-05, -6.343796849250793e-05, -5.710124969482422e-05, -5.07645308971405e-05, -4.442781209945679e-05, -3.809109330177307e-05, -3.1754374504089355e-05, -2.541765570640564e-05, -1.9080936908721924e-05, -1.2744218111038208e-05, -6.407499313354492e-06, -7.078051567077637e-08, 6.2659382820129395e-06, 1.2602657079696655e-05, 1.893937587738037e-05, 2.5276094675064087e-05, 3.16128134727478e-05, 3.794953227043152e-05, 4.4286251068115234e-05, 5.062296986579895e-05, 5.6959688663482666e-05, 6.329640746116638e-05, 6.96331262588501e-05, 7.596984505653381e-05, 8.230656385421753e-05, 8.864328265190125e-05, 9.498000144958496e-05, 0.00010131672024726868, 0.00010765343904495239, 0.00011399015784263611, 0.00012032687664031982, 0.00012666359543800354, 0.00013300031423568726, 0.00013933703303337097, 0.0001456737518310547]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 10.0, 16.0, 31.0, 29.0, 78.0, 87.0, 137.0, 274.0, 417.0, 836.0, 1591.0, 3709.0, 10494.0, 36698.0, 142002.0, 396479.0, 321703.0, 95875.0, 24864.0, 7473.0, 2845.0, 1241.0, 677.0, 391.0, 211.0, 131.0, 85.0, 50.0, 37.0, 18.0, 11.0, 11.0, 11.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027679443359375, -0.026685714721679688, -0.025691986083984375, -0.024698257446289062, -0.02370452880859375, -0.022710800170898438, -0.021717071533203125, -0.020723342895507812, -0.0197296142578125, -0.018735885620117188, -0.017742156982421875, -0.016748428344726562, -0.01575469970703125, -0.014760971069335938, -0.013767242431640625, -0.012773513793945312, -0.01177978515625, -0.010786056518554688, -0.009792327880859375, -0.008798599243164062, -0.00780487060546875, -0.0068111419677734375, -0.005817413330078125, -0.0048236846923828125, -0.0038299560546875, -0.0028362274169921875, -0.001842498779296875, -0.0008487701416015625, 0.00014495849609375, 0.0011386871337890625, 0.002132415771484375, 0.0031261444091796875, 0.004119873046875, 0.0051136016845703125, 0.006107330322265625, 0.0071010589599609375, 0.00809478759765625, 0.009088516235351562, 0.010082244873046875, 0.011075973510742188, 0.0120697021484375, 0.013063430786132812, 0.014057159423828125, 0.015050888061523438, 0.01604461669921875, 0.017038345336914062, 0.018032073974609375, 0.019025802612304688, 0.02001953125, 0.021013259887695312, 0.022006988525390625, 0.023000717163085938, 0.02399444580078125, 0.024988174438476562, 0.025981903076171875, 0.026975631713867188, 0.0279693603515625, 0.028963088989257812, 0.029956817626953125, 0.030950546264648438, 0.03194427490234375, 0.03293800354003906, 0.033931732177734375, 0.03492546081542969, 0.035919189453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 8.0, 11.0, 8.0, 12.0, 12.0, 26.0, 44.0, 60.0, 65.0, 89.0, 101.0, 108.0, 117.0, 91.0, 65.0, 56.0, 46.0, 22.0, 21.0, 20.0, 8.0, 6.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0450439453125, -0.04377412796020508, -0.042504310607910156, -0.041234493255615234, -0.03996467590332031, -0.03869485855102539, -0.03742504119873047, -0.03615522384643555, -0.034885406494140625, -0.0336155891418457, -0.03234577178955078, -0.03107595443725586, -0.029806137084960938, -0.028536319732666016, -0.027266502380371094, -0.025996685028076172, -0.02472686767578125, -0.023457050323486328, -0.022187232971191406, -0.020917415618896484, -0.019647598266601562, -0.01837778091430664, -0.01710796356201172, -0.015838146209716797, -0.014568328857421875, -0.013298511505126953, -0.012028694152832031, -0.01075887680053711, -0.009489059448242188, -0.008219242095947266, -0.006949424743652344, -0.005679607391357422, -0.0044097900390625, -0.003139972686767578, -0.0018701553344726562, -0.0006003379821777344, 0.0006694793701171875, 0.0019392967224121094, 0.0032091140747070312, 0.004478931427001953, 0.005748748779296875, 0.007018566131591797, 0.008288383483886719, 0.00955820083618164, 0.010828018188476562, 0.012097835540771484, 0.013367652893066406, 0.014637470245361328, 0.01590728759765625, 0.017177104949951172, 0.018446922302246094, 0.019716739654541016, 0.020986557006835938, 0.02225637435913086, 0.02352619171142578, 0.024796009063720703, 0.026065826416015625, 0.027335643768310547, 0.02860546112060547, 0.02987527847290039, 0.031145095825195312, 0.032414913177490234, 0.033684730529785156, 0.03495454788208008, 0.036224365234375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 9.0, 7.0, 14.0, 10.0, 29.0, 39.0, 51.0, 86.0, 111.0, 121.0, 129.0, 111.0, 84.0, 61.0, 41.0, 19.0, 24.0, 12.0, 9.0, 14.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2958724796772003, -0.28334495425224304, -0.2708173990249634, -0.2582898736000061, -0.24576234817504883, -0.23323480784893036, -0.2207072675228119, -0.20817974209785461, -0.19565220177173615, -0.18312466144561768, -0.1705971360206604, -0.15806959569454193, -0.14554205536842346, -0.1330145299434662, -0.12048698961734772, -0.10795945674180984, -0.09543192386627197, -0.0829043909907341, -0.07037685811519623, -0.05784931778907776, -0.045321784913539886, -0.032794252038002014, -0.020266711711883545, -0.007739178836345673, 0.0047883540391922, 0.01731588877737522, 0.029843423515558243, 0.042370960116386414, 0.054898492991924286, 0.06742602586746216, 0.07995356619358063, 0.0924810990691185, 0.10500866174697876, 0.11753619462251663, 0.1300637274980545, 0.14259126782417297, 0.15511879324913025, 0.16764633357524872, 0.1801738739013672, 0.19270139932632446, 0.20522893965244293, 0.2177564799785614, 0.23028400540351868, 0.24281154572963715, 0.2553390860557556, 0.2678666114807129, 0.28039413690567017, 0.29292169213294983, 0.3054492175579071, 0.3179767429828644, 0.33050429821014404, 0.3430318236351013, 0.3555593490600586, 0.36808687448501587, 0.38061442971229553, 0.3931419551372528, 0.40566951036453247, 0.41819703578948975, 0.4307245910167694, 0.4432521164417267, 0.45577964186668396, 0.4683071970939636, 0.4808347225189209, 0.4933622479438782, 0.5058897733688354]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 13.0, 12.0, 10.0, 18.0, 32.0, 21.0, 35.0, 38.0, 42.0, 48.0, 44.0, 59.0, 80.0, 73.0, 69.0, 74.0, 57.0, 43.0, 43.0, 36.0, 27.0, 35.0, 28.0, 15.0, 21.0, 12.0, 3.0, 7.0, 9.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7188037037849426, -0.6966787576675415, -0.6745538711547852, -0.652428925037384, -0.6303039789199829, -0.6081790924072266, -0.5860541462898254, -0.5639292001724243, -0.541804313659668, -0.5196793675422668, -0.4975544512271881, -0.4754295349121094, -0.45330458879470825, -0.4311796724796295, -0.4090547561645508, -0.38692981004714966, -0.36480486392974854, -0.3426799476146698, -0.3205550014972687, -0.29843008518218994, -0.2763051390647888, -0.2541802227497101, -0.23205530643463135, -0.20993037521839142, -0.1878054440021515, -0.16568051278591156, -0.14355558156967163, -0.1214306652545929, -0.09930573403835297, -0.07718080282211304, -0.0550558865070343, -0.03293095529079437, -0.010805964469909668, 0.011318963021039963, 0.033443890511989594, 0.055568814277648926, 0.07769374549388885, 0.09981867671012878, 0.12194359302520752, 0.14406852424144745, 0.16619345545768738, 0.1883183866739273, 0.21044331789016724, 0.23256823420524597, 0.2546931505203247, 0.27681809663772583, 0.29894301295280457, 0.3210679292678833, 0.3431928753852844, 0.36531779170036316, 0.3874427378177643, 0.409567654132843, 0.43169260025024414, 0.4538175165653229, 0.4759424328804016, 0.49806737899780273, 0.5201922655105591, 0.5423172116279602, 0.5644420981407166, 0.5865670442581177, 0.6086919903755188, 0.6308169364929199, 0.6529418230056763, 0.6750667691230774, 0.6971917152404785]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 18.0, 31.0, 58.0, 105.0, 206.0, 433.0, 1491.0, 13037.0, 3948013.0, 225174.0, 4398.0, 759.0, 264.0, 130.0, 62.0, 32.0, 26.0, 11.0, 15.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.422607421875, -0.4127349853515625, -0.402862548828125, -0.3929901123046875, -0.38311767578125, -0.3732452392578125, -0.363372802734375, -0.3535003662109375, -0.3436279296875, -0.3337554931640625, -0.323883056640625, -0.3140106201171875, -0.30413818359375, -0.2942657470703125, -0.284393310546875, -0.2745208740234375, -0.2646484375, -0.2547760009765625, -0.244903564453125, -0.2350311279296875, -0.22515869140625, -0.2152862548828125, -0.205413818359375, -0.1955413818359375, -0.1856689453125, -0.1757965087890625, -0.165924072265625, -0.1560516357421875, -0.14617919921875, -0.1363067626953125, -0.126434326171875, -0.1165618896484375, -0.106689453125, -0.0968170166015625, -0.086944580078125, -0.0770721435546875, -0.06719970703125, -0.0573272705078125, -0.047454833984375, -0.0375823974609375, -0.0277099609375, -0.0178375244140625, -0.007965087890625, 0.0019073486328125, 0.01177978515625, 0.0216522216796875, 0.031524658203125, 0.0413970947265625, 0.05126953125, 0.0611419677734375, 0.071014404296875, 0.0808868408203125, 0.09075927734375, 0.1006317138671875, 0.110504150390625, 0.1203765869140625, 0.1302490234375, 0.1401214599609375, 0.149993896484375, 0.1598663330078125, 0.16973876953125, 0.1796112060546875, 0.189483642578125, 0.1993560791015625, 0.209228515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 9.0, 14.0, 32.0, 56.0, 63.0, 93.0, 111.0, 97.0, 101.0, 109.0, 109.0, 78.0, 45.0, 30.0, 18.0, 12.0, 9.0, 8.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07269287109375, -0.0709691047668457, -0.0692453384399414, -0.06752157211303711, -0.06579780578613281, -0.06407403945922852, -0.06235027313232422, -0.06062650680541992, -0.058902740478515625, -0.05717897415161133, -0.05545520782470703, -0.053731441497802734, -0.05200767517089844, -0.05028390884399414, -0.048560142517089844, -0.04683637619018555, -0.04511260986328125, -0.04338884353637695, -0.041665077209472656, -0.03994131088256836, -0.03821754455566406, -0.036493778228759766, -0.03477001190185547, -0.03304624557495117, -0.031322479248046875, -0.029598712921142578, -0.02787494659423828, -0.026151180267333984, -0.024427413940429688, -0.02270364761352539, -0.020979881286621094, -0.019256114959716797, -0.0175323486328125, -0.015808582305908203, -0.014084815979003906, -0.01236104965209961, -0.010637283325195312, -0.008913516998291016, -0.007189750671386719, -0.005465984344482422, -0.003742218017578125, -0.002018451690673828, -0.00029468536376953125, 0.0014290809631347656, 0.0031528472900390625, 0.004876613616943359, 0.006600379943847656, 0.008324146270751953, 0.01004791259765625, 0.011771678924560547, 0.013495445251464844, 0.01521921157836914, 0.016942977905273438, 0.018666744232177734, 0.02039051055908203, 0.022114276885986328, 0.023838043212890625, 0.025561809539794922, 0.02728557586669922, 0.029009342193603516, 0.030733108520507812, 0.03245687484741211, 0.034180641174316406, 0.0359044075012207, 0.037628173828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 10.0, 9.0, 9.0, 19.0, 19.0, 42.0, 57.0, 72.0, 138.0, 325.0, 919.0, 3276.0, 20410.0, 427059.0, 3623195.0, 105912.0, 9547.0, 1905.0, 629.0, 260.0, 150.0, 106.0, 63.0, 52.0, 29.0, 21.0, 15.0, 18.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146484375, -0.1423358917236328, -0.13818740844726562, -0.13403892517089844, -0.12989044189453125, -0.12574195861816406, -0.12159347534179688, -0.11744499206542969, -0.1132965087890625, -0.10914802551269531, -0.10499954223632812, -0.10085105895996094, -0.09670257568359375, -0.09255409240722656, -0.08840560913085938, -0.08425712585449219, -0.080108642578125, -0.07596015930175781, -0.07181167602539062, -0.06766319274902344, -0.06351470947265625, -0.05936622619628906, -0.055217742919921875, -0.05106925964355469, -0.0469207763671875, -0.04277229309082031, -0.038623809814453125, -0.03447532653808594, -0.03032684326171875, -0.026178359985351562, -0.022029876708984375, -0.017881393432617188, -0.01373291015625, -0.009584426879882812, -0.005435943603515625, -0.0012874603271484375, 0.00286102294921875, 0.0070095062255859375, 0.011157989501953125, 0.015306472778320312, 0.0194549560546875, 0.023603439331054688, 0.027751922607421875, 0.03190040588378906, 0.03604888916015625, 0.04019737243652344, 0.044345855712890625, 0.04849433898925781, 0.052642822265625, 0.05679130554199219, 0.060939788818359375, 0.06508827209472656, 0.06923675537109375, 0.07338523864746094, 0.07753372192382812, 0.08168220520019531, 0.0858306884765625, 0.08997917175292969, 0.09412765502929688, 0.09827613830566406, 0.10242462158203125, 0.10657310485839844, 0.11072158813476562, 0.11487007141113281, 0.1190185546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 5.0, 11.0, 13.0, 43.0, 96.0, 235.0, 835.0, 1795.0, 673.0, 194.0, 98.0, 33.0, 17.0, 14.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03125, -0.029338836669921875, -0.02742767333984375, -0.025516510009765625, -0.0236053466796875, -0.021694183349609375, -0.01978302001953125, -0.017871856689453125, -0.015960693359375, -0.014049530029296875, -0.01213836669921875, -0.010227203369140625, -0.0083160400390625, -0.006404876708984375, -0.00449371337890625, -0.002582550048828125, -0.00067138671875, 0.001239776611328125, 0.00315093994140625, 0.005062103271484375, 0.0069732666015625, 0.008884429931640625, 0.01079559326171875, 0.012706756591796875, 0.014617919921875, 0.016529083251953125, 0.01844024658203125, 0.020351409912109375, 0.0222625732421875, 0.024173736572265625, 0.02608489990234375, 0.027996063232421875, 0.0299072265625, 0.031818389892578125, 0.03372955322265625, 0.035640716552734375, 0.0375518798828125, 0.039463043212890625, 0.04137420654296875, 0.043285369873046875, 0.045196533203125, 0.047107696533203125, 0.04901885986328125, 0.050930023193359375, 0.0528411865234375, 0.054752349853515625, 0.05666351318359375, 0.058574676513671875, 0.06048583984375, 0.062397003173828125, 0.06430816650390625, 0.06621932983398438, 0.0681304931640625, 0.07004165649414062, 0.07195281982421875, 0.07386398315429688, 0.075775146484375, 0.07768630981445312, 0.07959747314453125, 0.08150863647460938, 0.0834197998046875, 0.08533096313476562, 0.08724212646484375, 0.08915328979492188, 0.091064453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 28.0, 149.0, 345.0, 316.0, 117.0, 27.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4395594596862793, -0.4218272864818573, -0.4040951430797577, -0.3863629698753357, -0.3686308264732361, -0.3508986532688141, -0.3331664800643921, -0.3154343366622925, -0.2977021634578705, -0.2799699902534485, -0.2622378468513489, -0.24450567364692688, -0.22677351534366608, -0.20904135704040527, -0.19130918383598328, -0.17357702553272247, -0.15584486722946167, -0.13811270892620087, -0.12038054317235947, -0.10264837741851807, -0.08491621911525726, -0.06718406081199646, -0.04945189505815506, -0.03171972930431366, -0.013987571001052856, 0.0037445910274982452, 0.021476753056049347, 0.03920891508460045, 0.05694107711315155, 0.07467323541641235, 0.09240540117025375, 0.11013756692409515, 0.12786966562271118, 0.14560182392597198, 0.1633339822292328, 0.18106615543365479, 0.1987983137369156, 0.2165304720401764, 0.2342626452445984, 0.251994788646698, 0.26972696185112, 0.287459135055542, 0.3051912784576416, 0.3229234516620636, 0.3406556248664856, 0.3583877682685852, 0.3761199414730072, 0.3938521146774292, 0.4115842580795288, 0.4293164312839508, 0.4470485746860504, 0.4647807478904724, 0.482512891292572, 0.5002450942993164, 0.517977237701416, 0.5357093811035156, 0.5534415245056152, 0.5711736679077148, 0.5889058709144592, 0.6066380143165588, 0.6243701577186584, 0.6421023607254028, 0.6598345041275024, 0.677566647529602, 0.6952988505363464]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 8.0, 22.0, 23.0, 35.0, 45.0, 58.0, 64.0, 71.0, 109.0, 83.0, 87.0, 77.0, 69.0, 59.0, 40.0, 52.0, 28.0, 18.0, 14.0, 12.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24046534299850464, -0.23315586149692535, -0.22584636509418488, -0.2185368835926056, -0.2112274020910263, -0.20391792058944702, -0.19660842418670654, -0.18929894268512726, -0.18198946118354797, -0.1746799796819687, -0.1673704832792282, -0.16006100177764893, -0.15275152027606964, -0.14544203877449036, -0.13813254237174988, -0.1308230608701706, -0.12351356446743011, -0.11620407551527023, -0.10889459401369095, -0.10158510506153107, -0.09427562355995178, -0.0869661346077919, -0.07965664565563202, -0.07234716415405273, -0.06503767520189285, -0.05772818997502327, -0.050418704748153687, -0.043109215795993805, -0.03579973056912422, -0.02849024534225464, -0.021180756390094757, -0.013871271163225174, -0.006561785936355591, 0.0007477002218365669, 0.008057186380028725, 0.015366673469543457, 0.02267615869641304, 0.029985643923282623, 0.037295132875442505, 0.04460461810231209, 0.05191410332918167, 0.059223588556051254, 0.06653307378292084, 0.07384256273508072, 0.0811520516872406, 0.08846153318881989, 0.09577102214097977, 0.10308051109313965, 0.11038999259471893, 0.11769948154687881, 0.1250089704990387, 0.13231845200061798, 0.13962793350219727, 0.14693742990493774, 0.15424691140651703, 0.1615563929080963, 0.1688658893108368, 0.17617537081241608, 0.18348486721515656, 0.19079434871673584, 0.19810383021831512, 0.2054133117198944, 0.2127228081226349, 0.22003228962421417, 0.22734177112579346]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 18.0, 29.0, 45.0, 56.0, 98.0, 186.0, 364.0, 875.0, 2379.0, 8914.0, 83309.0, 734752.0, 196322.0, 15511.0, 3463.0, 1207.0, 502.0, 206.0, 118.0, 61.0, 40.0, 28.0, 11.0, 14.0, 12.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1463623046875, -0.14142608642578125, -0.1364898681640625, -0.13155364990234375, -0.126617431640625, -0.12168121337890625, -0.1167449951171875, -0.11180877685546875, -0.10687255859375, -0.10193634033203125, -0.0970001220703125, -0.09206390380859375, -0.087127685546875, -0.08219146728515625, -0.0772552490234375, -0.07231903076171875, -0.0673828125, -0.06244659423828125, -0.0575103759765625, -0.05257415771484375, -0.047637939453125, -0.04270172119140625, -0.0377655029296875, -0.03282928466796875, -0.02789306640625, -0.02295684814453125, -0.0180206298828125, -0.01308441162109375, -0.008148193359375, -0.00321197509765625, 0.0017242431640625, 0.00666046142578125, 0.0115966796875, 0.01653289794921875, 0.0214691162109375, 0.02640533447265625, 0.031341552734375, 0.03627777099609375, 0.0412139892578125, 0.04615020751953125, 0.05108642578125, 0.05602264404296875, 0.0609588623046875, 0.06589508056640625, 0.070831298828125, 0.07576751708984375, 0.0807037353515625, 0.08563995361328125, 0.090576171875, 0.09551239013671875, 0.1004486083984375, 0.10538482666015625, 0.110321044921875, 0.11525726318359375, 0.1201934814453125, 0.12512969970703125, 0.13006591796875, 0.13500213623046875, 0.1399383544921875, 0.14487457275390625, 0.149810791015625, 0.15474700927734375, 0.1596832275390625, 0.16461944580078125, 0.1695556640625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 27.0, 36.0, 54.0, 77.0, 87.0, 103.0, 121.0, 108.0, 111.0, 81.0, 68.0, 55.0, 19.0, 17.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07427978515625, -0.07258176803588867, -0.07088375091552734, -0.06918573379516602, -0.06748771667480469, -0.06578969955444336, -0.06409168243408203, -0.0623936653137207, -0.060695648193359375, -0.05899763107299805, -0.05729961395263672, -0.05560159683227539, -0.05390357971191406, -0.052205562591552734, -0.050507545471191406, -0.04880952835083008, -0.04711151123046875, -0.04541349411010742, -0.043715476989746094, -0.042017459869384766, -0.04031944274902344, -0.03862142562866211, -0.03692340850830078, -0.03522539138793945, -0.033527374267578125, -0.0318293571472168, -0.03013134002685547, -0.02843332290649414, -0.026735305786132812, -0.025037288665771484, -0.023339271545410156, -0.021641254425048828, -0.0199432373046875, -0.018245220184326172, -0.016547203063964844, -0.014849185943603516, -0.013151168823242188, -0.01145315170288086, -0.009755134582519531, -0.008057117462158203, -0.006359100341796875, -0.004661083221435547, -0.0029630661010742188, -0.0012650489807128906, 0.0004329681396484375, 0.0021309852600097656, 0.0038290023803710938, 0.005527019500732422, 0.00722503662109375, 0.008923053741455078, 0.010621070861816406, 0.012319087982177734, 0.014017105102539062, 0.01571512222290039, 0.01741313934326172, 0.019111156463623047, 0.020809173583984375, 0.022507190704345703, 0.02420520782470703, 0.02590322494506836, 0.027601242065429688, 0.029299259185791016, 0.030997276306152344, 0.03269529342651367, 0.034393310546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 5.0, 8.0, 4.0, 8.0, 8.0, 17.0, 15.0, 23.0, 31.0, 51.0, 48.0, 99.0, 136.0, 243.0, 359.0, 632.0, 1080.0, 2190.0, 5140.0, 14042.0, 43431.0, 147221.0, 383164.0, 305309.0, 97863.0, 29403.0, 9851.0, 3965.0, 1800.0, 953.0, 542.0, 323.0, 210.0, 107.0, 81.0, 63.0, 42.0, 25.0, 19.0, 17.0, 6.0, 12.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.055389404296875, -0.05375242233276367, -0.052115440368652344, -0.050478458404541016, -0.04884147644042969, -0.04720449447631836, -0.04556751251220703, -0.0439305305480957, -0.042293548583984375, -0.04065656661987305, -0.03901958465576172, -0.03738260269165039, -0.03574562072753906, -0.034108638763427734, -0.032471656799316406, -0.030834674835205078, -0.02919769287109375, -0.027560710906982422, -0.025923728942871094, -0.024286746978759766, -0.022649765014648438, -0.02101278305053711, -0.01937580108642578, -0.017738819122314453, -0.016101837158203125, -0.014464855194091797, -0.012827873229980469, -0.01119089126586914, -0.009553909301757812, -0.007916927337646484, -0.006279945373535156, -0.004642963409423828, -0.0030059814453125, -0.0013689994812011719, 0.00026798248291015625, 0.0019049644470214844, 0.0035419464111328125, 0.005178928375244141, 0.006815910339355469, 0.008452892303466797, 0.010089874267578125, 0.011726856231689453, 0.013363838195800781, 0.01500082015991211, 0.016637802124023438, 0.018274784088134766, 0.019911766052246094, 0.021548748016357422, 0.02318572998046875, 0.024822711944580078, 0.026459693908691406, 0.028096675872802734, 0.029733657836914062, 0.03137063980102539, 0.03300762176513672, 0.03464460372924805, 0.036281585693359375, 0.0379185676574707, 0.03955554962158203, 0.04119253158569336, 0.04282951354980469, 0.044466495513916016, 0.046103477478027344, 0.04774045944213867, 0.04937744140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 10.0, 5.0, 6.0, 13.0, 7.0, 16.0, 23.0, 18.0, 24.0, 25.0, 26.0, 25.0, 30.0, 33.0, 43.0, 36.0, 40.0, 44.0, 61.0, 44.0, 43.0, 30.0, 53.0, 42.0, 34.0, 33.0, 37.0, 29.0, 29.0, 17.0, 22.0, 21.0, 18.0, 16.0, 14.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09130859375, -0.08868694305419922, -0.08606529235839844, -0.08344364166259766, -0.08082199096679688, -0.0782003402709961, -0.07557868957519531, -0.07295703887939453, -0.07033538818359375, -0.06771373748779297, -0.06509208679199219, -0.062470436096191406, -0.059848785400390625, -0.057227134704589844, -0.05460548400878906, -0.05198383331298828, -0.0493621826171875, -0.04674053192138672, -0.04411888122558594, -0.041497230529785156, -0.038875579833984375, -0.036253929138183594, -0.03363227844238281, -0.03101062774658203, -0.02838897705078125, -0.02576732635498047, -0.023145675659179688, -0.020524024963378906, -0.017902374267578125, -0.015280723571777344, -0.012659072875976562, -0.010037422180175781, -0.007415771484375, -0.004794120788574219, -0.0021724700927734375, 0.00044918060302734375, 0.003070831298828125, 0.005692481994628906, 0.008314132690429688, 0.010935783386230469, 0.01355743408203125, 0.01617908477783203, 0.018800735473632812, 0.021422386169433594, 0.024044036865234375, 0.026665687561035156, 0.029287338256835938, 0.03190898895263672, 0.0345306396484375, 0.03715229034423828, 0.03977394104003906, 0.042395591735839844, 0.045017242431640625, 0.047638893127441406, 0.05026054382324219, 0.05288219451904297, 0.05550384521484375, 0.05812549591064453, 0.06074714660644531, 0.0633687973022461, 0.06599044799804688, 0.06861209869384766, 0.07123374938964844, 0.07385540008544922, 0.07647705078125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 2.0, 5.0, 7.0, 14.0, 16.0, 28.0, 37.0, 66.0, 120.0, 173.0, 288.0, 551.0, 1062.0, 2029.0, 4805.0, 13143.0, 47339.0, 191892.0, 441218.0, 252649.0, 64823.0, 17269.0, 5861.0, 2457.0, 1214.0, 621.0, 344.0, 196.0, 108.0, 75.0, 48.0, 34.0, 15.0, 15.0, 13.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.039794921875, -0.03881502151489258, -0.037835121154785156, -0.036855220794677734, -0.03587532043457031, -0.03489542007446289, -0.03391551971435547, -0.03293561935424805, -0.031955718994140625, -0.030975818634033203, -0.02999591827392578, -0.02901601791381836, -0.028036117553710938, -0.027056217193603516, -0.026076316833496094, -0.025096416473388672, -0.02411651611328125, -0.023136615753173828, -0.022156715393066406, -0.021176815032958984, -0.020196914672851562, -0.01921701431274414, -0.01823711395263672, -0.017257213592529297, -0.016277313232421875, -0.015297412872314453, -0.014317512512207031, -0.01333761215209961, -0.012357711791992188, -0.011377811431884766, -0.010397911071777344, -0.009418010711669922, -0.0084381103515625, -0.007458209991455078, -0.006478309631347656, -0.005498409271240234, -0.0045185089111328125, -0.0035386085510253906, -0.0025587081909179688, -0.0015788078308105469, -0.000598907470703125, 0.0003809928894042969, 0.0013608932495117188, 0.0023407936096191406, 0.0033206939697265625, 0.004300594329833984, 0.005280494689941406, 0.006260395050048828, 0.00724029541015625, 0.008220195770263672, 0.009200096130371094, 0.010179996490478516, 0.011159896850585938, 0.01213979721069336, 0.013119697570800781, 0.014099597930908203, 0.015079498291015625, 0.016059398651123047, 0.01703929901123047, 0.01801919937133789, 0.018999099731445312, 0.019979000091552734, 0.020958900451660156, 0.021938800811767578, 0.022918701171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 5.0, 6.0, 12.0, 20.0, 15.0, 22.0, 23.0, 38.0, 39.0, 59.0, 76.0, 98.0, 74.0, 86.0, 84.0, 67.0, 64.0, 49.0, 34.0, 28.0, 21.0, 14.0, 12.0, 23.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.897615432739258e-05, -7.617473602294922e-05, -7.337331771850586e-05, -7.05718994140625e-05, -6.777048110961914e-05, -6.496906280517578e-05, -6.216764450073242e-05, -5.936622619628906e-05, -5.65648078918457e-05, -5.3763389587402344e-05, -5.0961971282958984e-05, -4.8160552978515625e-05, -4.5359134674072266e-05, -4.2557716369628906e-05, -3.975629806518555e-05, -3.695487976074219e-05, -3.415346145629883e-05, -3.135204315185547e-05, -2.855062484741211e-05, -2.574920654296875e-05, -2.294778823852539e-05, -2.014636993408203e-05, -1.7344951629638672e-05, -1.4543533325195312e-05, -1.1742115020751953e-05, -8.940696716308594e-06, -6.139278411865234e-06, -3.337860107421875e-06, -5.364418029785156e-07, 2.2649765014648438e-06, 5.066394805908203e-06, 7.867813110351562e-06, 1.0669231414794922e-05, 1.3470649719238281e-05, 1.627206802368164e-05, 1.9073486328125e-05, 2.187490463256836e-05, 2.467632293701172e-05, 2.7477741241455078e-05, 3.0279159545898438e-05, 3.30805778503418e-05, 3.5881996154785156e-05, 3.8683414459228516e-05, 4.1484832763671875e-05, 4.4286251068115234e-05, 4.7087669372558594e-05, 4.988908767700195e-05, 5.269050598144531e-05, 5.549192428588867e-05, 5.829334259033203e-05, 6.109476089477539e-05, 6.389617919921875e-05, 6.669759750366211e-05, 6.949901580810547e-05, 7.230043411254883e-05, 7.510185241699219e-05, 7.790327072143555e-05, 8.07046890258789e-05, 8.350610733032227e-05, 8.630752563476562e-05, 8.910894393920898e-05, 9.191036224365234e-05, 9.47117805480957e-05, 9.751319885253906e-05, 0.00010031461715698242]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 13.0, 13.0, 19.0, 27.0, 50.0, 53.0, 123.0, 172.0, 301.0, 548.0, 1027.0, 2038.0, 5180.0, 16061.0, 65842.0, 282658.0, 458139.0, 163236.0, 36260.0, 9903.0, 3517.0, 1514.0, 786.0, 421.0, 247.0, 148.0, 85.0, 63.0, 40.0, 28.0, 15.0, 8.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.029327392578125, -0.02825307846069336, -0.02717876434326172, -0.026104450225830078, -0.025030136108398438, -0.023955821990966797, -0.022881507873535156, -0.021807193756103516, -0.020732879638671875, -0.019658565521240234, -0.018584251403808594, -0.017509937286376953, -0.016435623168945312, -0.015361309051513672, -0.014286994934082031, -0.01321268081665039, -0.01213836669921875, -0.01106405258178711, -0.009989738464355469, -0.008915424346923828, -0.007841110229492188, -0.006766796112060547, -0.005692481994628906, -0.004618167877197266, -0.003543853759765625, -0.0024695396423339844, -0.0013952255249023438, -0.0003209114074707031, 0.0007534027099609375, 0.0018277168273925781, 0.0029020309448242188, 0.003976345062255859, 0.0050506591796875, 0.006124973297119141, 0.007199287414550781, 0.008273601531982422, 0.009347915649414062, 0.010422229766845703, 0.011496543884277344, 0.012570858001708984, 0.013645172119140625, 0.014719486236572266, 0.015793800354003906, 0.016868114471435547, 0.017942428588867188, 0.019016742706298828, 0.02009105682373047, 0.02116537094116211, 0.02223968505859375, 0.02331399917602539, 0.02438831329345703, 0.025462627410888672, 0.026536941528320312, 0.027611255645751953, 0.028685569763183594, 0.029759883880615234, 0.030834197998046875, 0.031908512115478516, 0.032982826232910156, 0.0340571403503418, 0.03513145446777344, 0.03620576858520508, 0.03728008270263672, 0.03835439682006836, 0.0394287109375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 11.0, 3.0, 10.0, 25.0, 38.0, 49.0, 72.0, 105.0, 109.0, 119.0, 99.0, 93.0, 64.0, 61.0, 41.0, 34.0, 14.0, 19.0, 3.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0428466796875, -0.04152870178222656, -0.040210723876953125, -0.03889274597167969, -0.03757476806640625, -0.03625679016113281, -0.034938812255859375, -0.03362083435058594, -0.0323028564453125, -0.030984878540039062, -0.029666900634765625, -0.028348922729492188, -0.02703094482421875, -0.025712966918945312, -0.024394989013671875, -0.023077011108398438, -0.021759033203125, -0.020441055297851562, -0.019123077392578125, -0.017805099487304688, -0.01648712158203125, -0.015169143676757812, -0.013851165771484375, -0.012533187866210938, -0.0112152099609375, -0.009897232055664062, -0.008579254150390625, -0.0072612762451171875, -0.00594329833984375, -0.0046253204345703125, -0.003307342529296875, -0.0019893646240234375, -0.00067138671875, 0.0006465911865234375, 0.001964569091796875, 0.0032825469970703125, 0.00460052490234375, 0.0059185028076171875, 0.007236480712890625, 0.008554458618164062, 0.0098724365234375, 0.011190414428710938, 0.012508392333984375, 0.013826370239257812, 0.01514434814453125, 0.016462326049804688, 0.017780303955078125, 0.019098281860351562, 0.020416259765625, 0.021734237670898438, 0.023052215576171875, 0.024370193481445312, 0.02568817138671875, 0.027006149291992188, 0.028324127197265625, 0.029642105102539062, 0.0309600830078125, 0.03227806091308594, 0.033596038818359375, 0.03491401672363281, 0.03623199462890625, 0.03754997253417969, 0.038867950439453125, 0.04018592834472656, 0.04150390625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 29.0, 161.0, 425.0, 299.0, 71.0, 15.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.5728797912597656, -2.524954080581665, -2.4770283699035645, -2.429102897644043, -2.3811771869659424, -2.333251476287842, -2.285325765609741, -2.2374000549316406, -2.189474582672119, -2.1415488719940186, -2.093623161315918, -2.0456976890563965, -1.997771978378296, -1.9498462677001953, -1.9019205570220947, -1.8539948463439941, -1.8060691356658936, -1.758143424987793, -1.710217833518982, -1.6622921228408813, -1.6143665313720703, -1.5664408206939697, -1.5185151100158691, -1.4705893993377686, -1.4226638078689575, -1.374738097190857, -1.326812505722046, -1.2788867950439453, -1.2309610843658447, -1.1830354928970337, -1.135109782218933, -1.087184190750122, -1.0392584800720215, -0.9913328289985657, -0.9434071779251099, -0.8954814672470093, -0.8475558161735535, -0.7996301651000977, -0.7517044544219971, -0.7037788033485413, -0.6558530926704407, -0.6079274415969849, -0.5600017309188843, -0.5120760798454285, -0.46415042877197266, -0.41622477769851685, -0.36829909682273865, -0.32037341594696045, -0.27244776487350464, -0.22452209889888763, -0.17659643292427063, -0.12867076694965363, -0.08074510097503662, -0.03281943500041962, 0.015106230974197388, 0.06303191184997559, 0.1109575629234314, 0.1588832288980484, 0.2068088948726654, 0.2547345757484436, 0.3026602268218994, 0.3505858778953552, 0.3985115587711334, 0.4464372396469116, 0.49436289072036743]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 5.0, 12.0, 20.0, 22.0, 19.0, 23.0, 26.0, 24.0, 34.0, 41.0, 57.0, 47.0, 41.0, 44.0, 41.0, 40.0, 44.0, 44.0, 38.0, 39.0, 36.0, 36.0, 31.0, 28.0, 30.0, 23.0, 21.0, 19.0, 12.0, 15.0, 14.0, 11.0, 11.0, 5.0, 9.0, 4.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4259144067764282, -0.411609411239624, -0.3973044455051422, -0.382999449968338, -0.3686944842338562, -0.354389488697052, -0.3400845229625702, -0.325779527425766, -0.3114745616912842, -0.29716956615448, -0.28286460041999817, -0.26855960488319397, -0.25425463914871216, -0.23994964361190796, -0.22564467787742615, -0.21133968234062195, -0.19703470170497894, -0.18272972106933594, -0.16842474043369293, -0.15411975979804993, -0.13981477916240692, -0.12550979852676392, -0.11120481044054031, -0.09689982980489731, -0.0825948491692543, -0.0682898685336113, -0.05398488789796829, -0.03967990353703499, -0.025374922901391983, -0.01106993854045868, 0.003235042095184326, 0.01754002273082733, 0.03184500336647034, 0.04614998400211334, 0.06045496463775635, 0.07475994527339935, 0.08906492590904236, 0.10336991399526596, 0.11767489463090897, 0.13197988271713257, 0.14628484845161438, 0.16058982908725739, 0.1748948097229004, 0.1891997903585434, 0.2035047709941864, 0.2178097665309906, 0.2321147322654724, 0.2464197278022766, 0.2607247233390808, 0.275029718875885, 0.2893346846103668, 0.303639680147171, 0.31794464588165283, 0.33224964141845703, 0.34655460715293884, 0.36085960268974304, 0.37516456842422485, 0.38946956396102905, 0.40377452969551086, 0.41807952523231506, 0.4323844909667969, 0.4466894865036011, 0.4609944522380829, 0.4752994477748871, 0.4896044135093689]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 9.0, 23.0, 30.0, 34.0, 60.0, 122.0, 168.0, 375.0, 821.0, 2130.0, 7893.0, 81477.0, 3946574.0, 139948.0, 10167.0, 2510.0, 961.0, 437.0, 206.0, 115.0, 79.0, 40.0, 28.0, 22.0, 16.0, 6.0, 6.0, 5.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2431640625, -0.23717117309570312, -0.23117828369140625, -0.22518539428710938, -0.2191925048828125, -0.21319961547851562, -0.20720672607421875, -0.20121383666992188, -0.195220947265625, -0.18922805786132812, -0.18323516845703125, -0.17724227905273438, -0.1712493896484375, -0.16525650024414062, -0.15926361083984375, -0.15327072143554688, -0.14727783203125, -0.14128494262695312, -0.13529205322265625, -0.12929916381835938, -0.1233062744140625, -0.11731338500976562, -0.11132049560546875, -0.10532760620117188, -0.099334716796875, -0.09334182739257812, -0.08734893798828125, -0.08135604858398438, -0.0753631591796875, -0.06937026977539062, -0.06337738037109375, -0.057384490966796875, -0.0513916015625, -0.045398712158203125, -0.03940582275390625, -0.033412933349609375, -0.0274200439453125, -0.021427154541015625, -0.01543426513671875, -0.009441375732421875, -0.003448486328125, 0.002544403076171875, 0.00853729248046875, 0.014530181884765625, 0.0205230712890625, 0.026515960693359375, 0.03250885009765625, 0.038501739501953125, 0.04449462890625, 0.050487518310546875, 0.05648040771484375, 0.062473297119140625, 0.0684661865234375, 0.07445907592773438, 0.08045196533203125, 0.08644485473632812, 0.092437744140625, 0.09843063354492188, 0.10442352294921875, 0.11041641235351562, 0.1164093017578125, 0.12240219116210938, 0.12839508056640625, 0.13438796997070312, 0.140380859375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 23.0, 30.0, 36.0, 53.0, 65.0, 76.0, 90.0, 99.0, 100.0, 68.0, 89.0, 63.0, 70.0, 36.0, 25.0, 29.0, 14.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.057586669921875, -0.056115150451660156, -0.05464363098144531, -0.05317211151123047, -0.051700592041015625, -0.05022907257080078, -0.04875755310058594, -0.047286033630371094, -0.04581451416015625, -0.044342994689941406, -0.04287147521972656, -0.04139995574951172, -0.039928436279296875, -0.03845691680908203, -0.03698539733886719, -0.035513877868652344, -0.0340423583984375, -0.032570838928222656, -0.031099319458007812, -0.02962779998779297, -0.028156280517578125, -0.02668476104736328, -0.025213241577148438, -0.023741722106933594, -0.02227020263671875, -0.020798683166503906, -0.019327163696289062, -0.01785564422607422, -0.016384124755859375, -0.014912605285644531, -0.013441085815429688, -0.011969566345214844, -0.010498046875, -0.009026527404785156, -0.0075550079345703125, -0.006083488464355469, -0.004611968994140625, -0.0031404495239257812, -0.0016689300537109375, -0.00019741058349609375, 0.00127410888671875, 0.0027456283569335938, 0.0042171478271484375, 0.005688667297363281, 0.007160186767578125, 0.008631706237792969, 0.010103225708007812, 0.011574745178222656, 0.0130462646484375, 0.014517784118652344, 0.015989303588867188, 0.01746082305908203, 0.018932342529296875, 0.02040386199951172, 0.021875381469726562, 0.023346900939941406, 0.02481842041015625, 0.026289939880371094, 0.027761459350585938, 0.02923297882080078, 0.030704498291015625, 0.03217601776123047, 0.03364753723144531, 0.035119056701660156, 0.036590576171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 8.0, 10.0, 16.0, 26.0, 26.0, 41.0, 67.0, 83.0, 162.0, 280.0, 759.0, 2258.0, 8799.0, 49460.0, 706575.0, 3233116.0, 165638.0, 20494.0, 4284.0, 1202.0, 475.0, 210.0, 103.0, 67.0, 42.0, 26.0, 26.0, 5.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.12359619140625, -0.12060070037841797, -0.11760520935058594, -0.1146097183227539, -0.11161422729492188, -0.10861873626708984, -0.10562324523925781, -0.10262775421142578, -0.09963226318359375, -0.09663677215576172, -0.09364128112792969, -0.09064579010009766, -0.08765029907226562, -0.0846548080444336, -0.08165931701660156, -0.07866382598876953, -0.0756683349609375, -0.07267284393310547, -0.06967735290527344, -0.0666818618774414, -0.06368637084960938, -0.060690879821777344, -0.05769538879394531, -0.05469989776611328, -0.05170440673828125, -0.04870891571044922, -0.04571342468261719, -0.042717933654785156, -0.039722442626953125, -0.036726951599121094, -0.03373146057128906, -0.03073596954345703, -0.027740478515625, -0.02474498748779297, -0.021749496459960938, -0.018754005432128906, -0.015758514404296875, -0.012763023376464844, -0.009767532348632812, -0.006772041320800781, -0.00377655029296875, -0.0007810592651367188, 0.0022144317626953125, 0.005209922790527344, 0.008205413818359375, 0.011200904846191406, 0.014196395874023438, 0.01719188690185547, 0.0201873779296875, 0.02318286895751953, 0.026178359985351562, 0.029173851013183594, 0.032169342041015625, 0.035164833068847656, 0.03816032409667969, 0.04115581512451172, 0.04415130615234375, 0.04714679718017578, 0.05014228820800781, 0.053137779235839844, 0.056133270263671875, 0.059128761291503906, 0.06212425231933594, 0.06511974334716797, 0.068115234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 4.0, 9.0, 6.0, 17.0, 19.0, 36.0, 63.0, 120.0, 209.0, 526.0, 1238.0, 944.0, 430.0, 176.0, 114.0, 63.0, 34.0, 23.0, 14.0, 13.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.06507062911987305, -0.0635519027709961, -0.06203317642211914, -0.06051445007324219, -0.058995723724365234, -0.05747699737548828, -0.05595827102661133, -0.054439544677734375, -0.05292081832885742, -0.05140209197998047, -0.049883365631103516, -0.04836463928222656, -0.04684591293334961, -0.045327186584472656, -0.0438084602355957, -0.04228973388671875, -0.0407710075378418, -0.039252281188964844, -0.03773355484008789, -0.03621482849121094, -0.034696102142333984, -0.03317737579345703, -0.03165864944458008, -0.030139923095703125, -0.028621196746826172, -0.02710247039794922, -0.025583744049072266, -0.024065017700195312, -0.02254629135131836, -0.021027565002441406, -0.019508838653564453, -0.0179901123046875, -0.016471385955810547, -0.014952659606933594, -0.01343393325805664, -0.011915206909179688, -0.010396480560302734, -0.008877754211425781, -0.007359027862548828, -0.005840301513671875, -0.004321575164794922, -0.0028028488159179688, -0.0012841224670410156, 0.0002346038818359375, 0.0017533302307128906, 0.0032720565795898438, 0.004790782928466797, 0.00630950927734375, 0.007828235626220703, 0.009346961975097656, 0.01086568832397461, 0.012384414672851562, 0.013903141021728516, 0.015421867370605469, 0.016940593719482422, 0.018459320068359375, 0.019978046417236328, 0.02149677276611328, 0.023015499114990234, 0.024534225463867188, 0.02605295181274414, 0.027571678161621094, 0.029090404510498047, 0.030609130859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 6.0, 26.0, 77.0, 264.0, 357.0, 201.0, 56.0, 14.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13470131158828735, -0.11596983671188354, -0.09723836183547974, -0.07850688695907593, -0.05977541208267212, -0.04104393720626831, -0.022312462329864502, -0.0035809874534606934, 0.015150487422943115, 0.033881962299346924, 0.05261343717575073, 0.07134491205215454, 0.09007638692855835, 0.10880786180496216, 0.12753933668136597, 0.14627081155776978, 0.16500228643417358, 0.1837337613105774, 0.2024652361869812, 0.221196711063385, 0.23992818593978882, 0.2586596608161926, 0.27739113569259644, 0.29612261056900024, 0.31485408544540405, 0.33358556032180786, 0.35231703519821167, 0.3710485100746155, 0.3897799849510193, 0.4085114598274231, 0.4272429347038269, 0.4459744095802307, 0.46470582485198975, 0.48343729972839355, 0.5021687746047974, 0.5209002494812012, 0.539631724357605, 0.5583631992340088, 0.5770946741104126, 0.5958261489868164, 0.6145576238632202, 0.633289098739624, 0.6520205736160278, 0.6707520484924316, 0.6894835233688354, 0.7082149982452393, 0.7269464731216431, 0.7456779479980469, 0.7644094228744507, 0.7831408977508545, 0.8018723726272583, 0.8206038475036621, 0.8393353223800659, 0.8580667972564697, 0.8767982721328735, 0.8955297470092773, 0.9142612218856812, 0.932992696762085, 0.9517241716384888, 0.9704556465148926, 0.9891871213912964, 1.0079185962677002, 1.026650071144104, 1.0453815460205078, 1.0641130208969116]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 11.0, 14.0, 11.0, 19.0, 14.0, 20.0, 25.0, 24.0, 31.0, 37.0, 50.0, 47.0, 55.0, 44.0, 37.0, 39.0, 37.0, 46.0, 41.0, 44.0, 40.0, 41.0, 46.0, 31.0, 34.0, 29.0, 18.0, 20.0, 15.0, 20.0, 10.0, 7.0, 11.0, 9.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.13771313428878784, -0.13361859321594238, -0.12952403724193573, -0.12542949616909027, -0.12133495509624481, -0.11724040657281876, -0.1131458580493927, -0.10905131697654724, -0.10495676845312119, -0.10086221992969513, -0.09676767885684967, -0.09267313033342361, -0.08857858180999756, -0.0844840407371521, -0.08038949221372604, -0.07629494369029999, -0.07220040261745453, -0.06810585409402847, -0.06401131302118301, -0.05991676449775696, -0.0558222196996212, -0.05172767490148544, -0.04763312637805939, -0.04353858157992363, -0.03944403678178787, -0.035349491983652115, -0.03125494718551636, -0.0271603986620903, -0.023065853863954544, -0.018971309065818787, -0.01487676240503788, -0.010782215744256973, -0.006687670946121216, -0.0025931252166628838, 0.0015014205127954483, 0.00559596624225378, 0.009690511971712112, 0.01378505676984787, 0.017879603430628777, 0.021974150091409683, 0.02606869488954544, 0.030163239687681198, 0.034257784485816956, 0.03835233300924301, 0.04244687780737877, 0.046541422605514526, 0.05063597112894058, 0.05473051592707634, 0.0588250607252121, 0.06291960924863815, 0.06701415032148361, 0.07110869884490967, 0.07520323991775513, 0.07929778844118118, 0.08339233696460724, 0.0874868780374527, 0.09158142656087875, 0.09567597508430481, 0.09977051615715027, 0.10386506468057632, 0.10795961320400238, 0.11205415427684784, 0.1161487028002739, 0.12024325132369995, 0.12433779239654541]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 7.0, 5.0, 4.0, 11.0, 16.0, 23.0, 25.0, 37.0, 71.0, 102.0, 201.0, 369.0, 787.0, 1805.0, 5005.0, 20593.0, 171995.0, 700463.0, 123168.0, 16574.0, 4131.0, 1622.0, 729.0, 359.0, 183.0, 96.0, 53.0, 41.0, 25.0, 11.0, 14.0, 12.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134765625, -0.13073444366455078, -0.12670326232910156, -0.12267208099365234, -0.11864089965820312, -0.1146097183227539, -0.11057853698730469, -0.10654735565185547, -0.10251617431640625, -0.09848499298095703, -0.09445381164550781, -0.0904226303100586, -0.08639144897460938, -0.08236026763916016, -0.07832908630371094, -0.07429790496826172, -0.0702667236328125, -0.06623554229736328, -0.06220436096191406, -0.058173179626464844, -0.054141998291015625, -0.050110816955566406, -0.04607963562011719, -0.04204845428466797, -0.03801727294921875, -0.03398609161376953, -0.029954910278320312, -0.025923728942871094, -0.021892547607421875, -0.017861366271972656, -0.013830184936523438, -0.009799003601074219, -0.005767822265625, -0.0017366409301757812, 0.0022945404052734375, 0.006325721740722656, 0.010356903076171875, 0.014388084411621094, 0.018419265747070312, 0.02245044708251953, 0.02648162841796875, 0.03051280975341797, 0.03454399108886719, 0.038575172424316406, 0.042606353759765625, 0.046637535095214844, 0.05066871643066406, 0.05469989776611328, 0.0587310791015625, 0.06276226043701172, 0.06679344177246094, 0.07082462310791016, 0.07485580444335938, 0.0788869857788086, 0.08291816711425781, 0.08694934844970703, 0.09098052978515625, 0.09501171112060547, 0.09904289245605469, 0.1030740737915039, 0.10710525512695312, 0.11113643646240234, 0.11516761779785156, 0.11919879913330078, 0.12322998046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 8.0, 9.0, 14.0, 37.0, 39.0, 37.0, 62.0, 72.0, 67.0, 95.0, 76.0, 96.0, 72.0, 68.0, 58.0, 58.0, 36.0, 25.0, 17.0, 15.0, 13.0, 9.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.04998779296875, -0.048662662506103516, -0.04733753204345703, -0.04601240158081055, -0.04468727111816406, -0.04336214065551758, -0.042037010192871094, -0.04071187973022461, -0.039386749267578125, -0.03806161880493164, -0.036736488342285156, -0.03541135787963867, -0.03408622741699219, -0.0327610969543457, -0.03143596649169922, -0.030110836029052734, -0.02878570556640625, -0.027460575103759766, -0.02613544464111328, -0.024810314178466797, -0.023485183715820312, -0.022160053253173828, -0.020834922790527344, -0.01950979232788086, -0.018184661865234375, -0.01685953140258789, -0.015534400939941406, -0.014209270477294922, -0.012884140014648438, -0.011559009552001953, -0.010233879089355469, -0.008908748626708984, -0.0075836181640625, -0.006258487701416016, -0.004933357238769531, -0.003608226776123047, -0.0022830963134765625, -0.0009579658508300781, 0.00036716461181640625, 0.0016922950744628906, 0.003017425537109375, 0.004342555999755859, 0.005667686462402344, 0.006992816925048828, 0.008317947387695312, 0.009643077850341797, 0.010968208312988281, 0.012293338775634766, 0.01361846923828125, 0.014943599700927734, 0.01626873016357422, 0.017593860626220703, 0.018918991088867188, 0.020244121551513672, 0.021569252014160156, 0.02289438247680664, 0.024219512939453125, 0.02554464340209961, 0.026869773864746094, 0.028194904327392578, 0.029520034790039062, 0.030845165252685547, 0.03217029571533203, 0.033495426177978516, 0.034820556640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 9.0, 13.0, 14.0, 24.0, 25.0, 33.0, 53.0, 82.0, 102.0, 142.0, 241.0, 405.0, 671.0, 1436.0, 3293.0, 8951.0, 32126.0, 145074.0, 485660.0, 283576.0, 62003.0, 15032.0, 5035.0, 2073.0, 1004.0, 507.0, 319.0, 186.0, 142.0, 78.0, 60.0, 53.0, 34.0, 21.0, 20.0, 13.0, 8.0, 6.0, 3.0, 5.0, 8.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.059051513671875, -0.0571293830871582, -0.055207252502441406, -0.05328512191772461, -0.05136299133300781, -0.049440860748291016, -0.04751873016357422, -0.04559659957885742, -0.043674468994140625, -0.04175233840942383, -0.03983020782470703, -0.037908077239990234, -0.03598594665527344, -0.03406381607055664, -0.032141685485839844, -0.030219554901123047, -0.02829742431640625, -0.026375293731689453, -0.024453163146972656, -0.02253103256225586, -0.020608901977539062, -0.018686771392822266, -0.01676464080810547, -0.014842510223388672, -0.012920379638671875, -0.010998249053955078, -0.009076118469238281, -0.007153987884521484, -0.0052318572998046875, -0.0033097267150878906, -0.0013875961303710938, 0.0005345344543457031, 0.0024566650390625, 0.004378795623779297, 0.006300926208496094, 0.00822305679321289, 0.010145187377929688, 0.012067317962646484, 0.013989448547363281, 0.015911579132080078, 0.017833709716796875, 0.019755840301513672, 0.02167797088623047, 0.023600101470947266, 0.025522232055664062, 0.02744436264038086, 0.029366493225097656, 0.03128862380981445, 0.03321075439453125, 0.03513288497924805, 0.037055015563964844, 0.03897714614868164, 0.04089927673339844, 0.042821407318115234, 0.04474353790283203, 0.04666566848754883, 0.048587799072265625, 0.05050992965698242, 0.05243206024169922, 0.054354190826416016, 0.05627632141113281, 0.05819845199584961, 0.060120582580566406, 0.0620427131652832, 0.06396484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 8.0, 11.0, 9.0, 19.0, 12.0, 18.0, 19.0, 22.0, 26.0, 24.0, 46.0, 40.0, 38.0, 49.0, 49.0, 61.0, 57.0, 36.0, 36.0, 50.0, 38.0, 55.0, 42.0, 42.0, 16.0, 40.0, 21.0, 18.0, 14.0, 11.0, 20.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09124755859375, -0.08826637268066406, -0.08528518676757812, -0.08230400085449219, -0.07932281494140625, -0.07634162902832031, -0.07336044311523438, -0.07037925720214844, -0.0673980712890625, -0.06441688537597656, -0.061435699462890625, -0.05845451354980469, -0.05547332763671875, -0.05249214172363281, -0.049510955810546875, -0.04652976989746094, -0.043548583984375, -0.04056739807128906, -0.037586212158203125, -0.03460502624511719, -0.03162384033203125, -0.028642654418945312, -0.025661468505859375, -0.022680282592773438, -0.0196990966796875, -0.016717910766601562, -0.013736724853515625, -0.010755538940429688, -0.00777435302734375, -0.0047931671142578125, -0.001811981201171875, 0.0011692047119140625, 0.004150390625, 0.0071315765380859375, 0.010112762451171875, 0.013093948364257812, 0.01607513427734375, 0.019056320190429688, 0.022037506103515625, 0.025018692016601562, 0.0279998779296875, 0.030981063842773438, 0.033962249755859375, 0.03694343566894531, 0.03992462158203125, 0.04290580749511719, 0.045886993408203125, 0.04886817932128906, 0.051849365234375, 0.05483055114746094, 0.057811737060546875, 0.06079292297363281, 0.06377410888671875, 0.06675529479980469, 0.06973648071289062, 0.07271766662597656, 0.0756988525390625, 0.07868003845214844, 0.08166122436523438, 0.08464241027832031, 0.08762359619140625, 0.09060478210449219, 0.09358596801757812, 0.09656715393066406, 0.09954833984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 13.0, 15.0, 39.0, 73.0, 147.0, 371.0, 959.0, 3702.0, 24417.0, 307244.0, 635359.0, 66180.0, 7424.0, 1634.0, 525.0, 206.0, 100.0, 57.0, 33.0, 13.0, 12.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048431396484375, -0.04671430587768555, -0.044997215270996094, -0.04328012466430664, -0.04156303405761719, -0.039845943450927734, -0.03812885284423828, -0.03641176223754883, -0.034694671630859375, -0.03297758102416992, -0.03126049041748047, -0.029543399810791016, -0.027826309204101562, -0.02610921859741211, -0.024392127990722656, -0.022675037384033203, -0.02095794677734375, -0.019240856170654297, -0.017523765563964844, -0.01580667495727539, -0.014089584350585938, -0.012372493743896484, -0.010655403137207031, -0.008938312530517578, -0.007221221923828125, -0.005504131317138672, -0.0037870407104492188, -0.0020699501037597656, -0.0003528594970703125, 0.0013642311096191406, 0.0030813217163085938, 0.004798412322998047, 0.0065155029296875, 0.008232593536376953, 0.009949684143066406, 0.01166677474975586, 0.013383865356445312, 0.015100955963134766, 0.01681804656982422, 0.018535137176513672, 0.020252227783203125, 0.021969318389892578, 0.02368640899658203, 0.025403499603271484, 0.027120590209960938, 0.02883768081665039, 0.030554771423339844, 0.0322718620300293, 0.03398895263671875, 0.0357060432434082, 0.037423133850097656, 0.03914022445678711, 0.04085731506347656, 0.042574405670166016, 0.04429149627685547, 0.04600858688354492, 0.047725677490234375, 0.04944276809692383, 0.05115985870361328, 0.052876949310302734, 0.05459403991699219, 0.05631113052368164, 0.058028221130371094, 0.05974531173706055, 0.06146240234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 11.0, 20.0, 61.0, 130.0, 263.0, 247.0, 150.0, 70.0, 33.0, 13.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005002021789550781, -0.0004898086190223694, -0.00047941505908966064, -0.0004690214991569519, -0.00045862793922424316, -0.0004482343792915344, -0.0004378408193588257, -0.00042744725942611694, -0.0004170536994934082, -0.00040666013956069946, -0.0003962665796279907, -0.000385873019695282, -0.00037547945976257324, -0.0003650858998298645, -0.00035469233989715576, -0.000344298779964447, -0.0003339052200317383, -0.00032351166009902954, -0.0003131181001663208, -0.00030272454023361206, -0.0002923309803009033, -0.0002819374203681946, -0.00027154386043548584, -0.0002611503005027771, -0.00025075674057006836, -0.00024036318063735962, -0.00022996962070465088, -0.00021957606077194214, -0.0002091825008392334, -0.00019878894090652466, -0.00018839538097381592, -0.00017800182104110718, -0.00016760826110839844, -0.0001572147011756897, -0.00014682114124298096, -0.00013642758131027222, -0.00012603402137756348, -0.00011564046144485474, -0.000105246901512146, -9.485334157943726e-05, -8.445978164672852e-05, -7.406622171401978e-05, -6.367266178131104e-05, -5.3279101848602295e-05, -4.2885541915893555e-05, -3.2491981983184814e-05, -2.2098422050476074e-05, -1.1704862117767334e-05, -1.3113021850585938e-06, 9.082257747650146e-06, 1.9475817680358887e-05, 2.9869377613067627e-05, 4.026293754577637e-05, 5.065649747848511e-05, 6.105005741119385e-05, 7.144361734390259e-05, 8.183717727661133e-05, 9.223073720932007e-05, 0.00010262429714202881, 0.00011301785707473755, 0.0001234114170074463, 0.00013380497694015503, 0.00014419853687286377, 0.0001545920968055725, 0.00016498565673828125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 7.0, 8.0, 14.0, 15.0, 16.0, 41.0, 72.0, 129.0, 212.0, 533.0, 1209.0, 3855.0, 21994.0, 245423.0, 696288.0, 66822.0, 8453.0, 2021.0, 728.0, 349.0, 148.0, 104.0, 47.0, 37.0, 12.0, 9.0, 6.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05096435546875, -0.049094200134277344, -0.04722404479980469, -0.04535388946533203, -0.043483734130859375, -0.04161357879638672, -0.03974342346191406, -0.037873268127441406, -0.03600311279296875, -0.034132957458496094, -0.03226280212402344, -0.03039264678955078, -0.028522491455078125, -0.02665233612060547, -0.024782180786132812, -0.022912025451660156, -0.0210418701171875, -0.019171714782714844, -0.017301559448242188, -0.015431404113769531, -0.013561248779296875, -0.011691093444824219, -0.009820938110351562, -0.007950782775878906, -0.00608062744140625, -0.004210472106933594, -0.0023403167724609375, -0.00047016143798828125, 0.001399993896484375, 0.0032701492309570312, 0.0051403045654296875, 0.007010459899902344, 0.008880615234375, 0.010750770568847656, 0.012620925903320312, 0.014491081237792969, 0.016361236572265625, 0.01823139190673828, 0.020101547241210938, 0.021971702575683594, 0.02384185791015625, 0.025712013244628906, 0.027582168579101562, 0.02945232391357422, 0.031322479248046875, 0.03319263458251953, 0.03506278991699219, 0.036932945251464844, 0.0388031005859375, 0.040673255920410156, 0.04254341125488281, 0.04441356658935547, 0.046283721923828125, 0.04815387725830078, 0.05002403259277344, 0.051894187927246094, 0.05376434326171875, 0.055634498596191406, 0.05750465393066406, 0.05937480926513672, 0.061244964599609375, 0.06311511993408203, 0.06498527526855469, 0.06685543060302734, 0.0687255859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 6.0, 3.0, 18.0, 21.0, 23.0, 37.0, 61.0, 84.0, 107.0, 187.0, 166.0, 101.0, 66.0, 45.0, 19.0, 24.0, 13.0, 10.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06390380859375, -0.062165260314941406, -0.06042671203613281, -0.05868816375732422, -0.056949615478515625, -0.05521106719970703, -0.05347251892089844, -0.051733970642089844, -0.04999542236328125, -0.048256874084472656, -0.04651832580566406, -0.04477977752685547, -0.043041229248046875, -0.04130268096923828, -0.03956413269042969, -0.037825584411621094, -0.0360870361328125, -0.034348487854003906, -0.03260993957519531, -0.03087139129638672, -0.029132843017578125, -0.02739429473876953, -0.025655746459960938, -0.023917198181152344, -0.02217864990234375, -0.020440101623535156, -0.018701553344726562, -0.01696300506591797, -0.015224456787109375, -0.013485908508300781, -0.011747360229492188, -0.010008811950683594, -0.008270263671875, -0.006531715393066406, -0.0047931671142578125, -0.0030546188354492188, -0.001316070556640625, 0.00042247772216796875, 0.0021610260009765625, 0.0038995742797851562, 0.00563812255859375, 0.007376670837402344, 0.009115219116210938, 0.010853767395019531, 0.012592315673828125, 0.014330863952636719, 0.016069412231445312, 0.017807960510253906, 0.0195465087890625, 0.021285057067871094, 0.023023605346679688, 0.02476215362548828, 0.026500701904296875, 0.02823925018310547, 0.029977798461914062, 0.031716346740722656, 0.03345489501953125, 0.035193443298339844, 0.03693199157714844, 0.03867053985595703, 0.040409088134765625, 0.04214763641357422, 0.04388618469238281, 0.045624732971191406, 0.04736328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 3.0, 12.0, 26.0, 49.0, 104.0, 184.0, 211.0, 188.0, 96.0, 59.0, 22.0, 15.0, 7.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6500645875930786, -0.6305150389671326, -0.6109654307365417, -0.5914158821105957, -0.5718662738800049, -0.5523167252540588, -0.5327671766281128, -0.513217568397522, -0.4936680197715759, -0.4741184413433075, -0.45456886291503906, -0.435019314289093, -0.4154697358608246, -0.39592015743255615, -0.3763706088066101, -0.3568210303783417, -0.33727145195007324, -0.3177218735218048, -0.2981722950935364, -0.27862274646759033, -0.2590731680393219, -0.23952358961105347, -0.21997402608394623, -0.200424462556839, -0.18087488412857056, -0.16132530570030212, -0.14177574217319489, -0.12222617119550705, -0.10267660021781921, -0.08312702924013138, -0.06357745826244354, -0.044027894735336304, -0.024478375911712646, -0.004928804934024811, 0.014620766043663025, 0.03417033702135086, 0.053719907999038696, 0.07326947897672653, 0.09281904995441437, 0.1123686134815216, 0.13191819190979004, 0.15146777033805847, 0.1710173338651657, 0.19056689739227295, 0.21011647582054138, 0.22966605424880981, 0.24921561777591705, 0.2687651813030243, 0.2883147597312927, 0.30786433815956116, 0.3274139165878296, 0.34696346521377563, 0.36651304364204407, 0.3860626220703125, 0.40561217069625854, 0.425161749124527, 0.4447113275527954, 0.46426090598106384, 0.4838104844093323, 0.5033600330352783, 0.5229096412658691, 0.5424591898918152, 0.5620087385177612, 0.581558346748352, 0.6011078953742981]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 9.0, 6.0, 12.0, 13.0, 9.0, 15.0, 16.0, 19.0, 22.0, 24.0, 36.0, 31.0, 33.0, 44.0, 44.0, 44.0, 40.0, 51.0, 37.0, 44.0, 51.0, 30.0, 44.0, 37.0, 34.0, 30.0, 36.0, 23.0, 26.0, 22.0, 29.0, 12.0, 13.0, 13.0, 8.0, 11.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3823842406272888, -0.3694644272327423, -0.3565446138381958, -0.3436248004436493, -0.3307049870491028, -0.31778520345687866, -0.30486539006233215, -0.29194557666778564, -0.27902576327323914, -0.2661059498786926, -0.2531861364841461, -0.2402663379907608, -0.2273465245962143, -0.21442671120166779, -0.20150691270828247, -0.18858709931373596, -0.17566728591918945, -0.16274747252464294, -0.14982765913009644, -0.13690786063671112, -0.12398804724216461, -0.1110682338476181, -0.09814842790365219, -0.08522862195968628, -0.07230880856513977, -0.05938899889588356, -0.04646918922662735, -0.03354937955737114, -0.02062956988811493, -0.00770975649356842, 0.0052100494503974915, 0.018129855394363403, 0.031049668788909912, 0.04396947845816612, 0.05688928812742233, 0.06980909407138824, 0.08272890746593475, 0.09564872086048126, 0.10856852680444717, 0.12148833274841309, 0.1344081461429596, 0.1473279595375061, 0.1602477729320526, 0.17316757142543793, 0.18608738481998444, 0.19900719821453094, 0.21192699670791626, 0.22484681010246277, 0.23776662349700928, 0.2506864368915558, 0.2636062502861023, 0.2765260636806488, 0.2894458770751953, 0.30236566066741943, 0.31528547406196594, 0.32820528745651245, 0.34112510085105896, 0.35404491424560547, 0.366964727640152, 0.3798845410346985, 0.3928043246269226, 0.4057241678237915, 0.4186439514160156, 0.43156376481056213, 0.44448357820510864]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 12.0, 13.0, 21.0, 31.0, 57.0, 89.0, 183.0, 389.0, 1165.0, 4628.0, 52203.0, 4040173.0, 87493.0, 5616.0, 1301.0, 440.0, 199.0, 91.0, 69.0, 33.0, 22.0, 16.0, 11.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.21630859375, -0.2100505828857422, -0.20379257202148438, -0.19753456115722656, -0.19127655029296875, -0.18501853942871094, -0.17876052856445312, -0.1725025177001953, -0.1662445068359375, -0.1599864959716797, -0.15372848510742188, -0.14747047424316406, -0.14121246337890625, -0.13495445251464844, -0.12869644165039062, -0.12243843078613281, -0.116180419921875, -0.10992240905761719, -0.10366439819335938, -0.09740638732910156, -0.09114837646484375, -0.08489036560058594, -0.07863235473632812, -0.07237434387207031, -0.0661163330078125, -0.05985832214355469, -0.053600311279296875, -0.04734230041503906, -0.04108428955078125, -0.03482627868652344, -0.028568267822265625, -0.022310256958007812, -0.01605224609375, -0.009794235229492188, -0.003536224365234375, 0.0027217864990234375, 0.00897979736328125, 0.015237808227539062, 0.021495819091796875, 0.027753829956054688, 0.0340118408203125, 0.04026985168457031, 0.046527862548828125, 0.05278587341308594, 0.05904388427734375, 0.06530189514160156, 0.07155990600585938, 0.07781791687011719, 0.084075927734375, 0.09033393859863281, 0.09659194946289062, 0.10284996032714844, 0.10910797119140625, 0.11536598205566406, 0.12162399291992188, 0.1278820037841797, 0.1341400146484375, 0.1403980255126953, 0.14665603637695312, 0.15291404724121094, 0.15917205810546875, 0.16543006896972656, 0.17168807983398438, 0.1779460906982422, 0.1842041015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 16.0, 23.0, 36.0, 45.0, 62.0, 92.0, 69.0, 88.0, 87.0, 99.0, 80.0, 70.0, 61.0, 54.0, 29.0, 22.0, 22.0, 11.0, 11.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.05804443359375, -0.05657958984375, -0.05511474609375, -0.05364990234375, -0.05218505859375, -0.05072021484375, -0.04925537109375, -0.04779052734375, -0.04632568359375, -0.04486083984375, -0.04339599609375, -0.04193115234375, -0.04046630859375, -0.03900146484375, -0.03753662109375, -0.03607177734375, -0.03460693359375, -0.03314208984375, -0.03167724609375, -0.03021240234375, -0.02874755859375, -0.02728271484375, -0.02581787109375, -0.02435302734375, -0.02288818359375, -0.02142333984375, -0.01995849609375, -0.01849365234375, -0.01702880859375, -0.01556396484375, -0.01409912109375, -0.01263427734375, -0.01116943359375, -0.00970458984375, -0.00823974609375, -0.00677490234375, -0.00531005859375, -0.00384521484375, -0.00238037109375, -0.00091552734375, 0.00054931640625, 0.00201416015625, 0.00347900390625, 0.00494384765625, 0.00640869140625, 0.00787353515625, 0.00933837890625, 0.01080322265625, 0.01226806640625, 0.01373291015625, 0.01519775390625, 0.01666259765625, 0.01812744140625, 0.01959228515625, 0.02105712890625, 0.02252197265625, 0.02398681640625, 0.02545166015625, 0.02691650390625, 0.02838134765625, 0.02984619140625, 0.03131103515625, 0.03277587890625, 0.03424072265625, 0.03570556640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 6.0, 10.0, 21.0, 16.0, 38.0, 51.0, 90.0, 122.0, 213.0, 289.0, 495.0, 886.0, 1714.0, 4362.0, 15358.0, 111700.0, 3324418.0, 680357.0, 40405.0, 8074.0, 2638.0, 1226.0, 657.0, 415.0, 264.0, 150.0, 86.0, 73.0, 47.0, 35.0, 26.0, 9.0, 9.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.113037109375, -0.10996341705322266, -0.10688972473144531, -0.10381603240966797, -0.10074234008789062, -0.09766864776611328, -0.09459495544433594, -0.0915212631225586, -0.08844757080078125, -0.0853738784790039, -0.08230018615722656, -0.07922649383544922, -0.07615280151367188, -0.07307910919189453, -0.07000541687011719, -0.06693172454833984, -0.0638580322265625, -0.060784339904785156, -0.05771064758300781, -0.05463695526123047, -0.051563262939453125, -0.04848957061767578, -0.04541587829589844, -0.042342185974121094, -0.03926849365234375, -0.036194801330566406, -0.03312110900878906, -0.03004741668701172, -0.026973724365234375, -0.02390003204345703, -0.020826339721679688, -0.017752647399902344, -0.014678955078125, -0.011605262756347656, -0.008531570434570312, -0.005457878112792969, -0.002384185791015625, 0.0006895065307617188, 0.0037631988525390625, 0.006836891174316406, 0.00991058349609375, 0.012984275817871094, 0.016057968139648438, 0.01913166046142578, 0.022205352783203125, 0.02527904510498047, 0.028352737426757812, 0.031426429748535156, 0.0345001220703125, 0.037573814392089844, 0.04064750671386719, 0.04372119903564453, 0.046794891357421875, 0.04986858367919922, 0.05294227600097656, 0.056015968322753906, 0.05908966064453125, 0.062163352966308594, 0.06523704528808594, 0.06831073760986328, 0.07138442993164062, 0.07445812225341797, 0.07753181457519531, 0.08060550689697266, 0.08367919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 10.0, 12.0, 17.0, 36.0, 91.0, 199.0, 581.0, 1834.0, 760.0, 273.0, 114.0, 62.0, 31.0, 20.0, 8.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0477294921875, -0.04617166519165039, -0.04461383819580078, -0.04305601119995117, -0.04149818420410156, -0.03994035720825195, -0.038382530212402344, -0.036824703216552734, -0.035266876220703125, -0.033709049224853516, -0.032151222229003906, -0.030593395233154297, -0.029035568237304688, -0.027477741241455078, -0.02591991424560547, -0.02436208724975586, -0.02280426025390625, -0.02124643325805664, -0.01968860626220703, -0.018130779266357422, -0.016572952270507812, -0.015015125274658203, -0.013457298278808594, -0.011899471282958984, -0.010341644287109375, -0.008783817291259766, -0.007225990295410156, -0.005668163299560547, -0.0041103363037109375, -0.002552509307861328, -0.0009946823120117188, 0.0005631446838378906, 0.0021209716796875, 0.0036787986755371094, 0.005236625671386719, 0.006794452667236328, 0.008352279663085938, 0.009910106658935547, 0.011467933654785156, 0.013025760650634766, 0.014583587646484375, 0.016141414642333984, 0.017699241638183594, 0.019257068634033203, 0.020814895629882812, 0.022372722625732422, 0.02393054962158203, 0.02548837661743164, 0.02704620361328125, 0.02860403060913086, 0.03016185760498047, 0.03171968460083008, 0.03327751159667969, 0.0348353385925293, 0.036393165588378906, 0.037950992584228516, 0.039508819580078125, 0.041066646575927734, 0.042624473571777344, 0.04418230056762695, 0.04574012756347656, 0.04729795455932617, 0.04885578155517578, 0.05041360855102539, 0.051971435546875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 9.0, 8.0, 45.0, 101.0, 189.0, 244.0, 217.0, 114.0, 41.0, 18.0, 8.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16230973601341248, -0.1517733484506607, -0.14123696088790894, -0.13070055842399597, -0.1201641783118248, -0.10962779074907303, -0.09909139573574066, -0.08855500817298889, -0.07801862061023712, -0.06748223304748535, -0.05694584175944328, -0.046409450471401215, -0.035873062908649445, -0.025336675345897675, -0.014800280332565308, -0.004263892769813538, 0.006272494792938232, 0.01680888421833515, 0.02734527364373207, 0.03788166493177414, 0.04841805249452591, 0.05895444005727768, 0.06949083507061005, 0.08002722263336182, 0.09056361019611359, 0.10109999775886536, 0.11163638532161713, 0.1221727803349495, 0.13270917534828186, 0.14324554800987244, 0.1537819504737854, 0.16431833803653717, 0.17485475540161133, 0.1853911429643631, 0.19592753052711487, 0.20646393299102783, 0.2170003056526184, 0.22753670811653137, 0.23807309567928314, 0.2486094832420349, 0.2591458559036255, 0.26968225836753845, 0.28021863102912903, 0.290755033493042, 0.30129140615463257, 0.31182780861854553, 0.3223642110824585, 0.3329005837440491, 0.34343698620796204, 0.353973388671875, 0.3645097613334656, 0.37504616379737854, 0.3855825364589691, 0.3961189389228821, 0.40665531158447266, 0.4171917140483856, 0.4277281165122986, 0.43826451897621155, 0.4488008916378021, 0.4593372941017151, 0.46987366676330566, 0.48041006922721863, 0.4909464716911316, 0.5014828443527222, 0.5120192170143127]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 1.0, 3.0, 9.0, 7.0, 9.0, 22.0, 24.0, 24.0, 30.0, 36.0, 47.0, 49.0, 45.0, 53.0, 51.0, 61.0, 63.0, 52.0, 75.0, 61.0, 37.0, 55.0, 25.0, 36.0, 36.0, 18.0, 15.0, 15.0, 10.0, 6.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1082226037979126, -0.10425594449043274, -0.10028928518295288, -0.09632262587547302, -0.09235596656799316, -0.0883893072605133, -0.08442264050245285, -0.08045598119497299, -0.07648932188749313, -0.07252266258001328, -0.06855600327253342, -0.06458934396505356, -0.0606226809322834, -0.05665602162480354, -0.052689358592033386, -0.04872269928455353, -0.04475603997707367, -0.04078938066959381, -0.03682272136211395, -0.032856058329343796, -0.028889399021863937, -0.02492273971438408, -0.02095607854425907, -0.016989417374134064, -0.013022758066654205, -0.009056097827851772, -0.005089437589049339, -0.0011227773502469063, 0.0028438828885555267, 0.006810542196035385, 0.010777203366160393, 0.0147438645362854, 0.01871052384376526, 0.022677183151245117, 0.026643844321370125, 0.030610505491495132, 0.03457716479897499, 0.03854382410645485, 0.042510487139225006, 0.046477146446704865, 0.05044380575418472, 0.05441046506166458, 0.05837712436914444, 0.0623437874019146, 0.06631045043468475, 0.07027710974216461, 0.07424376904964447, 0.07821042835712433, 0.08217708766460419, 0.08614374697208405, 0.0901104062795639, 0.09407706558704376, 0.09804372489452362, 0.10201038420200348, 0.10597705096006393, 0.10994371026754379, 0.11391036957502365, 0.11787702888250351, 0.12184368818998337, 0.12581035494804382, 0.12977701425552368, 0.13374367356300354, 0.1377103328704834, 0.14167699217796326, 0.14564365148544312]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 11.0, 16.0, 34.0, 52.0, 82.0, 167.0, 364.0, 905.0, 2891.0, 14321.0, 154084.0, 733303.0, 125721.0, 12440.0, 2619.0, 804.0, 369.0, 145.0, 92.0, 62.0, 32.0, 8.0, 9.0, 8.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1265869140625, -0.12268733978271484, -0.11878776550292969, -0.11488819122314453, -0.11098861694335938, -0.10708904266357422, -0.10318946838378906, -0.0992898941040039, -0.09539031982421875, -0.0914907455444336, -0.08759117126464844, -0.08369159698486328, -0.07979202270507812, -0.07589244842529297, -0.07199287414550781, -0.06809329986572266, -0.0641937255859375, -0.060294151306152344, -0.05639457702636719, -0.05249500274658203, -0.048595428466796875, -0.04469585418701172, -0.04079627990722656, -0.036896705627441406, -0.03299713134765625, -0.029097557067871094, -0.025197982788085938, -0.02129840850830078, -0.017398834228515625, -0.013499259948730469, -0.009599685668945312, -0.005700111389160156, -0.001800537109375, 0.0020990371704101562, 0.0059986114501953125, 0.009898185729980469, 0.013797760009765625, 0.01769733428955078, 0.021596908569335938, 0.025496482849121094, 0.02939605712890625, 0.033295631408691406, 0.03719520568847656, 0.04109477996826172, 0.044994354248046875, 0.04889392852783203, 0.05279350280761719, 0.056693077087402344, 0.0605926513671875, 0.06449222564697266, 0.06839179992675781, 0.07229137420654297, 0.07619094848632812, 0.08009052276611328, 0.08399009704589844, 0.0878896713256836, 0.09178924560546875, 0.0956888198852539, 0.09958839416503906, 0.10348796844482422, 0.10738754272460938, 0.11128711700439453, 0.11518669128417969, 0.11908626556396484, 0.12298583984375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 5.0, 9.0, 13.0, 22.0, 34.0, 37.0, 57.0, 61.0, 97.0, 67.0, 107.0, 92.0, 95.0, 68.0, 57.0, 49.0, 43.0, 25.0, 22.0, 14.0, 7.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.057159423828125, -0.05572700500488281, -0.054294586181640625, -0.05286216735839844, -0.05142974853515625, -0.04999732971191406, -0.048564910888671875, -0.04713249206542969, -0.0457000732421875, -0.04426765441894531, -0.042835235595703125, -0.04140281677246094, -0.03997039794921875, -0.03853797912597656, -0.037105560302734375, -0.03567314147949219, -0.03424072265625, -0.03280830383300781, -0.031375885009765625, -0.029943466186523438, -0.02851104736328125, -0.027078628540039062, -0.025646209716796875, -0.024213790893554688, -0.0227813720703125, -0.021348953247070312, -0.019916534423828125, -0.018484115600585938, -0.01705169677734375, -0.015619277954101562, -0.014186859130859375, -0.012754440307617188, -0.011322021484375, -0.009889602661132812, -0.008457183837890625, -0.0070247650146484375, -0.00559234619140625, -0.0041599273681640625, -0.002727508544921875, -0.0012950897216796875, 0.0001373291015625, 0.0015697479248046875, 0.003002166748046875, 0.0044345855712890625, 0.00586700439453125, 0.0072994232177734375, 0.008731842041015625, 0.010164260864257812, 0.0115966796875, 0.013029098510742188, 0.014461517333984375, 0.015893936157226562, 0.01732635498046875, 0.018758773803710938, 0.020191192626953125, 0.021623611450195312, 0.0230560302734375, 0.024488449096679688, 0.025920867919921875, 0.027353286743164062, 0.02878570556640625, 0.030218124389648438, 0.031650543212890625, 0.03308296203613281, 0.034515380859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 6.0, 11.0, 16.0, 11.0, 18.0, 24.0, 46.0, 46.0, 61.0, 97.0, 140.0, 191.0, 322.0, 613.0, 1564.0, 4740.0, 18360.0, 79920.0, 347452.0, 443250.0, 115763.0, 25621.0, 6406.0, 1953.0, 780.0, 380.0, 210.0, 145.0, 124.0, 76.0, 60.0, 37.0, 36.0, 16.0, 20.0, 13.0, 8.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050262451171875, -0.04853630065917969, -0.046810150146484375, -0.04508399963378906, -0.04335784912109375, -0.04163169860839844, -0.039905548095703125, -0.03817939758300781, -0.0364532470703125, -0.03472709655761719, -0.033000946044921875, -0.03127479553222656, -0.02954864501953125, -0.027822494506835938, -0.026096343994140625, -0.024370193481445312, -0.02264404296875, -0.020917892456054688, -0.019191741943359375, -0.017465591430664062, -0.01573944091796875, -0.014013290405273438, -0.012287139892578125, -0.010560989379882812, -0.0088348388671875, -0.0071086883544921875, -0.005382537841796875, -0.0036563873291015625, -0.00193023681640625, -0.0002040863037109375, 0.001522064208984375, 0.0032482147216796875, 0.004974365234375, 0.0067005157470703125, 0.008426666259765625, 0.010152816772460938, 0.01187896728515625, 0.013605117797851562, 0.015331268310546875, 0.017057418823242188, 0.0187835693359375, 0.020509719848632812, 0.022235870361328125, 0.023962020874023438, 0.02568817138671875, 0.027414321899414062, 0.029140472412109375, 0.030866622924804688, 0.0325927734375, 0.03431892395019531, 0.036045074462890625, 0.03777122497558594, 0.03949737548828125, 0.04122352600097656, 0.042949676513671875, 0.04467582702636719, 0.0464019775390625, 0.04812812805175781, 0.049854278564453125, 0.05158042907714844, 0.05330657958984375, 0.05503273010253906, 0.056758880615234375, 0.05848503112792969, 0.060211181640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 5.0, 19.0, 5.0, 11.0, 17.0, 19.0, 22.0, 28.0, 36.0, 20.0, 25.0, 30.0, 38.0, 45.0, 55.0, 51.0, 33.0, 52.0, 36.0, 40.0, 49.0, 45.0, 41.0, 42.0, 27.0, 35.0, 22.0, 14.0, 21.0, 21.0, 10.0, 17.0, 14.0, 5.0, 13.0, 6.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0706787109375, -0.06822967529296875, -0.0657806396484375, -0.06333160400390625, -0.060882568359375, -0.05843353271484375, -0.0559844970703125, -0.05353546142578125, -0.05108642578125, -0.04863739013671875, -0.0461883544921875, -0.04373931884765625, -0.041290283203125, -0.03884124755859375, -0.0363922119140625, -0.03394317626953125, -0.031494140625, -0.02904510498046875, -0.0265960693359375, -0.02414703369140625, -0.021697998046875, -0.01924896240234375, -0.0167999267578125, -0.01435089111328125, -0.01190185546875, -0.00945281982421875, -0.0070037841796875, -0.00455474853515625, -0.002105712890625, 0.00034332275390625, 0.0027923583984375, 0.00524139404296875, 0.0076904296875, 0.01013946533203125, 0.0125885009765625, 0.01503753662109375, 0.017486572265625, 0.01993560791015625, 0.0223846435546875, 0.02483367919921875, 0.02728271484375, 0.02973175048828125, 0.0321807861328125, 0.03462982177734375, 0.037078857421875, 0.03952789306640625, 0.0419769287109375, 0.04442596435546875, 0.046875, 0.04932403564453125, 0.0517730712890625, 0.05422210693359375, 0.056671142578125, 0.05912017822265625, 0.0615692138671875, 0.06401824951171875, 0.06646728515625, 0.06891632080078125, 0.0713653564453125, 0.07381439208984375, 0.076263427734375, 0.07871246337890625, 0.0811614990234375, 0.08361053466796875, 0.0860595703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 8.0, 2.0, 5.0, 5.0, 8.0, 21.0, 41.0, 50.0, 101.0, 238.0, 546.0, 1852.0, 8157.0, 53515.0, 380313.0, 505834.0, 82191.0, 12047.0, 2432.0, 647.0, 273.0, 114.0, 76.0, 33.0, 20.0, 8.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0217742919921875, -0.02074265480041504, -0.019711017608642578, -0.018679380416870117, -0.017647743225097656, -0.016616106033325195, -0.015584468841552734, -0.014552831649780273, -0.013521194458007812, -0.012489557266235352, -0.01145792007446289, -0.01042628288269043, -0.009394645690917969, -0.008363008499145508, -0.007331371307373047, -0.006299734115600586, -0.005268096923828125, -0.004236459732055664, -0.003204822540283203, -0.002173185348510742, -0.0011415481567382812, -0.00010991096496582031, 0.0009217262268066406, 0.0019533634185791016, 0.0029850006103515625, 0.0040166378021240234, 0.005048274993896484, 0.006079912185668945, 0.007111549377441406, 0.008143186569213867, 0.009174823760986328, 0.010206460952758789, 0.01123809814453125, 0.012269735336303711, 0.013301372528076172, 0.014333009719848633, 0.015364646911621094, 0.016396284103393555, 0.017427921295166016, 0.018459558486938477, 0.019491195678710938, 0.0205228328704834, 0.02155447006225586, 0.02258610725402832, 0.02361774444580078, 0.024649381637573242, 0.025681018829345703, 0.026712656021118164, 0.027744293212890625, 0.028775930404663086, 0.029807567596435547, 0.030839204788208008, 0.03187084197998047, 0.03290247917175293, 0.03393411636352539, 0.03496575355529785, 0.03599739074707031, 0.03702902793884277, 0.038060665130615234, 0.039092302322387695, 0.040123939514160156, 0.04115557670593262, 0.04218721389770508, 0.04321885108947754, 0.04425048828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 8.0, 9.0, 15.0, 18.0, 41.0, 65.0, 123.0, 182.0, 198.0, 143.0, 96.0, 39.0, 24.0, 18.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015091896057128906, -0.00014574453234672546, -0.00014057010412216187, -0.00013539567589759827, -0.00013022124767303467, -0.00012504681944847107, -0.00011987239122390747, -0.00011469796299934387, -0.00010952353477478027, -0.00010434910655021667, -9.917467832565308e-05, -9.400025010108948e-05, -8.882582187652588e-05, -8.365139365196228e-05, -7.847696542739868e-05, -7.330253720283508e-05, -6.812810897827148e-05, -6.295368075370789e-05, -5.777925252914429e-05, -5.260482430458069e-05, -4.743039608001709e-05, -4.225596785545349e-05, -3.708153963088989e-05, -3.1907111406326294e-05, -2.6732683181762695e-05, -2.1558254957199097e-05, -1.6383826732635498e-05, -1.12093985080719e-05, -6.034970283508301e-06, -8.605420589447021e-07, 4.3138861656188965e-06, 9.488314390182495e-06, 1.4662742614746094e-05, 1.9837170839309692e-05, 2.501159906387329e-05, 3.018602728843689e-05, 3.536045551300049e-05, 4.053488373756409e-05, 4.5709311962127686e-05, 5.0883740186691284e-05, 5.605816841125488e-05, 6.123259663581848e-05, 6.640702486038208e-05, 7.158145308494568e-05, 7.675588130950928e-05, 8.193030953407288e-05, 8.710473775863647e-05, 9.227916598320007e-05, 9.745359420776367e-05, 0.00010262802243232727, 0.00010780245065689087, 0.00011297687888145447, 0.00011815130710601807, 0.00012332573533058167, 0.00012850016355514526, 0.00013367459177970886, 0.00013884902000427246, 0.00014402344822883606, 0.00014919787645339966, 0.00015437230467796326, 0.00015954673290252686, 0.00016472116112709045, 0.00016989558935165405, 0.00017507001757621765, 0.00018024444580078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 15.0, 13.0, 22.0, 35.0, 48.0, 107.0, 173.0, 357.0, 705.0, 1665.0, 4966.0, 22457.0, 139911.0, 612908.0, 221600.0, 32827.0, 6798.0, 2076.0, 881.0, 461.0, 212.0, 112.0, 68.0, 44.0, 24.0, 15.0, 18.0, 10.0, 5.0, 3.0, 0.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.038909912109375, -0.03787541389465332, -0.03684091567993164, -0.03580641746520996, -0.03477191925048828, -0.0337374210357666, -0.03270292282104492, -0.03166842460632324, -0.030633926391601562, -0.029599428176879883, -0.028564929962158203, -0.027530431747436523, -0.026495933532714844, -0.025461435317993164, -0.024426937103271484, -0.023392438888549805, -0.022357940673828125, -0.021323442459106445, -0.020288944244384766, -0.019254446029663086, -0.018219947814941406, -0.017185449600219727, -0.016150951385498047, -0.015116453170776367, -0.014081954956054688, -0.013047456741333008, -0.012012958526611328, -0.010978460311889648, -0.009943962097167969, -0.008909463882446289, -0.00787496566772461, -0.00684046745300293, -0.00580596923828125, -0.00477147102355957, -0.0037369728088378906, -0.002702474594116211, -0.0016679763793945312, -0.0006334781646728516, 0.0004010200500488281, 0.0014355182647705078, 0.0024700164794921875, 0.003504514694213867, 0.004539012908935547, 0.0055735111236572266, 0.006608009338378906, 0.007642507553100586, 0.008677005767822266, 0.009711503982543945, 0.010746002197265625, 0.011780500411987305, 0.012814998626708984, 0.013849496841430664, 0.014883995056152344, 0.015918493270874023, 0.016952991485595703, 0.017987489700317383, 0.019021987915039062, 0.020056486129760742, 0.021090984344482422, 0.0221254825592041, 0.02315998077392578, 0.02419447898864746, 0.02522897720336914, 0.02626347541809082, 0.0272979736328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 6.0, 6.0, 14.0, 21.0, 27.0, 41.0, 67.0, 119.0, 146.0, 133.0, 100.0, 101.0, 75.0, 52.0, 34.0, 26.0, 16.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047210693359375, -0.04609107971191406, -0.044971466064453125, -0.04385185241699219, -0.04273223876953125, -0.04161262512207031, -0.040493011474609375, -0.03937339782714844, -0.0382537841796875, -0.03713417053222656, -0.036014556884765625, -0.03489494323730469, -0.03377532958984375, -0.03265571594238281, -0.031536102294921875, -0.030416488647460938, -0.029296875, -0.028177261352539062, -0.027057647705078125, -0.025938034057617188, -0.02481842041015625, -0.023698806762695312, -0.022579193115234375, -0.021459579467773438, -0.0203399658203125, -0.019220352172851562, -0.018100738525390625, -0.016981124877929688, -0.01586151123046875, -0.014741897583007812, -0.013622283935546875, -0.012502670288085938, -0.011383056640625, -0.010263442993164062, -0.009143829345703125, -0.008024215698242188, -0.00690460205078125, -0.0057849884033203125, -0.004665374755859375, -0.0035457611083984375, -0.0024261474609375, -0.0013065338134765625, -0.000186920166015625, 0.0009326934814453125, 0.00205230712890625, 0.0031719207763671875, 0.004291534423828125, 0.0054111480712890625, 0.00653076171875, 0.0076503753662109375, 0.008769989013671875, 0.009889602661132812, 0.01100921630859375, 0.012128829956054688, 0.013248443603515625, 0.014368057250976562, 0.0154876708984375, 0.016607284545898438, 0.017726898193359375, 0.018846511840820312, 0.01996612548828125, 0.021085739135742188, 0.022205352783203125, 0.023324966430664062, 0.024444580078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 48.0, 292.0, 457.0, 177.0, 22.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6047021150588989, -0.559441864490509, -0.5141816139221191, -0.468921422958374, -0.42366117238998413, -0.37840092182159424, -0.33314070105552673, -0.28788048028945923, -0.24262022972106934, -0.19735999405384064, -0.15209975838661194, -0.10683952271938324, -0.06157928705215454, -0.016319051384925842, 0.028941184282302856, 0.07420140504837036, 0.11946165561676025, 0.16472189128398895, 0.20998212695121765, 0.25524234771728516, 0.30050259828567505, 0.34576284885406494, 0.39102306962013245, 0.43628329038619995, 0.48154354095458984, 0.5268037915229797, 0.5720640420913696, 0.6173242330551147, 0.6625844836235046, 0.7078447341918945, 0.7531049251556396, 0.7983651757240295, 0.843625545501709, 0.8888857960700989, 0.9341460466384888, 0.9794062376022339, 1.0246665477752686, 1.0699267387390137, 1.1151869297027588, 1.160447120666504, 1.2057074308395386, 1.2509676218032837, 1.2962279319763184, 1.3414881229400635, 1.3867483139038086, 1.4320086240768433, 1.4772688150405884, 1.522529125213623, 1.5677893161773682, 1.6130495071411133, 1.658309817314148, 1.703570008277893, 1.7488303184509277, 1.7940905094146729, 1.839350700378418, 1.884610891342163, 1.9298712015151978, 1.9751313924789429, 2.0203917026519775, 2.0656518936157227, 2.1109120845794678, 2.156172275543213, 2.201432704925537, 2.2466928958892822, 2.2919530868530273]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 5.0, 7.0, 12.0, 12.0, 9.0, 17.0, 12.0, 22.0, 24.0, 20.0, 29.0, 31.0, 42.0, 32.0, 34.0, 31.0, 32.0, 35.0, 42.0, 59.0, 41.0, 53.0, 48.0, 37.0, 45.0, 31.0, 25.0, 28.0, 25.0, 24.0, 24.0, 22.0, 16.0, 14.0, 11.0, 10.0, 10.0, 8.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.4116557240486145, -0.3999914526939392, -0.3883271813392639, -0.3766629099845886, -0.36499863862991333, -0.35333436727523804, -0.34167009592056274, -0.33000582456588745, -0.31834155321121216, -0.30667728185653687, -0.2950130105018616, -0.2833487391471863, -0.271684467792511, -0.2600201964378357, -0.2483559250831604, -0.2366916537284851, -0.22502738237380981, -0.21336311101913452, -0.20169883966445923, -0.19003456830978394, -0.17837029695510864, -0.16670602560043335, -0.15504175424575806, -0.14337748289108276, -0.13171321153640747, -0.12004894018173218, -0.10838466882705688, -0.09672039747238159, -0.0850561261177063, -0.073391854763031, -0.06172758340835571, -0.05006331205368042, -0.03839904069900513, -0.026734769344329834, -0.015070497989654541, -0.003406226634979248, 0.008258044719696045, 0.019922316074371338, 0.03158658742904663, 0.043250858783721924, 0.05491513013839722, 0.06657940149307251, 0.0782436728477478, 0.0899079442024231, 0.10157221555709839, 0.11323648691177368, 0.12490075826644897, 0.13656502962112427, 0.14822930097579956, 0.15989357233047485, 0.17155784368515015, 0.18322211503982544, 0.19488638639450073, 0.20655065774917603, 0.21821492910385132, 0.2298792004585266, 0.2415434718132019, 0.2532077431678772, 0.2648720145225525, 0.2765362858772278, 0.2882005572319031, 0.29986482858657837, 0.31152909994125366, 0.32319337129592896, 0.33485764265060425]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 7.0, 17.0, 11.0, 17.0, 32.0, 35.0, 86.0, 108.0, 220.0, 505.0, 1227.0, 4271.0, 19185.0, 265842.0, 3839432.0, 50845.0, 8351.0, 2327.0, 880.0, 395.0, 191.0, 99.0, 78.0, 47.0, 25.0, 16.0, 10.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1412353515625, -0.13623619079589844, -0.13123703002929688, -0.1262378692626953, -0.12123870849609375, -0.11623954772949219, -0.11124038696289062, -0.10624122619628906, -0.1012420654296875, -0.09624290466308594, -0.09124374389648438, -0.08624458312988281, -0.08124542236328125, -0.07624626159667969, -0.07124710083007812, -0.06624794006347656, -0.061248779296875, -0.05624961853027344, -0.051250457763671875, -0.04625129699707031, -0.04125213623046875, -0.03625297546386719, -0.031253814697265625, -0.026254653930664062, -0.0212554931640625, -0.016256332397460938, -0.011257171630859375, -0.0062580108642578125, -0.00125885009765625, 0.0037403106689453125, 0.008739471435546875, 0.013738632202148438, 0.01873779296875, 0.023736953735351562, 0.028736114501953125, 0.03373527526855469, 0.03873443603515625, 0.04373359680175781, 0.048732757568359375, 0.05373191833496094, 0.0587310791015625, 0.06373023986816406, 0.06872940063476562, 0.07372856140136719, 0.07872772216796875, 0.08372688293457031, 0.08872604370117188, 0.09372520446777344, 0.098724365234375, 0.10372352600097656, 0.10872268676757812, 0.11372184753417969, 0.11872100830078125, 0.12372016906738281, 0.12871932983398438, 0.13371849060058594, 0.1387176513671875, 0.14371681213378906, 0.14871597290039062, 0.1537151336669922, 0.15871429443359375, 0.1637134552001953, 0.16871261596679688, 0.17371177673339844, 0.1787109375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 10.0, 19.0, 27.0, 32.0, 45.0, 65.0, 70.0, 80.0, 77.0, 84.0, 89.0, 82.0, 73.0, 74.0, 39.0, 33.0, 24.0, 20.0, 11.0, 8.0, 5.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.054412841796875, -0.05303812026977539, -0.05166339874267578, -0.05028867721557617, -0.04891395568847656, -0.04753923416137695, -0.046164512634277344, -0.044789791107177734, -0.043415069580078125, -0.042040348052978516, -0.040665626525878906, -0.0392909049987793, -0.03791618347167969, -0.03654146194458008, -0.03516674041748047, -0.03379201889038086, -0.03241729736328125, -0.03104257583618164, -0.02966785430908203, -0.028293132781982422, -0.026918411254882812, -0.025543689727783203, -0.024168968200683594, -0.022794246673583984, -0.021419525146484375, -0.020044803619384766, -0.018670082092285156, -0.017295360565185547, -0.015920639038085938, -0.014545917510986328, -0.013171195983886719, -0.01179647445678711, -0.0104217529296875, -0.00904703140258789, -0.007672309875488281, -0.006297588348388672, -0.0049228668212890625, -0.003548145294189453, -0.0021734237670898438, -0.0007987022399902344, 0.000576019287109375, 0.0019507408142089844, 0.0033254623413085938, 0.004700183868408203, 0.0060749053955078125, 0.007449626922607422, 0.008824348449707031, 0.01019906997680664, 0.01157379150390625, 0.01294851303100586, 0.014323234558105469, 0.015697956085205078, 0.017072677612304688, 0.018447399139404297, 0.019822120666503906, 0.021196842193603516, 0.022571563720703125, 0.023946285247802734, 0.025321006774902344, 0.026695728302001953, 0.028070449829101562, 0.029445171356201172, 0.03081989288330078, 0.03219461441040039, 0.0335693359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 8.0, 12.0, 20.0, 41.0, 71.0, 122.0, 235.0, 448.0, 830.0, 1793.0, 4568.0, 16278.0, 100986.0, 3208359.0, 795108.0, 49183.0, 10263.0, 3227.0, 1364.0, 659.0, 308.0, 157.0, 99.0, 51.0, 32.0, 19.0, 12.0, 8.0, 6.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.090576171875, -0.0875396728515625, -0.084503173828125, -0.0814666748046875, -0.07843017578125, -0.0753936767578125, -0.072357177734375, -0.0693206787109375, -0.0662841796875, -0.0632476806640625, -0.060211181640625, -0.0571746826171875, -0.05413818359375, -0.0511016845703125, -0.048065185546875, -0.0450286865234375, -0.0419921875, -0.0389556884765625, -0.035919189453125, -0.0328826904296875, -0.02984619140625, -0.0268096923828125, -0.023773193359375, -0.0207366943359375, -0.0177001953125, -0.0146636962890625, -0.011627197265625, -0.0085906982421875, -0.00555419921875, -0.0025177001953125, 0.000518798828125, 0.0035552978515625, 0.006591796875, 0.0096282958984375, 0.012664794921875, 0.0157012939453125, 0.01873779296875, 0.0217742919921875, 0.024810791015625, 0.0278472900390625, 0.0308837890625, 0.0339202880859375, 0.036956787109375, 0.0399932861328125, 0.04302978515625, 0.0460662841796875, 0.049102783203125, 0.0521392822265625, 0.05517578125, 0.0582122802734375, 0.061248779296875, 0.0642852783203125, 0.06732177734375, 0.0703582763671875, 0.073394775390625, 0.0764312744140625, 0.0794677734375, 0.0825042724609375, 0.085540771484375, 0.0885772705078125, 0.09161376953125, 0.0946502685546875, 0.097686767578125, 0.1007232666015625, 0.103759765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 14.0, 25.0, 38.0, 104.0, 205.0, 710.0, 1997.0, 571.0, 188.0, 77.0, 48.0, 24.0, 17.0, 10.0, 9.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055206298828125, -0.053690433502197266, -0.05217456817626953, -0.0506587028503418, -0.04914283752441406, -0.04762697219848633, -0.046111106872558594, -0.04459524154663086, -0.043079376220703125, -0.04156351089477539, -0.040047645568847656, -0.03853178024291992, -0.03701591491699219, -0.03550004959106445, -0.03398418426513672, -0.032468318939208984, -0.03095245361328125, -0.029436588287353516, -0.02792072296142578, -0.026404857635498047, -0.024888992309570312, -0.023373126983642578, -0.021857261657714844, -0.02034139633178711, -0.018825531005859375, -0.01730966567993164, -0.015793800354003906, -0.014277935028076172, -0.012762069702148438, -0.011246204376220703, -0.009730339050292969, -0.008214473724365234, -0.0066986083984375, -0.005182743072509766, -0.0036668777465820312, -0.002151012420654297, -0.0006351470947265625, 0.0008807182312011719, 0.0023965835571289062, 0.003912448883056641, 0.005428314208984375, 0.006944179534912109, 0.008460044860839844, 0.009975910186767578, 0.011491775512695312, 0.013007640838623047, 0.014523506164550781, 0.016039371490478516, 0.01755523681640625, 0.019071102142333984, 0.02058696746826172, 0.022102832794189453, 0.023618698120117188, 0.025134563446044922, 0.026650428771972656, 0.02816629409790039, 0.029682159423828125, 0.03119802474975586, 0.032713890075683594, 0.03422975540161133, 0.03574562072753906, 0.0372614860534668, 0.03877735137939453, 0.040293216705322266, 0.04180908203125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 59.0, 300.0, 444.0, 167.0, 16.0, 5.0, 2.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29908138513565063, -0.279452383518219, -0.25982338190078735, -0.2401943802833557, -0.22056537866592407, -0.20093637704849243, -0.1813073754310608, -0.16167837381362915, -0.1420493721961975, -0.12242037057876587, -0.10279136896133423, -0.08316236734390259, -0.06353336572647095, -0.04390436410903931, -0.024275362491607666, -0.004646360874176025, 0.014982640743255615, 0.034611642360687256, 0.054240643978118896, 0.07386964559555054, 0.09349864721298218, 0.11312764883041382, 0.13275665044784546, 0.1523856520652771, 0.17201465368270874, 0.19164365530014038, 0.21127265691757202, 0.23090165853500366, 0.2505306601524353, 0.27015966176986694, 0.2897886633872986, 0.3094176650047302, 0.32904666662216187, 0.3486756682395935, 0.36830466985702515, 0.3879336714744568, 0.4075626730918884, 0.42719167470932007, 0.4468206763267517, 0.46644967794418335, 0.486078679561615, 0.5057076811790466, 0.5253366827964783, 0.5449656844139099, 0.5645946860313416, 0.5842236876487732, 0.6038526892662048, 0.6234816908836365, 0.6431106925010681, 0.6627396941184998, 0.6823686957359314, 0.701997697353363, 0.7216266989707947, 0.7412557005882263, 0.760884702205658, 0.7805137038230896, 0.8001427054405212, 0.8197717070579529, 0.8394007086753845, 0.8590297102928162, 0.8786587119102478, 0.8982877135276794, 0.9179167151451111, 0.9375457167625427, 0.9571747183799744]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 2.0, 14.0, 14.0, 17.0, 19.0, 28.0, 55.0, 46.0, 73.0, 84.0, 72.0, 83.0, 76.0, 80.0, 80.0, 69.0, 54.0, 43.0, 28.0, 23.0, 11.0, 7.0, 11.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.23309898376464844, -0.2276722490787506, -0.22224551439285278, -0.21681877970695496, -0.21139205992221832, -0.2059653252363205, -0.20053859055042267, -0.19511185586452484, -0.1896851360797882, -0.18425840139389038, -0.17883166670799255, -0.17340493202209473, -0.1679782122373581, -0.16255147755146027, -0.15712474286556244, -0.1516980081796646, -0.14627127349376678, -0.14084453880786896, -0.13541780412197113, -0.1299910843372345, -0.12456434965133667, -0.11913761496543884, -0.11371088027954102, -0.10828414559364319, -0.10285741835832596, -0.09743068367242813, -0.0920039564371109, -0.08657722175121307, -0.08115048706531525, -0.07572375982999802, -0.07029702514410019, -0.06487029790878296, -0.05944356322288513, -0.0540168322622776, -0.048590101301670074, -0.04316336661577225, -0.03773663565516472, -0.03230990469455719, -0.026883170008659363, -0.021456439048051834, -0.016029708087444305, -0.010602976195514202, -0.005176244303584099, 0.0002504885196685791, 0.005677219480276108, 0.011103950440883636, 0.016530685126781464, 0.021957416087388992, 0.02738414704799652, 0.03281087800860405, 0.03823760896921158, 0.043664343655109406, 0.049091074615716934, 0.05451780557632446, 0.05994454026222229, 0.06537127494812012, 0.07079800218343735, 0.07622473686933517, 0.0816514641046524, 0.08707819879055023, 0.09250493347644806, 0.09793166071176529, 0.10335839539766312, 0.10878512263298035, 0.11421185731887817]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 1.0, 3.0, 7.0, 8.0, 12.0, 16.0, 21.0, 27.0, 42.0, 62.0, 86.0, 139.0, 223.0, 368.0, 617.0, 1170.0, 2489.0, 6566.0, 24466.0, 126039.0, 501688.0, 305018.0, 58385.0, 12925.0, 4211.0, 1790.0, 886.0, 484.0, 271.0, 183.0, 113.0, 71.0, 57.0, 26.0, 23.0, 16.0, 13.0, 4.0, 10.0, 7.0, 5.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09063720703125, -0.08787155151367188, -0.08510589599609375, -0.08234024047851562, -0.0795745849609375, -0.07680892944335938, -0.07404327392578125, -0.07127761840820312, -0.068511962890625, -0.06574630737304688, -0.06298065185546875, -0.060214996337890625, -0.0574493408203125, -0.054683685302734375, -0.05191802978515625, -0.049152374267578125, -0.04638671875, -0.043621063232421875, -0.04085540771484375, -0.038089752197265625, -0.0353240966796875, -0.032558441162109375, -0.02979278564453125, -0.027027130126953125, -0.024261474609375, -0.021495819091796875, -0.01873016357421875, -0.015964508056640625, -0.0131988525390625, -0.010433197021484375, -0.00766754150390625, -0.004901885986328125, -0.00213623046875, 0.000629425048828125, 0.00339508056640625, 0.006160736083984375, 0.0089263916015625, 0.011692047119140625, 0.01445770263671875, 0.017223358154296875, 0.019989013671875, 0.022754669189453125, 0.02552032470703125, 0.028285980224609375, 0.0310516357421875, 0.033817291259765625, 0.03658294677734375, 0.039348602294921875, 0.0421142578125, 0.044879913330078125, 0.04764556884765625, 0.050411224365234375, 0.0531768798828125, 0.055942535400390625, 0.05870819091796875, 0.061473846435546875, 0.064239501953125, 0.06700515747070312, 0.06977081298828125, 0.07253646850585938, 0.0753021240234375, 0.07806777954101562, 0.08083343505859375, 0.08359909057617188, 0.08636474609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 11.0, 20.0, 24.0, 30.0, 35.0, 55.0, 66.0, 96.0, 88.0, 75.0, 92.0, 98.0, 71.0, 66.0, 52.0, 35.0, 27.0, 15.0, 11.0, 10.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05902099609375, -0.05750226974487305, -0.055983543395996094, -0.05446481704711914, -0.05294609069824219, -0.051427364349365234, -0.04990863800048828, -0.04838991165161133, -0.046871185302734375, -0.04535245895385742, -0.04383373260498047, -0.042315006256103516, -0.04079627990722656, -0.03927755355834961, -0.037758827209472656, -0.0362401008605957, -0.03472137451171875, -0.0332026481628418, -0.031683921813964844, -0.03016519546508789, -0.028646469116210938, -0.027127742767333984, -0.02560901641845703, -0.024090290069580078, -0.022571563720703125, -0.021052837371826172, -0.01953411102294922, -0.018015384674072266, -0.016496658325195312, -0.01497793197631836, -0.013459205627441406, -0.011940479278564453, -0.0104217529296875, -0.008903026580810547, -0.007384300231933594, -0.005865573883056641, -0.0043468475341796875, -0.0028281211853027344, -0.0013093948364257812, 0.00020933151245117188, 0.001728057861328125, 0.003246784210205078, 0.004765510559082031, 0.006284236907958984, 0.0078029632568359375, 0.00932168960571289, 0.010840415954589844, 0.012359142303466797, 0.01387786865234375, 0.015396595001220703, 0.016915321350097656, 0.01843404769897461, 0.019952774047851562, 0.021471500396728516, 0.02299022674560547, 0.024508953094482422, 0.026027679443359375, 0.027546405792236328, 0.02906513214111328, 0.030583858489990234, 0.03210258483886719, 0.03362131118774414, 0.035140037536621094, 0.03665876388549805, 0.038177490234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 7.0, 12.0, 17.0, 17.0, 26.0, 51.0, 39.0, 66.0, 83.0, 116.0, 194.0, 257.0, 322.0, 495.0, 809.0, 1417.0, 3335.0, 10149.0, 41712.0, 182447.0, 471188.0, 253292.0, 59326.0, 14288.0, 4312.0, 1776.0, 915.0, 545.0, 397.0, 268.0, 176.0, 125.0, 96.0, 69.0, 50.0, 37.0, 31.0, 12.0, 17.0, 18.0, 7.0, 10.0, 10.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049957275390625, -0.04827070236206055, -0.046584129333496094, -0.04489755630493164, -0.04321098327636719, -0.041524410247802734, -0.03983783721923828, -0.03815126419067383, -0.036464691162109375, -0.03477811813354492, -0.03309154510498047, -0.031404972076416016, -0.029718399047851562, -0.02803182601928711, -0.026345252990722656, -0.024658679962158203, -0.02297210693359375, -0.021285533905029297, -0.019598960876464844, -0.01791238784790039, -0.016225814819335938, -0.014539241790771484, -0.012852668762207031, -0.011166095733642578, -0.009479522705078125, -0.007792949676513672, -0.006106376647949219, -0.004419803619384766, -0.0027332305908203125, -0.0010466575622558594, 0.0006399154663085938, 0.002326488494873047, 0.0040130615234375, 0.005699634552001953, 0.007386207580566406, 0.00907278060913086, 0.010759353637695312, 0.012445926666259766, 0.014132499694824219, 0.015819072723388672, 0.017505645751953125, 0.019192218780517578, 0.02087879180908203, 0.022565364837646484, 0.024251937866210938, 0.02593851089477539, 0.027625083923339844, 0.029311656951904297, 0.03099822998046875, 0.0326848030090332, 0.034371376037597656, 0.03605794906616211, 0.03774452209472656, 0.039431095123291016, 0.04111766815185547, 0.04280424118041992, 0.044490814208984375, 0.04617738723754883, 0.04786396026611328, 0.049550533294677734, 0.05123710632324219, 0.05292367935180664, 0.054610252380371094, 0.05629682540893555, 0.0579833984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 9.0, 9.0, 9.0, 12.0, 17.0, 23.0, 40.0, 38.0, 30.0, 34.0, 50.0, 50.0, 44.0, 41.0, 53.0, 53.0, 47.0, 42.0, 55.0, 29.0, 54.0, 33.0, 37.0, 39.0, 21.0, 27.0, 17.0, 17.0, 13.0, 7.0, 10.0, 11.0, 7.0, 2.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09747314453125, -0.09418201446533203, -0.09089088439941406, -0.0875997543334961, -0.08430862426757812, -0.08101749420166016, -0.07772636413574219, -0.07443523406982422, -0.07114410400390625, -0.06785297393798828, -0.06456184387207031, -0.061270713806152344, -0.057979583740234375, -0.054688453674316406, -0.05139732360839844, -0.04810619354248047, -0.0448150634765625, -0.04152393341064453, -0.03823280334472656, -0.034941673278808594, -0.031650543212890625, -0.028359413146972656, -0.025068283081054688, -0.02177715301513672, -0.01848602294921875, -0.015194892883300781, -0.011903762817382812, -0.008612632751464844, -0.005321502685546875, -0.0020303726196289062, 0.0012607574462890625, 0.004551887512207031, 0.007843017578125, 0.011134147644042969, 0.014425277709960938, 0.017716407775878906, 0.021007537841796875, 0.024298667907714844, 0.027589797973632812, 0.03088092803955078, 0.03417205810546875, 0.03746318817138672, 0.04075431823730469, 0.044045448303222656, 0.047336578369140625, 0.050627708435058594, 0.05391883850097656, 0.05720996856689453, 0.0605010986328125, 0.06379222869873047, 0.06708335876464844, 0.0703744888305664, 0.07366561889648438, 0.07695674896240234, 0.08024787902832031, 0.08353900909423828, 0.08683013916015625, 0.09012126922607422, 0.09341239929199219, 0.09670352935791016, 0.09999465942382812, 0.1032857894897461, 0.10657691955566406, 0.10986804962158203, 0.1131591796875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 11.0, 15.0, 21.0, 74.0, 285.0, 1646.0, 72723.0, 956091.0, 16478.0, 934.0, 178.0, 56.0, 22.0, 11.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.094482421875, -0.09060287475585938, -0.08672332763671875, -0.08284378051757812, -0.0789642333984375, -0.07508468627929688, -0.07120513916015625, -0.06732559204101562, -0.063446044921875, -0.059566497802734375, -0.05568695068359375, -0.051807403564453125, -0.0479278564453125, -0.044048309326171875, -0.04016876220703125, -0.036289215087890625, -0.03240966796875, -0.028530120849609375, -0.02465057373046875, -0.020771026611328125, -0.0168914794921875, -0.013011932373046875, -0.00913238525390625, -0.005252838134765625, -0.001373291015625, 0.002506256103515625, 0.00638580322265625, 0.010265350341796875, 0.0141448974609375, 0.018024444580078125, 0.02190399169921875, 0.025783538818359375, 0.0296630859375, 0.033542633056640625, 0.03742218017578125, 0.041301727294921875, 0.0451812744140625, 0.049060821533203125, 0.05294036865234375, 0.056819915771484375, 0.060699462890625, 0.06457901000976562, 0.06845855712890625, 0.07233810424804688, 0.0762176513671875, 0.08009719848632812, 0.08397674560546875, 0.08785629272460938, 0.09173583984375, 0.09561538696289062, 0.09949493408203125, 0.10337448120117188, 0.1072540283203125, 0.11113357543945312, 0.11501312255859375, 0.11889266967773438, 0.122772216796875, 0.12665176391601562, 0.13053131103515625, 0.13441085815429688, 0.1382904052734375, 0.14216995239257812, 0.14604949951171875, 0.14992904663085938, 0.15380859375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 8.0, 12.0, 17.0, 24.0, 37.0, 51.0, 61.0, 76.0, 113.0, 146.0, 105.0, 90.0, 69.0, 46.0, 39.0, 28.0, 19.0, 16.0, 9.0, 8.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.543231964111328e-05, -5.227886140346527e-05, -4.912540316581726e-05, -4.597194492816925e-05, -4.281848669052124e-05, -3.966502845287323e-05, -3.651157021522522e-05, -3.335811197757721e-05, -3.02046537399292e-05, -2.705119550228119e-05, -2.389773726463318e-05, -2.074427902698517e-05, -1.7590820789337158e-05, -1.4437362551689148e-05, -1.1283904314041138e-05, -8.130446076393127e-06, -4.976987838745117e-06, -1.823529601097107e-06, 1.3299286365509033e-06, 4.4833868741989136e-06, 7.636845111846924e-06, 1.0790303349494934e-05, 1.3943761587142944e-05, 1.7097219824790955e-05, 2.0250678062438965e-05, 2.3404136300086975e-05, 2.6557594537734985e-05, 2.9711052775382996e-05, 3.2864511013031006e-05, 3.6017969250679016e-05, 3.9171427488327026e-05, 4.232488572597504e-05, 4.547834396362305e-05, 4.863180220127106e-05, 5.178526043891907e-05, 5.493871867656708e-05, 5.809217691421509e-05, 6.12456351518631e-05, 6.439909338951111e-05, 6.755255162715912e-05, 7.070600986480713e-05, 7.385946810245514e-05, 7.701292634010315e-05, 8.016638457775116e-05, 8.331984281539917e-05, 8.647330105304718e-05, 8.962675929069519e-05, 9.27802175283432e-05, 9.593367576599121e-05, 9.908713400363922e-05, 0.00010224059224128723, 0.00010539405047893524, 0.00010854750871658325, 0.00011170096695423126, 0.00011485442519187927, 0.00011800788342952728, 0.00012116134166717529, 0.0001243147999048233, 0.0001274682581424713, 0.00013062171638011932, 0.00013377517461776733, 0.00013692863285541534, 0.00014008209109306335, 0.00014323554933071136, 0.00014638900756835938]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 13.0, 19.0, 52.0, 107.0, 324.0, 1262.0, 17040.0, 945352.0, 81169.0, 2433.0, 491.0, 153.0, 61.0, 32.0, 19.0, 13.0, 8.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1512451171875, -0.1470041275024414, -0.1427631378173828, -0.13852214813232422, -0.13428115844726562, -0.13004016876220703, -0.12579917907714844, -0.12155818939208984, -0.11731719970703125, -0.11307621002197266, -0.10883522033691406, -0.10459423065185547, -0.10035324096679688, -0.09611225128173828, -0.09187126159667969, -0.0876302719116211, -0.0833892822265625, -0.0791482925415039, -0.07490730285644531, -0.07066631317138672, -0.06642532348632812, -0.06218433380126953, -0.05794334411621094, -0.053702354431152344, -0.04946136474609375, -0.045220375061035156, -0.04097938537597656, -0.03673839569091797, -0.032497406005859375, -0.02825641632080078, -0.024015426635742188, -0.019774436950683594, -0.015533447265625, -0.011292457580566406, -0.0070514678955078125, -0.0028104782104492188, 0.001430511474609375, 0.005671501159667969, 0.009912490844726562, 0.014153480529785156, 0.01839447021484375, 0.022635459899902344, 0.026876449584960938, 0.03111743927001953, 0.035358428955078125, 0.03959941864013672, 0.04384040832519531, 0.048081398010253906, 0.0523223876953125, 0.056563377380371094, 0.06080436706542969, 0.06504535675048828, 0.06928634643554688, 0.07352733612060547, 0.07776832580566406, 0.08200931549072266, 0.08625030517578125, 0.09049129486083984, 0.09473228454589844, 0.09897327423095703, 0.10321426391601562, 0.10745525360107422, 0.11169624328613281, 0.1159372329711914, 0.12017822265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 8.0, 6.0, 26.0, 49.0, 67.0, 106.0, 176.0, 173.0, 181.0, 88.0, 64.0, 33.0, 12.0, 11.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047607421875, -0.045014381408691406, -0.04242134094238281, -0.03982830047607422, -0.037235260009765625, -0.03464221954345703, -0.03204917907714844, -0.029456138610839844, -0.02686309814453125, -0.024270057678222656, -0.021677017211914062, -0.01908397674560547, -0.016490936279296875, -0.013897895812988281, -0.011304855346679688, -0.008711814880371094, -0.0061187744140625, -0.0035257339477539062, -0.0009326934814453125, 0.0016603469848632812, 0.004253387451171875, 0.006846427917480469, 0.009439468383789062, 0.012032508850097656, 0.01462554931640625, 0.017218589782714844, 0.019811630249023438, 0.02240467071533203, 0.024997711181640625, 0.02759075164794922, 0.030183792114257812, 0.032776832580566406, 0.035369873046875, 0.037962913513183594, 0.04055595397949219, 0.04314899444580078, 0.045742034912109375, 0.04833507537841797, 0.05092811584472656, 0.053521156311035156, 0.05611419677734375, 0.058707237243652344, 0.06130027770996094, 0.06389331817626953, 0.06648635864257812, 0.06907939910888672, 0.07167243957519531, 0.0742654800415039, 0.0768585205078125, 0.0794515609741211, 0.08204460144042969, 0.08463764190673828, 0.08723068237304688, 0.08982372283935547, 0.09241676330566406, 0.09500980377197266, 0.09760284423828125, 0.10019588470458984, 0.10278892517089844, 0.10538196563720703, 0.10797500610351562, 0.11056804656982422, 0.11316108703613281, 0.1157541275024414, 0.11834716796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 11.0, 29.0, 154.0, 423.0, 272.0, 75.0, 27.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7266422510147095, -0.6774941682815552, -0.6283460855484009, -0.5791980028152466, -0.5300499200820923, -0.4809018671512604, -0.43175381422042847, -0.38260573148727417, -0.3334576487541199, -0.2843095660209656, -0.23516149818897247, -0.18601343035697937, -0.13686534762382507, -0.08771726489067078, -0.03856921195983887, 0.01057887077331543, 0.05972695350646973, 0.10887502878904343, 0.15802310407161713, 0.20717117190361023, 0.2563192546367645, 0.3054673373699188, 0.35461539030075073, 0.40376347303390503, 0.4529115557670593, 0.5020596385002136, 0.5512077212333679, 0.6003557443618774, 0.6495038270950317, 0.698651909828186, 0.7477999925613403, 0.7969480752944946, 0.8460962772369385, 0.8952443599700928, 0.9443924427032471, 0.9935405254364014, 1.0426886081695557, 1.09183669090271, 1.1409847736358643, 1.1901328563690186, 1.2392809391021729, 1.2884290218353271, 1.3375771045684814, 1.3867251873016357, 1.43587327003479, 1.4850213527679443, 1.5341694355010986, 1.583317518234253, 1.6324654817581177, 1.681613564491272, 1.7307616472244263, 1.7799097299575806, 1.8290578126907349, 1.8782058954238892, 1.927353858947754, 1.9765019416809082, 2.0256500244140625, 2.074798107147217, 2.123946189880371, 2.1730942726135254, 2.2222423553466797, 2.271390438079834, 2.3205385208129883, 2.3696866035461426, 2.418834686279297]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 5.0, 2.0, 8.0, 3.0, 10.0, 10.0, 11.0, 14.0, 15.0, 18.0, 25.0, 27.0, 32.0, 26.0, 31.0, 33.0, 40.0, 42.0, 35.0, 31.0, 41.0, 44.0, 45.0, 39.0, 33.0, 30.0, 24.0, 31.0, 43.0, 31.0, 32.0, 37.0, 24.0, 15.0, 20.0, 12.0, 13.0, 10.0, 11.0, 13.0, 8.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4197768568992615, -0.40610626339912415, -0.3924356698989868, -0.3787651062011719, -0.36509451270103455, -0.3514239192008972, -0.3377533257007599, -0.32408273220062256, -0.31041213870048523, -0.2967415452003479, -0.28307095170021057, -0.26940035820007324, -0.2557297945022583, -0.24205920100212097, -0.22838860750198364, -0.2147180140018463, -0.20104743540287018, -0.18737684190273285, -0.1737062633037567, -0.16003566980361938, -0.14636507630348206, -0.13269448280334473, -0.11902390420436859, -0.10535331070423126, -0.09168272465467453, -0.0780121386051178, -0.06434154510498047, -0.05067095905542374, -0.037000369280576706, -0.023329779505729675, -0.009659193456172943, 0.004011400043964386, 0.017681986093521118, 0.03135257586836815, 0.04502316564321518, 0.05869375169277191, 0.07236434519290924, 0.08603493124246597, 0.0997055172920227, 0.11337611079216003, 0.12704670429229736, 0.1407172977924347, 0.15438787639141083, 0.16805846989154816, 0.18172906339168549, 0.19539964199066162, 0.20907023549079895, 0.22274082899093628, 0.23641140758991241, 0.25008198618888855, 0.2637525796890259, 0.2774231731891632, 0.29109376668930054, 0.30476436018943787, 0.3184349536895752, 0.33210551738739014, 0.34577611088752747, 0.3594467043876648, 0.3731172978878021, 0.38678789138793945, 0.4004584550857544, 0.4141290485858917, 0.42779964208602905, 0.4414702355861664, 0.4551408290863037]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 14.0, 21.0, 43.0, 76.0, 148.0, 338.0, 731.0, 2066.0, 8679.0, 94694.0, 3979959.0, 95322.0, 8550.0, 2094.0, 760.0, 344.0, 158.0, 94.0, 68.0, 35.0, 19.0, 14.0, 13.0, 10.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2100830078125, -0.2048959732055664, -0.1997089385986328, -0.19452190399169922, -0.18933486938476562, -0.18414783477783203, -0.17896080017089844, -0.17377376556396484, -0.16858673095703125, -0.16339969635009766, -0.15821266174316406, -0.15302562713623047, -0.14783859252929688, -0.14265155792236328, -0.1374645233154297, -0.1322774887084961, -0.1270904541015625, -0.1219034194946289, -0.11671638488769531, -0.11152935028076172, -0.10634231567382812, -0.10115528106689453, -0.09596824645996094, -0.09078121185302734, -0.08559417724609375, -0.08040714263916016, -0.07522010803222656, -0.07003307342529297, -0.06484603881835938, -0.05965900421142578, -0.05447196960449219, -0.049284934997558594, -0.044097900390625, -0.038910865783691406, -0.03372383117675781, -0.02853679656982422, -0.023349761962890625, -0.01816272735595703, -0.012975692749023438, -0.007788658142089844, -0.00260162353515625, 0.0025854110717773438, 0.0077724456787109375, 0.012959480285644531, 0.018146514892578125, 0.02333354949951172, 0.028520584106445312, 0.033707618713378906, 0.0388946533203125, 0.044081687927246094, 0.04926872253417969, 0.05445575714111328, 0.059642791748046875, 0.06482982635498047, 0.07001686096191406, 0.07520389556884766, 0.08039093017578125, 0.08557796478271484, 0.09076499938964844, 0.09595203399658203, 0.10113906860351562, 0.10632610321044922, 0.11151313781738281, 0.1167001724243164, 0.12188720703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 3.0, 12.0, 12.0, 13.0, 32.0, 25.0, 33.0, 52.0, 53.0, 69.0, 84.0, 76.0, 82.0, 83.0, 78.0, 66.0, 56.0, 45.0, 36.0, 25.0, 14.0, 16.0, 10.0, 9.0, 5.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.054443359375, -0.053061485290527344, -0.05167961120605469, -0.05029773712158203, -0.048915863037109375, -0.04753398895263672, -0.04615211486816406, -0.044770240783691406, -0.04338836669921875, -0.042006492614746094, -0.04062461853027344, -0.03924274444580078, -0.037860870361328125, -0.03647899627685547, -0.03509712219238281, -0.033715248107910156, -0.0323333740234375, -0.030951499938964844, -0.029569625854492188, -0.02818775177001953, -0.026805877685546875, -0.02542400360107422, -0.024042129516601562, -0.022660255432128906, -0.02127838134765625, -0.019896507263183594, -0.018514633178710938, -0.01713275909423828, -0.015750885009765625, -0.014369010925292969, -0.012987136840820312, -0.011605262756347656, -0.010223388671875, -0.008841514587402344, -0.0074596405029296875, -0.006077766418457031, -0.004695892333984375, -0.0033140182495117188, -0.0019321441650390625, -0.0005502700805664062, 0.00083160400390625, 0.0022134780883789062, 0.0035953521728515625, 0.004977226257324219, 0.006359100341796875, 0.007740974426269531, 0.009122848510742188, 0.010504722595214844, 0.0118865966796875, 0.013268470764160156, 0.014650344848632812, 0.01603221893310547, 0.017414093017578125, 0.01879596710205078, 0.020177841186523438, 0.021559715270996094, 0.02294158935546875, 0.024323463439941406, 0.025705337524414062, 0.02708721160888672, 0.028469085693359375, 0.02985095977783203, 0.031232833862304688, 0.032614707946777344, 0.03399658203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 11.0, 12.0, 19.0, 17.0, 43.0, 95.0, 208.0, 440.0, 955.0, 2447.0, 8179.0, 45339.0, 908329.0, 3112394.0, 96647.0, 13307.0, 3497.0, 1261.0, 587.0, 246.0, 115.0, 51.0, 31.0, 13.0, 11.0, 4.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06640625, -0.06340980529785156, -0.060413360595703125, -0.05741691589355469, -0.05442047119140625, -0.05142402648925781, -0.048427581787109375, -0.04543113708496094, -0.0424346923828125, -0.03943824768066406, -0.036441802978515625, -0.03344535827636719, -0.03044891357421875, -0.027452468872070312, -0.024456024169921875, -0.021459579467773438, -0.018463134765625, -0.015466690063476562, -0.012470245361328125, -0.009473800659179688, -0.00647735595703125, -0.0034809112548828125, -0.000484466552734375, 0.0025119781494140625, 0.0055084228515625, 0.008504867553710938, 0.011501312255859375, 0.014497756958007812, 0.01749420166015625, 0.020490646362304688, 0.023487091064453125, 0.026483535766601562, 0.02947998046875, 0.03247642517089844, 0.035472869873046875, 0.03846931457519531, 0.04146575927734375, 0.04446220397949219, 0.047458648681640625, 0.05045509338378906, 0.0534515380859375, 0.05644798278808594, 0.059444427490234375, 0.06244087219238281, 0.06543731689453125, 0.06843376159667969, 0.07143020629882812, 0.07442665100097656, 0.077423095703125, 0.08041954040527344, 0.08341598510742188, 0.08641242980957031, 0.08940887451171875, 0.09240531921386719, 0.09540176391601562, 0.09839820861816406, 0.1013946533203125, 0.10439109802246094, 0.10738754272460938, 0.11038398742675781, 0.11338043212890625, 0.11637687683105469, 0.11937332153320312, 0.12236976623535156, 0.1253662109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 9.0, 18.0, 17.0, 48.0, 74.0, 124.0, 293.0, 863.0, 1559.0, 557.0, 254.0, 106.0, 52.0, 31.0, 19.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037200927734375, -0.03567218780517578, -0.03414344787597656, -0.032614707946777344, -0.031085968017578125, -0.029557228088378906, -0.028028488159179688, -0.02649974822998047, -0.02497100830078125, -0.02344226837158203, -0.021913528442382812, -0.020384788513183594, -0.018856048583984375, -0.017327308654785156, -0.015798568725585938, -0.014269828796386719, -0.0127410888671875, -0.011212348937988281, -0.009683609008789062, -0.008154869079589844, -0.006626129150390625, -0.005097389221191406, -0.0035686492919921875, -0.0020399093627929688, -0.00051116943359375, 0.0010175704956054688, 0.0025463104248046875, 0.004075050354003906, 0.005603790283203125, 0.007132530212402344, 0.008661270141601562, 0.010190010070800781, 0.01171875, 0.013247489929199219, 0.014776229858398438, 0.016304969787597656, 0.017833709716796875, 0.019362449645996094, 0.020891189575195312, 0.02241992950439453, 0.02394866943359375, 0.02547740936279297, 0.027006149291992188, 0.028534889221191406, 0.030063629150390625, 0.031592369079589844, 0.03312110900878906, 0.03464984893798828, 0.0361785888671875, 0.03770732879638672, 0.03923606872558594, 0.040764808654785156, 0.042293548583984375, 0.043822288513183594, 0.04535102844238281, 0.04687976837158203, 0.04840850830078125, 0.04993724822998047, 0.05146598815917969, 0.052994728088378906, 0.054523468017578125, 0.056052207946777344, 0.05758094787597656, 0.05910968780517578, 0.060638427734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 7.0, 41.0, 81.0, 183.0, 219.0, 219.0, 130.0, 58.0, 26.0, 14.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.40133681893348694, -0.3900216519832611, -0.3787064552307129, -0.36739128828048706, -0.35607612133026123, -0.344760924577713, -0.3334457576274872, -0.32213056087493896, -0.31081539392471313, -0.2995002269744873, -0.2881850302219391, -0.27686986327171326, -0.26555466651916504, -0.2542394995689392, -0.24292433261871338, -0.23160915076732635, -0.22029396891593933, -0.2089787870645523, -0.19766360521316528, -0.18634843826293945, -0.17503325641155243, -0.1637180745601654, -0.15240290760993958, -0.14108772575855255, -0.12977254390716553, -0.1184573620557785, -0.10714218765497208, -0.09582701325416565, -0.08451183140277863, -0.0731966495513916, -0.061881475150585175, -0.05056630074977875, -0.039251089096069336, -0.02793591096997261, -0.016620732843875885, -0.0053055547177791595, 0.006009623408317566, 0.01732480153441429, 0.028639979660511017, 0.039955154061317444, 0.05127033591270447, 0.06258551776409149, 0.07390069216489792, 0.08521586656570435, 0.09653104841709137, 0.1078462302684784, 0.11916140466928482, 0.13047657907009125, 0.14179176092147827, 0.1531069427728653, 0.16442212462425232, 0.17573729157447815, 0.18705247342586517, 0.1983676552772522, 0.20968282222747803, 0.22099800407886505, 0.23231318593025208, 0.2436283677816391, 0.2549435496330261, 0.26625871658325195, 0.2775738835334778, 0.288889080286026, 0.30020424723625183, 0.31151944398880005, 0.3228346109390259]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 8.0, 4.0, 8.0, 16.0, 14.0, 19.0, 15.0, 26.0, 21.0, 33.0, 34.0, 33.0, 37.0, 26.0, 46.0, 51.0, 51.0, 48.0, 43.0, 50.0, 41.0, 36.0, 40.0, 36.0, 32.0, 32.0, 21.0, 27.0, 21.0, 24.0, 18.0, 19.0, 10.0, 10.0, 8.0, 6.0, 5.0, 2.0, 7.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12369930744171143, -0.11981014907360077, -0.11592099070549011, -0.11203182488679886, -0.1081426665186882, -0.10425350815057755, -0.10036434233188629, -0.09647518396377563, -0.09258602559566498, -0.08869686722755432, -0.08480770885944366, -0.08091854304075241, -0.07702938467264175, -0.0731402263045311, -0.06925106048583984, -0.06536190211772919, -0.06147274374961853, -0.057583585381507874, -0.05369442328810692, -0.04980526119470596, -0.045916102826595306, -0.04202694445848465, -0.038137782365083694, -0.03424862027168274, -0.030359461903572083, -0.026470301672816277, -0.02258114144206047, -0.018691981211304665, -0.014802820980548859, -0.010913660749793053, -0.007024500519037247, -0.0031353402882814407, 0.0007538199424743652, 0.004642980173230171, 0.008532140403985977, 0.012421300634741783, 0.01631046086549759, 0.020199621096253395, 0.0240887813270092, 0.027977941557765007, 0.03186710178852081, 0.03575626015663147, 0.039645422250032425, 0.04353458434343338, 0.04742374271154404, 0.051312901079654694, 0.05520206317305565, 0.059091225266456604, 0.06298038363456726, 0.06686954200267792, 0.07075870037078857, 0.07464786618947983, 0.07853702455759048, 0.08242618292570114, 0.0863153487443924, 0.09020450711250305, 0.09409366548061371, 0.09798282384872437, 0.10187198221683502, 0.10576114803552628, 0.10965030640363693, 0.11353946477174759, 0.11742863059043884, 0.1213177889585495, 0.12520694732666016]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 5.0, 5.0, 18.0, 18.0, 27.0, 43.0, 75.0, 103.0, 174.0, 301.0, 640.0, 1612.0, 5754.0, 32410.0, 258331.0, 603568.0, 123025.0, 16701.0, 3478.0, 1117.0, 504.0, 253.0, 143.0, 80.0, 50.0, 32.0, 26.0, 13.0, 14.0, 7.0, 5.0, 8.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08624267578125, -0.08330154418945312, -0.08036041259765625, -0.07741928100585938, -0.0744781494140625, -0.07153701782226562, -0.06859588623046875, -0.06565475463867188, -0.062713623046875, -0.059772491455078125, -0.05683135986328125, -0.053890228271484375, -0.0509490966796875, -0.048007965087890625, -0.04506683349609375, -0.042125701904296875, -0.0391845703125, -0.036243438720703125, -0.03330230712890625, -0.030361175537109375, -0.0274200439453125, -0.024478912353515625, -0.02153778076171875, -0.018596649169921875, -0.015655517578125, -0.012714385986328125, -0.00977325439453125, -0.006832122802734375, -0.0038909912109375, -0.000949859619140625, 0.00199127197265625, 0.004932403564453125, 0.00787353515625, 0.010814666748046875, 0.01375579833984375, 0.016696929931640625, 0.0196380615234375, 0.022579193115234375, 0.02552032470703125, 0.028461456298828125, 0.031402587890625, 0.034343719482421875, 0.03728485107421875, 0.040225982666015625, 0.0431671142578125, 0.046108245849609375, 0.04904937744140625, 0.051990509033203125, 0.054931640625, 0.057872772216796875, 0.06081390380859375, 0.06375503540039062, 0.0666961669921875, 0.06963729858398438, 0.07257843017578125, 0.07551956176757812, 0.078460693359375, 0.08140182495117188, 0.08434295654296875, 0.08728408813476562, 0.0902252197265625, 0.09316635131835938, 0.09610748291015625, 0.09904861450195312, 0.10198974609375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 7.0, 8.0, 12.0, 16.0, 26.0, 26.0, 54.0, 59.0, 53.0, 72.0, 83.0, 78.0, 89.0, 94.0, 86.0, 61.0, 49.0, 42.0, 20.0, 15.0, 13.0, 14.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.059906005859375, -0.0583648681640625, -0.05682373046875, -0.0552825927734375, -0.053741455078125, -0.0522003173828125, -0.0506591796875, -0.0491180419921875, -0.047576904296875, -0.0460357666015625, -0.04449462890625, -0.0429534912109375, -0.041412353515625, -0.0398712158203125, -0.038330078125, -0.0367889404296875, -0.035247802734375, -0.0337066650390625, -0.03216552734375, -0.0306243896484375, -0.029083251953125, -0.0275421142578125, -0.0260009765625, -0.0244598388671875, -0.022918701171875, -0.0213775634765625, -0.01983642578125, -0.0182952880859375, -0.016754150390625, -0.0152130126953125, -0.013671875, -0.0121307373046875, -0.010589599609375, -0.0090484619140625, -0.00750732421875, -0.0059661865234375, -0.004425048828125, -0.0028839111328125, -0.0013427734375, 0.0001983642578125, 0.001739501953125, 0.0032806396484375, 0.00482177734375, 0.0063629150390625, 0.007904052734375, 0.0094451904296875, 0.010986328125, 0.0125274658203125, 0.014068603515625, 0.0156097412109375, 0.01715087890625, 0.0186920166015625, 0.020233154296875, 0.0217742919921875, 0.0233154296875, 0.0248565673828125, 0.026397705078125, 0.0279388427734375, 0.02947998046875, 0.0310211181640625, 0.032562255859375, 0.0341033935546875, 0.03564453125, 0.0371856689453125, 0.038726806640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 8.0, 7.0, 7.0, 11.0, 10.0, 14.0, 21.0, 42.0, 44.0, 48.0, 72.0, 110.0, 161.0, 211.0, 296.0, 466.0, 748.0, 1520.0, 4377.0, 20057.0, 147958.0, 627142.0, 209192.0, 26582.0, 5214.0, 1702.0, 863.0, 489.0, 331.0, 244.0, 179.0, 100.0, 78.0, 58.0, 54.0, 39.0, 34.0, 12.0, 17.0, 6.0, 7.0, 8.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.065673828125, -0.06345367431640625, -0.0612335205078125, -0.05901336669921875, -0.056793212890625, -0.05457305908203125, -0.0523529052734375, -0.05013275146484375, -0.04791259765625, -0.04569244384765625, -0.0434722900390625, -0.04125213623046875, -0.039031982421875, -0.03681182861328125, -0.0345916748046875, -0.03237152099609375, -0.0301513671875, -0.02793121337890625, -0.0257110595703125, -0.02349090576171875, -0.021270751953125, -0.01905059814453125, -0.0168304443359375, -0.01461029052734375, -0.01239013671875, -0.01016998291015625, -0.0079498291015625, -0.00572967529296875, -0.003509521484375, -0.00128936767578125, 0.0009307861328125, 0.00315093994140625, 0.00537109375, 0.00759124755859375, 0.0098114013671875, 0.01203155517578125, 0.014251708984375, 0.01647186279296875, 0.0186920166015625, 0.02091217041015625, 0.02313232421875, 0.02535247802734375, 0.0275726318359375, 0.02979278564453125, 0.032012939453125, 0.03423309326171875, 0.0364532470703125, 0.03867340087890625, 0.0408935546875, 0.04311370849609375, 0.0453338623046875, 0.04755401611328125, 0.049774169921875, 0.05199432373046875, 0.0542144775390625, 0.05643463134765625, 0.05865478515625, 0.06087493896484375, 0.0630950927734375, 0.06531524658203125, 0.067535400390625, 0.06975555419921875, 0.0719757080078125, 0.07419586181640625, 0.076416015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 4.0, 3.0, 4.0, 6.0, 4.0, 9.0, 10.0, 18.0, 16.0, 25.0, 26.0, 19.0, 35.0, 36.0, 41.0, 43.0, 32.0, 56.0, 34.0, 47.0, 42.0, 39.0, 43.0, 48.0, 48.0, 50.0, 30.0, 41.0, 34.0, 24.0, 24.0, 19.0, 21.0, 15.0, 12.0, 16.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10772705078125, -0.10437583923339844, -0.10102462768554688, -0.09767341613769531, -0.09432220458984375, -0.09097099304199219, -0.08761978149414062, -0.08426856994628906, -0.0809173583984375, -0.07756614685058594, -0.07421493530273438, -0.07086372375488281, -0.06751251220703125, -0.06416130065917969, -0.060810089111328125, -0.05745887756347656, -0.054107666015625, -0.05075645446777344, -0.047405242919921875, -0.04405403137207031, -0.04070281982421875, -0.03735160827636719, -0.034000396728515625, -0.030649185180664062, -0.0272979736328125, -0.023946762084960938, -0.020595550537109375, -0.017244338989257812, -0.01389312744140625, -0.010541915893554688, -0.007190704345703125, -0.0038394927978515625, -0.00048828125, 0.0028629302978515625, 0.006214141845703125, 0.009565353393554688, 0.01291656494140625, 0.016267776489257812, 0.019618988037109375, 0.022970199584960938, 0.0263214111328125, 0.029672622680664062, 0.033023834228515625, 0.03637504577636719, 0.03972625732421875, 0.04307746887207031, 0.046428680419921875, 0.04977989196777344, 0.053131103515625, 0.05648231506347656, 0.059833526611328125, 0.06318473815917969, 0.06653594970703125, 0.06988716125488281, 0.07323837280273438, 0.07658958435058594, 0.0799407958984375, 0.08329200744628906, 0.08664321899414062, 0.08999443054199219, 0.09334564208984375, 0.09669685363769531, 0.10004806518554688, 0.10339927673339844, 0.10675048828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 10.0, 14.0, 23.0, 36.0, 57.0, 114.0, 186.0, 417.0, 894.0, 2479.0, 8576.0, 41097.0, 230183.0, 528870.0, 190830.0, 33898.0, 7117.0, 2128.0, 774.0, 392.0, 172.0, 105.0, 72.0, 35.0, 20.0, 15.0, 8.0, 8.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0274658203125, -0.026386260986328125, -0.02530670166015625, -0.024227142333984375, -0.0231475830078125, -0.022068023681640625, -0.02098846435546875, -0.019908905029296875, -0.018829345703125, -0.017749786376953125, -0.01667022705078125, -0.015590667724609375, -0.0145111083984375, -0.013431549072265625, -0.01235198974609375, -0.011272430419921875, -0.01019287109375, -0.009113311767578125, -0.00803375244140625, -0.006954193115234375, -0.0058746337890625, -0.004795074462890625, -0.00371551513671875, -0.002635955810546875, -0.001556396484375, -0.000476837158203125, 0.00060272216796875, 0.001682281494140625, 0.0027618408203125, 0.003841400146484375, 0.00492095947265625, 0.006000518798828125, 0.007080078125, 0.008159637451171875, 0.00923919677734375, 0.010318756103515625, 0.0113983154296875, 0.012477874755859375, 0.01355743408203125, 0.014636993408203125, 0.015716552734375, 0.016796112060546875, 0.01787567138671875, 0.018955230712890625, 0.0200347900390625, 0.021114349365234375, 0.02219390869140625, 0.023273468017578125, 0.02435302734375, 0.025432586669921875, 0.02651214599609375, 0.027591705322265625, 0.0286712646484375, 0.029750823974609375, 0.03083038330078125, 0.031909942626953125, 0.032989501953125, 0.034069061279296875, 0.03514862060546875, 0.036228179931640625, 0.0373077392578125, 0.038387298583984375, 0.03946685791015625, 0.040546417236328125, 0.0416259765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 9.0, 7.0, 12.0, 17.0, 14.0, 25.0, 37.0, 38.0, 52.0, 68.0, 83.0, 104.0, 114.0, 96.0, 66.0, 64.0, 38.0, 27.0, 28.0, 20.0, 20.0, 13.0, 10.0, 4.0, 10.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.896257400512695e-05, -6.651971489191055e-05, -6.407685577869415e-05, -6.163399666547775e-05, -5.919113755226135e-05, -5.674827843904495e-05, -5.430541932582855e-05, -5.186256021261215e-05, -4.941970109939575e-05, -4.697684198617935e-05, -4.453398287296295e-05, -4.209112375974655e-05, -3.964826464653015e-05, -3.720540553331375e-05, -3.476254642009735e-05, -3.231968730688095e-05, -2.987682819366455e-05, -2.743396908044815e-05, -2.499110996723175e-05, -2.254825085401535e-05, -2.010539174079895e-05, -1.766253262758255e-05, -1.521967351436615e-05, -1.277681440114975e-05, -1.033395528793335e-05, -7.89109617471695e-06, -5.448237061500549e-06, -3.005377948284149e-06, -5.62518835067749e-07, 1.8803402781486511e-06, 4.323199391365051e-06, 6.766058504581451e-06, 9.208917617797852e-06, 1.1651776731014252e-05, 1.4094635844230652e-05, 1.6537494957447052e-05, 1.8980354070663452e-05, 2.1423213183879852e-05, 2.3866072297096252e-05, 2.6308931410312653e-05, 2.8751790523529053e-05, 3.119464963674545e-05, 3.363750874996185e-05, 3.608036786317825e-05, 3.852322697639465e-05, 4.0966086089611053e-05, 4.3408945202827454e-05, 4.5851804316043854e-05, 4.8294663429260254e-05, 5.0737522542476654e-05, 5.3180381655693054e-05, 5.5623240768909454e-05, 5.8066099882125854e-05, 6.0508958995342255e-05, 6.295181810855865e-05, 6.539467722177505e-05, 6.783753633499146e-05, 7.028039544820786e-05, 7.272325456142426e-05, 7.516611367464066e-05, 7.760897278785706e-05, 8.005183190107346e-05, 8.249469101428986e-05, 8.493755012750626e-05, 8.738040924072266e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 7.0, 15.0, 32.0, 46.0, 65.0, 145.0, 180.0, 336.0, 651.0, 1535.0, 4512.0, 22642.0, 191247.0, 622181.0, 176368.0, 21379.0, 4350.0, 1445.0, 607.0, 347.0, 192.0, 100.0, 77.0, 39.0, 16.0, 13.0, 9.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040374755859375, -0.03895711898803711, -0.03753948211669922, -0.03612184524536133, -0.03470420837402344, -0.03328657150268555, -0.031868934631347656, -0.030451297760009766, -0.029033660888671875, -0.027616024017333984, -0.026198387145996094, -0.024780750274658203, -0.023363113403320312, -0.021945476531982422, -0.02052783966064453, -0.01911020278930664, -0.01769256591796875, -0.01627492904663086, -0.014857292175292969, -0.013439655303955078, -0.012022018432617188, -0.010604381561279297, -0.009186744689941406, -0.007769107818603516, -0.006351470947265625, -0.004933834075927734, -0.0035161972045898438, -0.002098560333251953, -0.0006809234619140625, 0.0007367134094238281, 0.0021543502807617188, 0.0035719871520996094, 0.0049896240234375, 0.006407260894775391, 0.007824897766113281, 0.009242534637451172, 0.010660171508789062, 0.012077808380126953, 0.013495445251464844, 0.014913082122802734, 0.016330718994140625, 0.017748355865478516, 0.019165992736816406, 0.020583629608154297, 0.022001266479492188, 0.023418903350830078, 0.02483654022216797, 0.02625417709350586, 0.02767181396484375, 0.02908945083618164, 0.03050708770751953, 0.03192472457885742, 0.03334236145019531, 0.0347599983215332, 0.036177635192871094, 0.037595272064208984, 0.039012908935546875, 0.040430545806884766, 0.041848182678222656, 0.04326581954956055, 0.04468345642089844, 0.04610109329223633, 0.04751873016357422, 0.04893636703491211, 0.05035400390625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 10.0, 17.0, 9.0, 36.0, 30.0, 34.0, 47.0, 57.0, 77.0, 91.0, 77.0, 99.0, 94.0, 73.0, 52.0, 37.0, 43.0, 30.0, 27.0, 20.0, 7.0, 9.0, 5.0, 3.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044464111328125, -0.0432887077331543, -0.042113304138183594, -0.04093790054321289, -0.03976249694824219, -0.038587093353271484, -0.03741168975830078, -0.03623628616333008, -0.035060882568359375, -0.03388547897338867, -0.03271007537841797, -0.031534671783447266, -0.030359268188476562, -0.02918386459350586, -0.028008460998535156, -0.026833057403564453, -0.02565765380859375, -0.024482250213623047, -0.023306846618652344, -0.02213144302368164, -0.020956039428710938, -0.019780635833740234, -0.01860523223876953, -0.017429828643798828, -0.016254425048828125, -0.015079021453857422, -0.013903617858886719, -0.012728214263916016, -0.011552810668945312, -0.01037740707397461, -0.009202003479003906, -0.008026599884033203, -0.0068511962890625, -0.005675792694091797, -0.004500389099121094, -0.0033249855041503906, -0.0021495819091796875, -0.0009741783142089844, 0.00020122528076171875, 0.0013766288757324219, 0.002552032470703125, 0.003727436065673828, 0.004902839660644531, 0.006078243255615234, 0.0072536468505859375, 0.00842905044555664, 0.009604454040527344, 0.010779857635498047, 0.01195526123046875, 0.013130664825439453, 0.014306068420410156, 0.01548147201538086, 0.016656875610351562, 0.017832279205322266, 0.01900768280029297, 0.020183086395263672, 0.021358489990234375, 0.022533893585205078, 0.02370929718017578, 0.024884700775146484, 0.026060104370117188, 0.02723550796508789, 0.028410911560058594, 0.029586315155029297, 0.03076171875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 14.0, 38.0, 138.0, 291.0, 302.0, 122.0, 49.0, 25.0, 9.0, 5.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8143242001533508, -0.7802634239196777, -0.7462027072906494, -0.7121419906616211, -0.678081214427948, -0.6440204381942749, -0.6099597215652466, -0.5758990049362183, -0.5418382287025452, -0.5077774524688721, -0.47371673583984375, -0.43965598940849304, -0.40559524297714233, -0.3715344965457916, -0.3374737501144409, -0.3034130036830902, -0.2693522572517395, -0.2352915108203888, -0.20123076438903809, -0.16717001795768738, -0.13310927152633667, -0.09904852509498596, -0.06498777866363525, -0.030927032232284546, 0.003133714199066162, 0.03719446063041687, 0.07125520706176758, 0.10531595349311829, 0.139376699924469, 0.1734374463558197, 0.2074981927871704, 0.24155893921852112, 0.2756197452545166, 0.3096804916858673, 0.343741238117218, 0.3778019845485687, 0.41186273097991943, 0.44592347741127014, 0.47998422384262085, 0.514045000076294, 0.5481057167053223, 0.5821664333343506, 0.6162272095680237, 0.6502879858016968, 0.6843487024307251, 0.7184094190597534, 0.7524701952934265, 0.7865309715270996, 0.8205916881561279, 0.8546524047851562, 0.8887131810188293, 0.9227739572525024, 0.9568346738815308, 0.9908953905105591, 1.024956226348877, 1.0590169429779053, 1.0930776596069336, 1.127138376235962, 1.1611990928649902, 1.195259928703308, 1.2293206453323364, 1.2633813619613647, 1.2974421977996826, 1.331502914428711, 1.3655636310577393]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 6.0, 5.0, 8.0, 11.0, 13.0, 15.0, 21.0, 24.0, 21.0, 26.0, 33.0, 32.0, 45.0, 54.0, 51.0, 57.0, 41.0, 52.0, 41.0, 42.0, 47.0, 44.0, 43.0, 39.0, 42.0, 25.0, 26.0, 26.0, 14.0, 26.0, 11.0, 11.0, 11.0, 9.0, 8.0, 6.0, 6.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6166394352912903, -0.59991055727005, -0.583181619644165, -0.5664527416229248, -0.5497238636016846, -0.5329949855804443, -0.5162660479545593, -0.4995371699333191, -0.48280829191207886, -0.46607938408851624, -0.449350506067276, -0.4326215982437134, -0.41589272022247314, -0.3991638123989105, -0.3824349045753479, -0.36570602655410767, -0.34897711873054504, -0.3322482109069824, -0.3155193328857422, -0.29879042506217957, -0.28206154704093933, -0.2653326392173767, -0.24860374629497528, -0.23187485337257385, -0.21514596045017242, -0.198417067527771, -0.18168817460536957, -0.16495928168296814, -0.14823037385940552, -0.13150149583816528, -0.11477258801460266, -0.09804369509220123, -0.0813148021697998, -0.06458590924739838, -0.04785701259970665, -0.031128115952014923, -0.014399223029613495, 0.0023296698927879333, 0.01905857026576996, 0.03578746318817139, 0.052516356110572815, 0.06924524903297424, 0.08597414195537567, 0.1027030423283577, 0.11943193525075912, 0.13616082072257996, 0.15288972854614258, 0.169618621468544, 0.18634751439094543, 0.20307640731334686, 0.2198053002357483, 0.2365342080593109, 0.25326308608055115, 0.26999199390411377, 0.286720871925354, 0.3034497797489166, 0.32017868757247925, 0.33690759539604187, 0.3536364734172821, 0.3703653812408447, 0.38709425926208496, 0.4038231670856476, 0.4205520749092102, 0.43728095293045044, 0.4540098309516907]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 9.0, 5.0, 18.0, 25.0, 51.0, 78.0, 136.0, 325.0, 715.0, 1910.0, 9535.0, 173421.0, 3977207.0, 25557.0, 3474.0, 972.0, 387.0, 206.0, 113.0, 51.0, 34.0, 17.0, 11.0, 3.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12286376953125, -0.11879825592041016, -0.11473274230957031, -0.11066722869873047, -0.10660171508789062, -0.10253620147705078, -0.09847068786621094, -0.0944051742553711, -0.09033966064453125, -0.0862741470336914, -0.08220863342285156, -0.07814311981201172, -0.07407760620117188, -0.07001209259033203, -0.06594657897949219, -0.061881065368652344, -0.0578155517578125, -0.053750038146972656, -0.04968452453613281, -0.04561901092529297, -0.041553497314453125, -0.03748798370361328, -0.03342247009277344, -0.029356956481933594, -0.02529144287109375, -0.021225929260253906, -0.017160415649414062, -0.013094902038574219, -0.009029388427734375, -0.004963874816894531, -0.0008983612060546875, 0.0031671524047851562, 0.007232666015625, 0.011298179626464844, 0.015363693237304688, 0.01942920684814453, 0.023494720458984375, 0.02756023406982422, 0.03162574768066406, 0.035691261291503906, 0.03975677490234375, 0.043822288513183594, 0.04788780212402344, 0.05195331573486328, 0.056018829345703125, 0.06008434295654297, 0.06414985656738281, 0.06821537017822266, 0.0722808837890625, 0.07634639739990234, 0.08041191101074219, 0.08447742462158203, 0.08854293823242188, 0.09260845184326172, 0.09667396545410156, 0.1007394790649414, 0.10480499267578125, 0.1088705062866211, 0.11293601989746094, 0.11700153350830078, 0.12106704711914062, 0.12513256072998047, 0.1291980743408203, 0.13326358795166016, 0.1373291015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 8.0, 11.0, 12.0, 17.0, 32.0, 49.0, 71.0, 81.0, 74.0, 105.0, 113.0, 94.0, 98.0, 76.0, 58.0, 42.0, 26.0, 13.0, 8.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.084716796875, -0.08275890350341797, -0.08080101013183594, -0.0788431167602539, -0.07688522338867188, -0.07492733001708984, -0.07296943664550781, -0.07101154327392578, -0.06905364990234375, -0.06709575653076172, -0.06513786315917969, -0.06317996978759766, -0.061222076416015625, -0.059264183044433594, -0.05730628967285156, -0.05534839630126953, -0.0533905029296875, -0.05143260955810547, -0.04947471618652344, -0.047516822814941406, -0.045558929443359375, -0.043601036071777344, -0.04164314270019531, -0.03968524932861328, -0.03772735595703125, -0.03576946258544922, -0.03381156921386719, -0.031853675842285156, -0.029895782470703125, -0.027937889099121094, -0.025979995727539062, -0.02402210235595703, -0.022064208984375, -0.02010631561279297, -0.018148422241210938, -0.016190528869628906, -0.014232635498046875, -0.012274742126464844, -0.010316848754882812, -0.008358955383300781, -0.00640106201171875, -0.004443168640136719, -0.0024852752685546875, -0.0005273818969726562, 0.001430511474609375, 0.0033884048461914062, 0.0053462982177734375, 0.007304191589355469, 0.0092620849609375, 0.011219978332519531, 0.013177871704101562, 0.015135765075683594, 0.017093658447265625, 0.019051551818847656, 0.021009445190429688, 0.02296733856201172, 0.02492523193359375, 0.02688312530517578, 0.028841018676757812, 0.030798912048339844, 0.032756805419921875, 0.034714698791503906, 0.03667259216308594, 0.03863048553466797, 0.04058837890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 7.0, 9.0, 10.0, 22.0, 23.0, 25.0, 25.0, 33.0, 47.0, 69.0, 92.0, 147.0, 234.0, 434.0, 969.0, 3451.0, 26234.0, 3608075.0, 532936.0, 16788.0, 2805.0, 838.0, 371.0, 190.0, 107.0, 81.0, 52.0, 47.0, 36.0, 21.0, 17.0, 16.0, 17.0, 11.0, 11.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1265869140625, -0.12261962890625, -0.11865234375, -0.11468505859375, -0.1107177734375, -0.10675048828125, -0.102783203125, -0.09881591796875, -0.0948486328125, -0.09088134765625, -0.0869140625, -0.08294677734375, -0.0789794921875, -0.07501220703125, -0.071044921875, -0.06707763671875, -0.0631103515625, -0.05914306640625, -0.05517578125, -0.05120849609375, -0.0472412109375, -0.04327392578125, -0.039306640625, -0.03533935546875, -0.0313720703125, -0.02740478515625, -0.0234375, -0.01947021484375, -0.0155029296875, -0.01153564453125, -0.007568359375, -0.00360107421875, 0.0003662109375, 0.00433349609375, 0.00830078125, 0.01226806640625, 0.0162353515625, 0.02020263671875, 0.024169921875, 0.02813720703125, 0.0321044921875, 0.03607177734375, 0.0400390625, 0.04400634765625, 0.0479736328125, 0.05194091796875, 0.055908203125, 0.05987548828125, 0.0638427734375, 0.06781005859375, 0.07177734375, 0.07574462890625, 0.0797119140625, 0.08367919921875, 0.087646484375, 0.09161376953125, 0.0955810546875, 0.09954833984375, 0.103515625, 0.10748291015625, 0.1114501953125, 0.11541748046875, 0.119384765625, 0.12335205078125, 0.1273193359375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 14.0, 21.0, 100.0, 705.0, 3014.0, 157.0, 45.0, 12.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.0643301010131836, -0.06304740905761719, -0.06176471710205078, -0.060482025146484375, -0.05919933319091797, -0.05791664123535156, -0.056633949279785156, -0.05535125732421875, -0.054068565368652344, -0.05278587341308594, -0.05150318145751953, -0.050220489501953125, -0.04893779754638672, -0.04765510559082031, -0.046372413635253906, -0.0450897216796875, -0.043807029724121094, -0.04252433776855469, -0.04124164581298828, -0.039958953857421875, -0.03867626190185547, -0.03739356994628906, -0.036110877990722656, -0.03482818603515625, -0.033545494079589844, -0.03226280212402344, -0.03098011016845703, -0.029697418212890625, -0.02841472625732422, -0.027132034301757812, -0.025849342346191406, -0.024566650390625, -0.023283958435058594, -0.022001266479492188, -0.02071857452392578, -0.019435882568359375, -0.01815319061279297, -0.016870498657226562, -0.015587806701660156, -0.01430511474609375, -0.013022422790527344, -0.011739730834960938, -0.010457038879394531, -0.009174346923828125, -0.007891654968261719, -0.0066089630126953125, -0.005326271057128906, -0.0040435791015625, -0.0027608871459960938, -0.0014781951904296875, -0.00019550323486328125, 0.001087188720703125, 0.0023698806762695312, 0.0036525726318359375, 0.004935264587402344, 0.00621795654296875, 0.007500648498535156, 0.008783340454101562, 0.010066032409667969, 0.011348724365234375, 0.012631416320800781, 0.013914108276367188, 0.015196800231933594, 0.0164794921875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 11.0, 10.0, 33.0, 37.0, 73.0, 120.0, 172.0, 175.0, 134.0, 106.0, 50.0, 40.0, 17.0, 11.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.13901358842849731, -0.1359356939792633, -0.1328577995300293, -0.1297798901796341, -0.12670199573040009, -0.12362410128116608, -0.12054620683193207, -0.11746831238269806, -0.11439041048288345, -0.11131251603364944, -0.10823461413383484, -0.10515671968460083, -0.10207882523536682, -0.09900092333555222, -0.0959230288863182, -0.0928451269865036, -0.08976723253726959, -0.08668933808803558, -0.08361143618822098, -0.08053354173898697, -0.07745563983917236, -0.07437774538993835, -0.07129985094070435, -0.06822195649147034, -0.06514405459165573, -0.062066156417131424, -0.05898825824260712, -0.05591036379337311, -0.0528324656188488, -0.04975456744432449, -0.046676672995090485, -0.04359877482056618, -0.04052086919546127, -0.037442971020936966, -0.03436507284641266, -0.03128717839717865, -0.028209280222654343, -0.025131382048130035, -0.022053485736250877, -0.01897558942437172, -0.015897691249847412, -0.01281979400664568, -0.009741896763443947, -0.006663999520242214, -0.0035861022770404816, -0.0005082050338387489, 0.0025696922093629837, 0.005647588521242142, 0.008725486695766449, 0.011803383938968182, 0.014881281182169914, 0.017959177494049072, 0.02103707566857338, 0.024114973843097687, 0.027192870154976845, 0.030270766466856003, 0.03334866464138031, 0.03642656281590462, 0.039504460990428925, 0.04258235543966293, 0.04566025361418724, 0.04873815178871155, 0.05181604623794556, 0.054893944412469864, 0.05797184258699417]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 4.0, 10.0, 14.0, 11.0, 17.0, 13.0, 25.0, 30.0, 21.0, 36.0, 41.0, 32.0, 39.0, 39.0, 51.0, 42.0, 73.0, 50.0, 36.0, 31.0, 34.0, 43.0, 36.0, 39.0, 29.0, 29.0, 31.0, 22.0, 19.0, 20.0, 11.0, 10.0, 8.0, 14.0, 12.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04391604661941528, -0.04255952313542366, -0.04120299965143204, -0.039846476167440414, -0.03848995268344879, -0.03713342919945717, -0.035776905715465546, -0.03442038223147392, -0.0330638587474823, -0.03170733526349068, -0.030350811779499054, -0.02899428829550743, -0.027637764811515808, -0.026281241327524185, -0.024924717843532562, -0.02356819435954094, -0.022211670875549316, -0.020855147391557693, -0.01949862390756607, -0.018142100423574448, -0.016785576939582825, -0.015429053455591202, -0.014072529971599579, -0.012716006487607956, -0.011359483003616333, -0.01000295951962471, -0.008646436035633087, -0.007289912551641464, -0.005933389067649841, -0.004576865583658218, -0.0032203420996665955, -0.0018638186156749725, -0.0005072951316833496, 0.0008492283523082733, 0.0022057518362998962, 0.003562275320291519, 0.004918798804283142, 0.006275322288274765, 0.007631845772266388, 0.00898836925625801, 0.010344892740249634, 0.011701416224241257, 0.01305793970823288, 0.014414463192224503, 0.015770986676216125, 0.01712751016020775, 0.01848403364419937, 0.019840557128190994, 0.021197080612182617, 0.02255360409617424, 0.023910127580165863, 0.025266651064157486, 0.02662317454814911, 0.027979698032140732, 0.029336221516132355, 0.030692745000123978, 0.0320492684841156, 0.033405791968107224, 0.034762315452098846, 0.03611883893609047, 0.03747536242008209, 0.038831885904073715, 0.04018840938806534, 0.04154493287205696, 0.042901456356048584]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 10.0, 13.0, 15.0, 19.0, 25.0, 47.0, 64.0, 97.0, 201.0, 364.0, 944.0, 3260.0, 17765.0, 120582.0, 524084.0, 320621.0, 49543.0, 7855.0, 1785.0, 597.0, 281.0, 150.0, 78.0, 49.0, 43.0, 16.0, 22.0, 9.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.09405517578125, -0.09156513214111328, -0.08907508850097656, -0.08658504486083984, -0.08409500122070312, -0.0816049575805664, -0.07911491394042969, -0.07662487030029297, -0.07413482666015625, -0.07164478302001953, -0.06915473937988281, -0.0666646957397461, -0.06417465209960938, -0.061684608459472656, -0.05919456481933594, -0.05670452117919922, -0.0542144775390625, -0.05172443389892578, -0.04923439025878906, -0.046744346618652344, -0.044254302978515625, -0.041764259338378906, -0.03927421569824219, -0.03678417205810547, -0.03429412841796875, -0.03180408477783203, -0.029314041137695312, -0.026823997497558594, -0.024333953857421875, -0.021843910217285156, -0.019353866577148438, -0.01686382293701172, -0.014373779296875, -0.011883735656738281, -0.009393692016601562, -0.006903648376464844, -0.004413604736328125, -0.0019235610961914062, 0.0005664825439453125, 0.0030565261840820312, 0.00554656982421875, 0.008036613464355469, 0.010526657104492188, 0.013016700744628906, 0.015506744384765625, 0.017996788024902344, 0.020486831665039062, 0.02297687530517578, 0.0254669189453125, 0.02795696258544922, 0.030447006225585938, 0.032937049865722656, 0.035427093505859375, 0.037917137145996094, 0.04040718078613281, 0.04289722442626953, 0.04538726806640625, 0.04787731170654297, 0.05036735534667969, 0.052857398986816406, 0.055347442626953125, 0.057837486267089844, 0.06032752990722656, 0.06281757354736328, 0.0653076171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 11.0, 13.0, 18.0, 27.0, 37.0, 37.0, 69.0, 72.0, 73.0, 83.0, 80.0, 83.0, 95.0, 73.0, 64.0, 52.0, 29.0, 24.0, 26.0, 9.0, 9.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0667724609375, -0.06508064270019531, -0.06338882446289062, -0.06169700622558594, -0.06000518798828125, -0.05831336975097656, -0.056621551513671875, -0.05492973327636719, -0.0532379150390625, -0.05154609680175781, -0.049854278564453125, -0.04816246032714844, -0.04647064208984375, -0.04477882385253906, -0.043087005615234375, -0.04139518737792969, -0.039703369140625, -0.03801155090332031, -0.036319732666015625, -0.03462791442871094, -0.03293609619140625, -0.031244277954101562, -0.029552459716796875, -0.027860641479492188, -0.0261688232421875, -0.024477005004882812, -0.022785186767578125, -0.021093368530273438, -0.01940155029296875, -0.017709732055664062, -0.016017913818359375, -0.014326095581054688, -0.01263427734375, -0.010942459106445312, -0.009250640869140625, -0.0075588226318359375, -0.00586700439453125, -0.0041751861572265625, -0.002483367919921875, -0.0007915496826171875, 0.0009002685546875, 0.0025920867919921875, 0.004283905029296875, 0.0059757232666015625, 0.00766754150390625, 0.009359359741210938, 0.011051177978515625, 0.012742996215820312, 0.014434814453125, 0.016126632690429688, 0.017818450927734375, 0.019510269165039062, 0.02120208740234375, 0.022893905639648438, 0.024585723876953125, 0.026277542114257812, 0.0279693603515625, 0.029661178588867188, 0.031352996826171875, 0.03304481506347656, 0.03473663330078125, 0.03642845153808594, 0.038120269775390625, 0.03981208801269531, 0.04150390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 6.0, 13.0, 29.0, 22.0, 31.0, 50.0, 53.0, 91.0, 137.0, 159.0, 233.0, 332.0, 524.0, 862.0, 1543.0, 3919.0, 15222.0, 89513.0, 488998.0, 369731.0, 59769.0, 10777.0, 3051.0, 1288.0, 717.0, 425.0, 272.0, 205.0, 146.0, 118.0, 69.0, 60.0, 36.0, 36.0, 24.0, 26.0, 16.0, 13.0, 9.0, 6.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0623779296875, -0.06048154830932617, -0.058585166931152344, -0.056688785552978516, -0.05479240417480469, -0.05289602279663086, -0.05099964141845703, -0.0491032600402832, -0.047206878662109375, -0.04531049728393555, -0.04341411590576172, -0.04151773452758789, -0.03962135314941406, -0.037724971771240234, -0.035828590393066406, -0.03393220901489258, -0.03203582763671875, -0.030139446258544922, -0.028243064880371094, -0.026346683502197266, -0.024450302124023438, -0.02255392074584961, -0.02065753936767578, -0.018761157989501953, -0.016864776611328125, -0.014968395233154297, -0.013072013854980469, -0.01117563247680664, -0.009279251098632812, -0.007382869720458984, -0.005486488342285156, -0.003590106964111328, -0.0016937255859375, 0.00020265579223632812, 0.0020990371704101562, 0.003995418548583984, 0.0058917999267578125, 0.007788181304931641, 0.009684562683105469, 0.011580944061279297, 0.013477325439453125, 0.015373706817626953, 0.01727008819580078, 0.01916646957397461, 0.021062850952148438, 0.022959232330322266, 0.024855613708496094, 0.026751995086669922, 0.02864837646484375, 0.030544757843017578, 0.032441139221191406, 0.034337520599365234, 0.03623390197753906, 0.03813028335571289, 0.04002666473388672, 0.04192304611206055, 0.043819427490234375, 0.0457158088684082, 0.04761219024658203, 0.04950857162475586, 0.05140495300292969, 0.053301334381103516, 0.055197715759277344, 0.05709409713745117, 0.058990478515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 6.0, 7.0, 7.0, 6.0, 12.0, 16.0, 15.0, 23.0, 21.0, 29.0, 23.0, 15.0, 28.0, 33.0, 36.0, 42.0, 40.0, 47.0, 34.0, 41.0, 39.0, 39.0, 46.0, 42.0, 36.0, 41.0, 36.0, 48.0, 21.0, 32.0, 15.0, 20.0, 15.0, 17.0, 14.0, 12.0, 10.0, 7.0, 13.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09477806091308594, -0.09159469604492188, -0.08841133117675781, -0.08522796630859375, -0.08204460144042969, -0.07886123657226562, -0.07567787170410156, -0.0724945068359375, -0.06931114196777344, -0.06612777709960938, -0.06294441223144531, -0.05976104736328125, -0.05657768249511719, -0.053394317626953125, -0.05021095275878906, -0.047027587890625, -0.04384422302246094, -0.040660858154296875, -0.03747749328613281, -0.03429412841796875, -0.031110763549804688, -0.027927398681640625, -0.024744033813476562, -0.0215606689453125, -0.018377304077148438, -0.015193939208984375, -0.012010574340820312, -0.00882720947265625, -0.0056438446044921875, -0.002460479736328125, 0.0007228851318359375, 0.00390625, 0.0070896148681640625, 0.010272979736328125, 0.013456344604492188, 0.01663970947265625, 0.019823074340820312, 0.023006439208984375, 0.026189804077148438, 0.0293731689453125, 0.03255653381347656, 0.035739898681640625, 0.03892326354980469, 0.04210662841796875, 0.04528999328613281, 0.048473358154296875, 0.05165672302246094, 0.054840087890625, 0.05802345275878906, 0.061206817626953125, 0.06439018249511719, 0.06757354736328125, 0.07075691223144531, 0.07394027709960938, 0.07712364196777344, 0.0803070068359375, 0.08349037170410156, 0.08667373657226562, 0.08985710144042969, 0.09304046630859375, 0.09622383117675781, 0.09940719604492188, 0.10259056091308594, 0.10577392578125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 5.0, 10.0, 16.0, 20.0, 30.0, 42.0, 73.0, 102.0, 200.0, 298.0, 601.0, 1253.0, 3117.0, 9765.0, 41605.0, 202710.0, 510617.0, 216896.0, 44803.0, 10450.0, 3189.0, 1290.0, 626.0, 308.0, 180.0, 125.0, 68.0, 43.0, 27.0, 22.0, 13.0, 7.0, 9.0, 7.0, 4.0, 2.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.031768798828125, -0.030944108963012695, -0.03011941909790039, -0.029294729232788086, -0.02847003936767578, -0.027645349502563477, -0.026820659637451172, -0.025995969772338867, -0.025171279907226562, -0.024346590042114258, -0.023521900177001953, -0.02269721031188965, -0.021872520446777344, -0.02104783058166504, -0.020223140716552734, -0.01939845085144043, -0.018573760986328125, -0.01774907112121582, -0.016924381256103516, -0.01609969139099121, -0.015275001525878906, -0.014450311660766602, -0.013625621795654297, -0.012800931930541992, -0.011976242065429688, -0.011151552200317383, -0.010326862335205078, -0.009502172470092773, -0.008677482604980469, -0.007852792739868164, -0.007028102874755859, -0.006203413009643555, -0.00537872314453125, -0.004554033279418945, -0.0037293434143066406, -0.002904653549194336, -0.0020799636840820312, -0.0012552738189697266, -0.0004305839538574219, 0.0003941059112548828, 0.0012187957763671875, 0.002043485641479492, 0.002868175506591797, 0.0036928653717041016, 0.004517555236816406, 0.005342245101928711, 0.006166934967041016, 0.00699162483215332, 0.007816314697265625, 0.00864100456237793, 0.009465694427490234, 0.010290384292602539, 0.011115074157714844, 0.011939764022827148, 0.012764453887939453, 0.013589143753051758, 0.014413833618164062, 0.015238523483276367, 0.016063213348388672, 0.016887903213500977, 0.01771259307861328, 0.018537282943725586, 0.01936197280883789, 0.020186662673950195, 0.0210113525390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 1.0, 5.0, 6.0, 9.0, 16.0, 20.0, 20.0, 25.0, 28.0, 31.0, 49.0, 39.0, 38.0, 54.0, 52.0, 57.0, 65.0, 71.0, 56.0, 59.0, 45.0, 43.0, 27.0, 31.0, 23.0, 20.0, 15.0, 16.0, 12.0, 12.0, 12.0, 6.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.696846008300781e-05, -4.5525841414928436e-05, -4.408322274684906e-05, -4.2640604078769684e-05, -4.119798541069031e-05, -3.975536674261093e-05, -3.8312748074531555e-05, -3.687012940645218e-05, -3.54275107383728e-05, -3.3984892070293427e-05, -3.254227340221405e-05, -3.1099654734134674e-05, -2.9657036066055298e-05, -2.821441739797592e-05, -2.6771798729896545e-05, -2.532918006181717e-05, -2.3886561393737793e-05, -2.2443942725658417e-05, -2.100132405757904e-05, -1.9558705389499664e-05, -1.8116086721420288e-05, -1.6673468053340912e-05, -1.5230849385261536e-05, -1.378823071718216e-05, -1.2345612049102783e-05, -1.0902993381023407e-05, -9.46037471294403e-06, -8.017756044864655e-06, -6.575137376785278e-06, -5.132518708705902e-06, -3.689900040626526e-06, -2.2472813725471497e-06, -8.046627044677734e-07, 6.379559636116028e-07, 2.080574631690979e-06, 3.5231932997703552e-06, 4.9658119678497314e-06, 6.408430635929108e-06, 7.851049304008484e-06, 9.29366797208786e-06, 1.0736286640167236e-05, 1.2178905308246613e-05, 1.3621523976325989e-05, 1.5064142644405365e-05, 1.650676131248474e-05, 1.7949379980564117e-05, 1.9391998648643494e-05, 2.083461731672287e-05, 2.2277235984802246e-05, 2.3719854652881622e-05, 2.5162473320961e-05, 2.6605091989040375e-05, 2.804771065711975e-05, 2.9490329325199127e-05, 3.0932947993278503e-05, 3.237556666135788e-05, 3.3818185329437256e-05, 3.526080399751663e-05, 3.670342266559601e-05, 3.8146041333675385e-05, 3.958866000175476e-05, 4.103127866983414e-05, 4.247389733791351e-05, 4.391651600599289e-05, 4.5359134674072266e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 7.0, 4.0, 10.0, 10.0, 13.0, 35.0, 29.0, 58.0, 60.0, 136.0, 187.0, 354.0, 558.0, 1096.0, 2422.0, 6714.0, 28137.0, 150367.0, 497386.0, 285329.0, 56967.0, 11753.0, 3515.0, 1562.0, 758.0, 391.0, 244.0, 170.0, 88.0, 46.0, 44.0, 24.0, 19.0, 20.0, 13.0, 7.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.032318115234375, -0.0313870906829834, -0.030456066131591797, -0.029525041580200195, -0.028594017028808594, -0.027662992477416992, -0.02673196792602539, -0.02580094337463379, -0.024869918823242188, -0.023938894271850586, -0.023007869720458984, -0.022076845169067383, -0.02114582061767578, -0.02021479606628418, -0.019283771514892578, -0.018352746963500977, -0.017421722412109375, -0.016490697860717773, -0.015559673309326172, -0.01462864875793457, -0.013697624206542969, -0.012766599655151367, -0.011835575103759766, -0.010904550552368164, -0.009973526000976562, -0.009042501449584961, -0.00811147689819336, -0.007180452346801758, -0.006249427795410156, -0.005318403244018555, -0.004387378692626953, -0.0034563541412353516, -0.00252532958984375, -0.0015943050384521484, -0.0006632804870605469, 0.0002677440643310547, 0.0011987686157226562, 0.002129793167114258, 0.0030608177185058594, 0.003991842269897461, 0.0049228668212890625, 0.005853891372680664, 0.006784915924072266, 0.007715940475463867, 0.008646965026855469, 0.00957798957824707, 0.010509014129638672, 0.011440038681030273, 0.012371063232421875, 0.013302087783813477, 0.014233112335205078, 0.01516413688659668, 0.01609516143798828, 0.017026185989379883, 0.017957210540771484, 0.018888235092163086, 0.019819259643554688, 0.02075028419494629, 0.02168130874633789, 0.022612333297729492, 0.023543357849121094, 0.024474382400512695, 0.025405406951904297, 0.0263364315032959, 0.0272674560546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 4.0, 12.0, 23.0, 27.0, 30.0, 49.0, 45.0, 62.0, 53.0, 85.0, 83.0, 70.0, 77.0, 55.0, 73.0, 71.0, 42.0, 34.0, 27.0, 23.0, 13.0, 12.0, 6.0, 2.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0291748046875, -0.028139591217041016, -0.02710437774658203, -0.026069164276123047, -0.025033950805664062, -0.023998737335205078, -0.022963523864746094, -0.02192831039428711, -0.020893096923828125, -0.01985788345336914, -0.018822669982910156, -0.017787456512451172, -0.016752243041992188, -0.015717029571533203, -0.014681816101074219, -0.013646602630615234, -0.01261138916015625, -0.011576175689697266, -0.010540962219238281, -0.009505748748779297, -0.008470535278320312, -0.007435321807861328, -0.006400108337402344, -0.005364894866943359, -0.004329681396484375, -0.0032944679260253906, -0.0022592544555664062, -0.0012240409851074219, -0.0001888275146484375, 0.0008463859558105469, 0.0018815994262695312, 0.0029168128967285156, 0.0039520263671875, 0.004987239837646484, 0.006022453308105469, 0.007057666778564453, 0.008092880249023438, 0.009128093719482422, 0.010163307189941406, 0.01119852066040039, 0.012233734130859375, 0.01326894760131836, 0.014304161071777344, 0.015339374542236328, 0.016374588012695312, 0.017409801483154297, 0.01844501495361328, 0.019480228424072266, 0.02051544189453125, 0.021550655364990234, 0.02258586883544922, 0.023621082305908203, 0.024656295776367188, 0.025691509246826172, 0.026726722717285156, 0.02776193618774414, 0.028797149658203125, 0.02983236312866211, 0.030867576599121094, 0.03190279006958008, 0.03293800354003906, 0.03397321701049805, 0.03500843048095703, 0.036043643951416016, 0.037078857421875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 19.0, 45.0, 99.0, 209.0, 249.0, 196.0, 108.0, 45.0, 16.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49815264344215393, -0.46979671716690063, -0.44144079089164734, -0.41308486461639404, -0.38472890853881836, -0.35637298226356506, -0.32801705598831177, -0.2996610999107361, -0.2713052034378052, -0.24294927716255188, -0.2145933359861374, -0.1862374097108841, -0.1578814685344696, -0.1295255422592163, -0.10116961598396301, -0.07281367480754852, -0.04445773363113403, -0.01610180176794529, 0.012254130095243454, 0.04061006009578705, 0.06896599382162094, 0.09732192754745483, 0.12567785382270813, 0.15403379499912262, 0.18238972127437592, 0.2107456475496292, 0.2391015887260437, 0.267457515001297, 0.2958134412765503, 0.324169397354126, 0.3525252938270569, 0.38088124990463257, 0.40923720598220825, 0.43759313225746155, 0.46594905853271484, 0.4943050146102905, 0.5226609110832214, 0.5510168671607971, 0.579372763633728, 0.6077287197113037, 0.6360846757888794, 0.6644406318664551, 0.692796528339386, 0.7211524844169617, 0.7495083808898926, 0.7778643369674683, 0.806220293045044, 0.8345761895179749, 0.8629320859909058, 0.8912880420684814, 0.9196439385414124, 0.947999894618988, 0.976355791091919, 1.0047117471694946, 1.0330677032470703, 1.061423659324646, 1.0897796154022217, 1.1181355714797974, 1.146491527557373, 1.1748473644256592, 1.2032033205032349, 1.2315592765808105, 1.2599152326583862, 1.288271188735962, 1.316627025604248]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 9.0, 6.0, 15.0, 17.0, 21.0, 17.0, 29.0, 21.0, 40.0, 26.0, 35.0, 47.0, 50.0, 51.0, 44.0, 58.0, 53.0, 57.0, 47.0, 53.0, 37.0, 36.0, 32.0, 40.0, 29.0, 16.0, 19.0, 16.0, 11.0, 11.0, 8.0, 12.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5884151458740234, -0.5706067681312561, -0.552798330783844, -0.5349899530410767, -0.5171815156936646, -0.4993731379508972, -0.4815647304058075, -0.4637563228607178, -0.44594791531562805, -0.42813950777053833, -0.4103311002254486, -0.3925226926803589, -0.37471431493759155, -0.35690587759017944, -0.3390974998474121, -0.3212890923023224, -0.30348068475723267, -0.28567227721214294, -0.2678638696670532, -0.2500554621219635, -0.23224706947803497, -0.21443866193294525, -0.19663026928901672, -0.178821861743927, -0.16101345419883728, -0.14320504665374756, -0.12539663910865784, -0.10758824646472931, -0.08977983891963959, -0.07197143137454987, -0.05416303128004074, -0.036354631185531616, -0.01854628324508667, -0.0007378794252872467, 0.017070524394512177, 0.0348789282143116, 0.05268733203411102, 0.07049573957920074, 0.08830413967370987, 0.106112539768219, 0.12392094731330872, 0.14172935485839844, 0.15953776240348816, 0.1773461550474167, 0.1951545625925064, 0.21296297013759613, 0.23077136278152466, 0.24857977032661438, 0.2663881778717041, 0.2841965854167938, 0.30200499296188354, 0.31981340050697327, 0.337621808052063, 0.3554301857948303, 0.37323859333992004, 0.39104700088500977, 0.4088554084300995, 0.4266638159751892, 0.44447222352027893, 0.46228063106536865, 0.480089008808136, 0.4978974461555481, 0.5157058238983154, 0.5335142612457275, 0.5513226389884949]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 9.0, 11.0, 19.0, 51.0, 108.0, 285.0, 904.0, 3330.0, 18438.0, 318264.0, 3809699.0, 35849.0, 5375.0, 1301.0, 380.0, 140.0, 58.0, 22.0, 17.0, 10.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0889892578125, -0.08613300323486328, -0.08327674865722656, -0.08042049407958984, -0.07756423950195312, -0.0747079849243164, -0.07185173034667969, -0.06899547576904297, -0.06613922119140625, -0.06328296661376953, -0.06042671203613281, -0.057570457458496094, -0.054714202880859375, -0.051857948303222656, -0.04900169372558594, -0.04614543914794922, -0.0432891845703125, -0.04043292999267578, -0.03757667541503906, -0.034720420837402344, -0.031864166259765625, -0.029007911682128906, -0.026151657104492188, -0.02329540252685547, -0.02043914794921875, -0.01758289337158203, -0.014726638793945312, -0.011870384216308594, -0.009014129638671875, -0.006157875061035156, -0.0033016204833984375, -0.00044536590576171875, 0.002410888671875, 0.005267143249511719, 0.008123397827148438, 0.010979652404785156, 0.013835906982421875, 0.016692161560058594, 0.019548416137695312, 0.02240467071533203, 0.02526092529296875, 0.02811717987060547, 0.030973434448242188, 0.033829689025878906, 0.036685943603515625, 0.039542198181152344, 0.04239845275878906, 0.04525470733642578, 0.0481109619140625, 0.05096721649169922, 0.05382347106933594, 0.056679725646972656, 0.059535980224609375, 0.062392234802246094, 0.06524848937988281, 0.06810474395751953, 0.07096099853515625, 0.07381725311279297, 0.07667350769042969, 0.0795297622680664, 0.08238601684570312, 0.08524227142333984, 0.08809852600097656, 0.09095478057861328, 0.09381103515625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 15.0, 18.0, 18.0, 29.0, 41.0, 70.0, 68.0, 85.0, 92.0, 92.0, 100.0, 81.0, 72.0, 54.0, 71.0, 24.0, 28.0, 14.0, 9.0, 8.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0789794921875, -0.07708072662353516, -0.07518196105957031, -0.07328319549560547, -0.07138442993164062, -0.06948566436767578, -0.06758689880371094, -0.0656881332397461, -0.06378936767578125, -0.061890602111816406, -0.05999183654785156, -0.05809307098388672, -0.056194305419921875, -0.05429553985595703, -0.05239677429199219, -0.050498008728027344, -0.0485992431640625, -0.046700477600097656, -0.04480171203613281, -0.04290294647216797, -0.041004180908203125, -0.03910541534423828, -0.03720664978027344, -0.035307884216308594, -0.03340911865234375, -0.031510353088378906, -0.029611587524414062, -0.02771282196044922, -0.025814056396484375, -0.02391529083251953, -0.022016525268554688, -0.020117759704589844, -0.018218994140625, -0.016320228576660156, -0.014421463012695312, -0.012522697448730469, -0.010623931884765625, -0.008725166320800781, -0.0068264007568359375, -0.004927635192871094, -0.00302886962890625, -0.0011301040649414062, 0.0007686614990234375, 0.0026674270629882812, 0.004566192626953125, 0.006464958190917969, 0.008363723754882812, 0.010262489318847656, 0.0121612548828125, 0.014060020446777344, 0.015958786010742188, 0.01785755157470703, 0.019756317138671875, 0.02165508270263672, 0.023553848266601562, 0.025452613830566406, 0.02735137939453125, 0.029250144958496094, 0.031148910522460938, 0.03304767608642578, 0.034946441650390625, 0.03684520721435547, 0.03874397277832031, 0.040642738342285156, 0.04254150390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 8.0, 11.0, 14.0, 30.0, 61.0, 86.0, 149.0, 311.0, 532.0, 1136.0, 2182.0, 4539.0, 10578.0, 29281.0, 116686.0, 3328016.0, 592531.0, 71742.0, 21004.0, 8163.0, 3588.0, 1707.0, 907.0, 441.0, 245.0, 153.0, 88.0, 36.0, 26.0, 11.0, 10.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0350341796875, -0.03350067138671875, -0.0319671630859375, -0.03043365478515625, -0.028900146484375, -0.02736663818359375, -0.0258331298828125, -0.02429962158203125, -0.02276611328125, -0.02123260498046875, -0.0196990966796875, -0.01816558837890625, -0.016632080078125, -0.01509857177734375, -0.0135650634765625, -0.01203155517578125, -0.010498046875, -0.00896453857421875, -0.0074310302734375, -0.00589752197265625, -0.004364013671875, -0.00283050537109375, -0.0012969970703125, 0.00023651123046875, 0.00177001953125, 0.00330352783203125, 0.0048370361328125, 0.00637054443359375, 0.007904052734375, 0.00943756103515625, 0.0109710693359375, 0.01250457763671875, 0.0140380859375, 0.01557159423828125, 0.0171051025390625, 0.01863861083984375, 0.020172119140625, 0.02170562744140625, 0.0232391357421875, 0.02477264404296875, 0.02630615234375, 0.02783966064453125, 0.0293731689453125, 0.03090667724609375, 0.032440185546875, 0.03397369384765625, 0.0355072021484375, 0.03704071044921875, 0.03857421875, 0.04010772705078125, 0.0416412353515625, 0.04317474365234375, 0.044708251953125, 0.04624176025390625, 0.0477752685546875, 0.04930877685546875, 0.05084228515625, 0.05237579345703125, 0.0539093017578125, 0.05544281005859375, 0.056976318359375, 0.05850982666015625, 0.0600433349609375, 0.06157684326171875, 0.0631103515625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 9.0, 12.0, 16.0, 20.0, 20.0, 39.0, 54.0, 74.0, 151.0, 312.0, 2208.0, 601.0, 205.0, 103.0, 65.0, 42.0, 26.0, 18.0, 17.0, 8.0, 8.0, 8.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01128387451171875, -0.010904669761657715, -0.01052546501159668, -0.010146260261535645, -0.00976705551147461, -0.009387850761413574, -0.009008646011352539, -0.008629441261291504, -0.008250236511230469, -0.007871031761169434, -0.0074918270111083984, -0.007112622261047363, -0.006733417510986328, -0.006354212760925293, -0.005975008010864258, -0.005595803260803223, -0.0052165985107421875, -0.004837393760681152, -0.004458189010620117, -0.004078984260559082, -0.003699779510498047, -0.0033205747604370117, -0.0029413700103759766, -0.0025621652603149414, -0.0021829605102539062, -0.001803755760192871, -0.001424551010131836, -0.0010453462600708008, -0.0006661415100097656, -0.00028693675994873047, 9.226799011230469e-05, 0.00047147274017333984, 0.000850677490234375, 0.0012298822402954102, 0.0016090869903564453, 0.0019882917404174805, 0.0023674964904785156, 0.0027467012405395508, 0.003125905990600586, 0.003505110740661621, 0.0038843154907226562, 0.004263520240783691, 0.0046427249908447266, 0.005021929740905762, 0.005401134490966797, 0.005780339241027832, 0.006159543991088867, 0.006538748741149902, 0.0069179534912109375, 0.007297158241271973, 0.007676362991333008, 0.008055567741394043, 0.008434772491455078, 0.008813977241516113, 0.009193181991577148, 0.009572386741638184, 0.009951591491699219, 0.010330796241760254, 0.010710000991821289, 0.011089205741882324, 0.01146841049194336, 0.011847615242004395, 0.01222681999206543, 0.012606024742126465, 0.0129852294921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 10.0, 22.0, 24.0, 43.0, 58.0, 84.0, 132.0, 114.0, 118.0, 115.0, 87.0, 61.0, 52.0, 29.0, 17.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08026564121246338, -0.07788148522377014, -0.0754973292350769, -0.07311317324638367, -0.07072901725769043, -0.06834486126899719, -0.06596070528030396, -0.06357654929161072, -0.06119238957762718, -0.058808233588933945, -0.05642407760024071, -0.05403992161154747, -0.051655761897563934, -0.0492716059088707, -0.04688744992017746, -0.04450329393148422, -0.042119137942790985, -0.03973498195409775, -0.03735082596540451, -0.03496666997671127, -0.032582513988018036, -0.03019835613667965, -0.027814198285341263, -0.025430042296648026, -0.023045886307954788, -0.02066173031926155, -0.018277574330568314, -0.015893416479229927, -0.01350926049053669, -0.011125104501843452, -0.00874094758182764, -0.006356790661811829, -0.003972634673118591, -0.0015884782187640667, 0.0007956782355904579, 0.0031798346899449825, 0.005563991144299507, 0.007948147132992744, 0.010332304053008556, 0.012716460973024368, 0.015100616961717606, 0.017484772950410843, 0.01986892893910408, 0.022253086790442467, 0.024637242779135704, 0.02702139876782894, 0.029405556619167328, 0.031789712607860565, 0.0341738685965538, 0.03655802458524704, 0.03894218057394028, 0.041326336562633514, 0.04371049255132675, 0.04609464854001999, 0.048478808254003525, 0.05086296424269676, 0.05324712023139, 0.05563127622008324, 0.058015432208776474, 0.06039958819746971, 0.06278374791145325, 0.06516790390014648, 0.06755205988883972, 0.06993621587753296, 0.0723203718662262]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 7.0, 9.0, 8.0, 18.0, 16.0, 27.0, 25.0, 26.0, 32.0, 40.0, 43.0, 47.0, 46.0, 47.0, 61.0, 66.0, 53.0, 42.0, 66.0, 49.0, 60.0, 37.0, 21.0, 25.0, 23.0, 21.0, 17.0, 11.0, 14.0, 13.0, 9.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0516352653503418, -0.0500616617500782, -0.048488058149814606, -0.04691445454955101, -0.045340850949287415, -0.04376724734902382, -0.04219364374876022, -0.04062004014849663, -0.03904643654823303, -0.03747283294796944, -0.03589922934770584, -0.034325625747442245, -0.03275202214717865, -0.031178418546915054, -0.02960481494665146, -0.028031211346387863, -0.026457607746124268, -0.024884004145860672, -0.023310400545597076, -0.02173679694533348, -0.020163193345069885, -0.01858958974480629, -0.017015986144542694, -0.015442382544279099, -0.013868778944015503, -0.012295175343751907, -0.010721571743488312, -0.009147968143224716, -0.007574364542961121, -0.006000760942697525, -0.0044271573424339294, -0.002853553742170334, -0.0012799501419067383, 0.0002936534583568573, 0.0018672570586204529, 0.0034408606588840485, 0.005014464259147644, 0.00658806785941124, 0.008161671459674835, 0.00973527505993843, 0.011308878660202026, 0.012882482260465622, 0.014456085860729218, 0.016029689460992813, 0.01760329306125641, 0.019176896661520004, 0.0207505002617836, 0.022324103862047195, 0.02389770746231079, 0.025471311062574387, 0.027044914662837982, 0.028618518263101578, 0.030192121863365173, 0.03176572546362877, 0.033339329063892365, 0.03491293266415596, 0.036486536264419556, 0.03806013986468315, 0.03963374346494675, 0.04120734706521034, 0.04278095066547394, 0.044354554265737534, 0.04592815786600113, 0.047501761466264725, 0.04907536506652832]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 9.0, 15.0, 18.0, 28.0, 58.0, 92.0, 126.0, 203.0, 360.0, 857.0, 2228.0, 7364.0, 29700.0, 143288.0, 427262.0, 329428.0, 82081.0, 17698.0, 4696.0, 1678.0, 654.0, 338.0, 152.0, 77.0, 51.0, 33.0, 15.0, 18.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056610107421875, -0.0548853874206543, -0.053160667419433594, -0.05143594741821289, -0.04971122741699219, -0.047986507415771484, -0.04626178741455078, -0.04453706741333008, -0.042812347412109375, -0.04108762741088867, -0.03936290740966797, -0.037638187408447266, -0.03591346740722656, -0.03418874740600586, -0.032464027404785156, -0.030739307403564453, -0.02901458740234375, -0.027289867401123047, -0.025565147399902344, -0.02384042739868164, -0.022115707397460938, -0.020390987396240234, -0.01866626739501953, -0.016941547393798828, -0.015216827392578125, -0.013492107391357422, -0.011767387390136719, -0.010042667388916016, -0.008317947387695312, -0.006593227386474609, -0.004868507385253906, -0.003143787384033203, -0.0014190673828125, 0.0003056526184082031, 0.0020303726196289062, 0.0037550926208496094, 0.0054798126220703125, 0.007204532623291016, 0.008929252624511719, 0.010653972625732422, 0.012378692626953125, 0.014103412628173828, 0.01582813262939453, 0.017552852630615234, 0.019277572631835938, 0.02100229263305664, 0.022727012634277344, 0.024451732635498047, 0.02617645263671875, 0.027901172637939453, 0.029625892639160156, 0.03135061264038086, 0.03307533264160156, 0.034800052642822266, 0.03652477264404297, 0.03824949264526367, 0.039974212646484375, 0.04169893264770508, 0.04342365264892578, 0.045148372650146484, 0.04687309265136719, 0.04859781265258789, 0.050322532653808594, 0.0520472526550293, 0.05377197265625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 10.0, 10.0, 14.0, 15.0, 25.0, 39.0, 42.0, 44.0, 56.0, 58.0, 70.0, 76.0, 84.0, 64.0, 69.0, 70.0, 54.0, 55.0, 34.0, 32.0, 14.0, 26.0, 9.0, 13.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.05975341796875, -0.058199405670166016, -0.05664539337158203, -0.05509138107299805, -0.05353736877441406, -0.05198335647583008, -0.050429344177246094, -0.04887533187866211, -0.047321319580078125, -0.04576730728149414, -0.044213294982910156, -0.04265928268432617, -0.04110527038574219, -0.0395512580871582, -0.03799724578857422, -0.036443233489990234, -0.03488922119140625, -0.033335208892822266, -0.03178119659423828, -0.030227184295654297, -0.028673171997070312, -0.027119159698486328, -0.025565147399902344, -0.02401113510131836, -0.022457122802734375, -0.02090311050415039, -0.019349098205566406, -0.017795085906982422, -0.016241073608398438, -0.014687061309814453, -0.013133049011230469, -0.011579036712646484, -0.0100250244140625, -0.008471012115478516, -0.006916999816894531, -0.005362987518310547, -0.0038089752197265625, -0.002254962921142578, -0.0007009506225585938, 0.0008530616760253906, 0.002407073974609375, 0.003961086273193359, 0.005515098571777344, 0.007069110870361328, 0.008623123168945312, 0.010177135467529297, 0.011731147766113281, 0.013285160064697266, 0.01483917236328125, 0.016393184661865234, 0.01794719696044922, 0.019501209259033203, 0.021055221557617188, 0.022609233856201172, 0.024163246154785156, 0.02571725845336914, 0.027271270751953125, 0.02882528305053711, 0.030379295349121094, 0.03193330764770508, 0.03348731994628906, 0.03504133224487305, 0.03659534454345703, 0.038149356842041016, 0.039703369140625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 8.0, 17.0, 21.0, 34.0, 46.0, 73.0, 118.0, 178.0, 360.0, 559.0, 1100.0, 2876.0, 17305.0, 381313.0, 609016.0, 28861.0, 3741.0, 1329.0, 632.0, 332.0, 216.0, 128.0, 84.0, 68.0, 50.0, 20.0, 16.0, 12.0, 11.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08349609375, -0.0804147720336914, -0.07733345031738281, -0.07425212860107422, -0.07117080688476562, -0.06808948516845703, -0.06500816345214844, -0.061926841735839844, -0.05884552001953125, -0.055764198303222656, -0.05268287658691406, -0.04960155487060547, -0.046520233154296875, -0.04343891143798828, -0.04035758972167969, -0.037276268005371094, -0.0341949462890625, -0.031113624572753906, -0.028032302856445312, -0.02495098114013672, -0.021869659423828125, -0.01878833770751953, -0.015707015991210938, -0.012625694274902344, -0.00954437255859375, -0.006463050842285156, -0.0033817291259765625, -0.00030040740966796875, 0.002780914306640625, 0.005862236022949219, 0.008943557739257812, 0.012024879455566406, 0.015106201171875, 0.018187522888183594, 0.021268844604492188, 0.02435016632080078, 0.027431488037109375, 0.03051280975341797, 0.03359413146972656, 0.036675453186035156, 0.03975677490234375, 0.042838096618652344, 0.04591941833496094, 0.04900074005126953, 0.052082061767578125, 0.05516338348388672, 0.05824470520019531, 0.061326026916503906, 0.0644073486328125, 0.0674886703491211, 0.07056999206542969, 0.07365131378173828, 0.07673263549804688, 0.07981395721435547, 0.08289527893066406, 0.08597660064697266, 0.08905792236328125, 0.09213924407958984, 0.09522056579589844, 0.09830188751220703, 0.10138320922851562, 0.10446453094482422, 0.10754585266113281, 0.1106271743774414, 0.11370849609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 3.0, 4.0, 4.0, 10.0, 14.0, 11.0, 18.0, 17.0, 17.0, 18.0, 36.0, 24.0, 48.0, 35.0, 39.0, 27.0, 47.0, 48.0, 38.0, 40.0, 37.0, 45.0, 49.0, 43.0, 34.0, 42.0, 28.0, 42.0, 27.0, 27.0, 21.0, 16.0, 11.0, 10.0, 19.0, 11.0, 10.0, 3.0, 3.0, 4.0, 6.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11541748046875, -0.11178970336914062, -0.10816192626953125, -0.10453414916992188, -0.1009063720703125, -0.09727859497070312, -0.09365081787109375, -0.09002304077148438, -0.086395263671875, -0.08276748657226562, -0.07913970947265625, -0.07551193237304688, -0.0718841552734375, -0.06825637817382812, -0.06462860107421875, -0.061000823974609375, -0.057373046875, -0.053745269775390625, -0.05011749267578125, -0.046489715576171875, -0.0428619384765625, -0.039234161376953125, -0.03560638427734375, -0.031978607177734375, -0.028350830078125, -0.024723052978515625, -0.02109527587890625, -0.017467498779296875, -0.0138397216796875, -0.010211944580078125, -0.00658416748046875, -0.002956390380859375, 0.00067138671875, 0.004299163818359375, 0.00792694091796875, 0.011554718017578125, 0.0151824951171875, 0.018810272216796875, 0.02243804931640625, 0.026065826416015625, 0.029693603515625, 0.033321380615234375, 0.03694915771484375, 0.040576934814453125, 0.0442047119140625, 0.047832489013671875, 0.05146026611328125, 0.055088043212890625, 0.0587158203125, 0.062343597412109375, 0.06597137451171875, 0.06959915161132812, 0.0732269287109375, 0.07685470581054688, 0.08048248291015625, 0.08411026000976562, 0.087738037109375, 0.09136581420898438, 0.09499359130859375, 0.09862136840820312, 0.1022491455078125, 0.10587692260742188, 0.10950469970703125, 0.11313247680664062, 0.11676025390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 13.0, 5.0, 11.0, 9.0, 10.0, 12.0, 32.0, 42.0, 61.0, 95.0, 232.0, 561.0, 1766.0, 9191.0, 145868.0, 821177.0, 61730.0, 5544.0, 1270.0, 440.0, 193.0, 115.0, 54.0, 39.0, 16.0, 14.0, 20.0, 15.0, 4.0, 3.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04833984375, -0.046573638916015625, -0.04480743408203125, -0.043041229248046875, -0.0412750244140625, -0.039508819580078125, -0.03774261474609375, -0.035976409912109375, -0.034210205078125, -0.032444000244140625, -0.03067779541015625, -0.028911590576171875, -0.0271453857421875, -0.025379180908203125, -0.02361297607421875, -0.021846771240234375, -0.02008056640625, -0.018314361572265625, -0.01654815673828125, -0.014781951904296875, -0.0130157470703125, -0.011249542236328125, -0.00948333740234375, -0.007717132568359375, -0.005950927734375, -0.004184722900390625, -0.00241851806640625, -0.000652313232421875, 0.0011138916015625, 0.002880096435546875, 0.00464630126953125, 0.006412506103515625, 0.0081787109375, 0.009944915771484375, 0.01171112060546875, 0.013477325439453125, 0.0152435302734375, 0.017009735107421875, 0.01877593994140625, 0.020542144775390625, 0.022308349609375, 0.024074554443359375, 0.02584075927734375, 0.027606964111328125, 0.0293731689453125, 0.031139373779296875, 0.03290557861328125, 0.034671783447265625, 0.03643798828125, 0.038204193115234375, 0.03997039794921875, 0.041736602783203125, 0.0435028076171875, 0.045269012451171875, 0.04703521728515625, 0.048801422119140625, 0.050567626953125, 0.052333831787109375, 0.05410003662109375, 0.055866241455078125, 0.0576324462890625, 0.059398651123046875, 0.06116485595703125, 0.06293106079101562, 0.064697265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 4.0, 6.0, 18.0, 24.0, 33.0, 33.0, 49.0, 52.0, 83.0, 111.0, 110.0, 98.0, 102.0, 82.0, 55.0, 41.0, 28.0, 27.0, 14.0, 10.0, 5.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55055046081543e-05, -6.356462836265564e-05, -6.162375211715698e-05, -5.9682875871658325e-05, -5.774199962615967e-05, -5.580112338066101e-05, -5.3860247135162354e-05, -5.1919370889663696e-05, -4.997849464416504e-05, -4.803761839866638e-05, -4.6096742153167725e-05, -4.415586590766907e-05, -4.221498966217041e-05, -4.027411341667175e-05, -3.8333237171173096e-05, -3.639236092567444e-05, -3.445148468017578e-05, -3.2510608434677124e-05, -3.056973218917847e-05, -2.862885594367981e-05, -2.6687979698181152e-05, -2.4747103452682495e-05, -2.2806227207183838e-05, -2.086535096168518e-05, -1.8924474716186523e-05, -1.6983598470687866e-05, -1.5042722225189209e-05, -1.3101845979690552e-05, -1.1160969734191895e-05, -9.220093488693237e-06, -7.27921724319458e-06, -5.338340997695923e-06, -3.3974647521972656e-06, -1.4565885066986084e-06, 4.842877388000488e-07, 2.425163984298706e-06, 4.366040229797363e-06, 6.3069164752960205e-06, 8.247792720794678e-06, 1.0188668966293335e-05, 1.2129545211791992e-05, 1.407042145729065e-05, 1.6011297702789307e-05, 1.7952173948287964e-05, 1.989305019378662e-05, 2.183392643928528e-05, 2.3774802684783936e-05, 2.5715678930282593e-05, 2.765655517578125e-05, 2.9597431421279907e-05, 3.1538307666778564e-05, 3.347918391227722e-05, 3.542006015777588e-05, 3.7360936403274536e-05, 3.930181264877319e-05, 4.124268889427185e-05, 4.318356513977051e-05, 4.5124441385269165e-05, 4.706531763076782e-05, 4.900619387626648e-05, 5.094707012176514e-05, 5.2887946367263794e-05, 5.482882261276245e-05, 5.676969885826111e-05, 5.8710575103759766e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 11.0, 10.0, 26.0, 38.0, 58.0, 131.0, 342.0, 1233.0, 9438.0, 746672.0, 283936.0, 5181.0, 916.0, 302.0, 118.0, 63.0, 31.0, 17.0, 16.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0953369140625, -0.0921468734741211, -0.08895683288574219, -0.08576679229736328, -0.08257675170898438, -0.07938671112060547, -0.07619667053222656, -0.07300662994384766, -0.06981658935546875, -0.06662654876708984, -0.06343650817871094, -0.06024646759033203, -0.057056427001953125, -0.05386638641357422, -0.05067634582519531, -0.047486305236816406, -0.0442962646484375, -0.041106224060058594, -0.03791618347167969, -0.03472614288330078, -0.031536102294921875, -0.02834606170654297, -0.025156021118164062, -0.021965980529785156, -0.01877593994140625, -0.015585899353027344, -0.012395858764648438, -0.009205818176269531, -0.006015777587890625, -0.0028257369995117188, 0.0003643035888671875, 0.0035543441772460938, 0.006744384765625, 0.009934425354003906, 0.013124465942382812, 0.01631450653076172, 0.019504547119140625, 0.02269458770751953, 0.025884628295898438, 0.029074668884277344, 0.03226470947265625, 0.035454750061035156, 0.03864479064941406, 0.04183483123779297, 0.045024871826171875, 0.04821491241455078, 0.05140495300292969, 0.054594993591308594, 0.0577850341796875, 0.060975074768066406, 0.06416511535644531, 0.06735515594482422, 0.07054519653320312, 0.07373523712158203, 0.07692527770996094, 0.08011531829833984, 0.08330535888671875, 0.08649539947509766, 0.08968544006347656, 0.09287548065185547, 0.09606552124023438, 0.09925556182861328, 0.10244560241699219, 0.1056356430053711, 0.10882568359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 8.0, 9.0, 23.0, 15.0, 33.0, 46.0, 61.0, 66.0, 69.0, 77.0, 88.0, 72.0, 65.0, 70.0, 66.0, 55.0, 34.0, 27.0, 24.0, 26.0, 22.0, 6.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022003173828125, -0.020963191986083984, -0.01992321014404297, -0.018883228302001953, -0.017843246459960938, -0.016803264617919922, -0.015763282775878906, -0.01472330093383789, -0.013683319091796875, -0.01264333724975586, -0.011603355407714844, -0.010563373565673828, -0.009523391723632812, -0.008483409881591797, -0.007443428039550781, -0.006403446197509766, -0.00536346435546875, -0.004323482513427734, -0.0032835006713867188, -0.002243518829345703, -0.0012035369873046875, -0.00016355514526367188, 0.0008764266967773438, 0.0019164085388183594, 0.002956390380859375, 0.003996372222900391, 0.005036354064941406, 0.006076335906982422, 0.0071163177490234375, 0.008156299591064453, 0.009196281433105469, 0.010236263275146484, 0.0112762451171875, 0.012316226959228516, 0.013356208801269531, 0.014396190643310547, 0.015436172485351562, 0.016476154327392578, 0.017516136169433594, 0.01855611801147461, 0.019596099853515625, 0.02063608169555664, 0.021676063537597656, 0.022716045379638672, 0.023756027221679688, 0.024796009063720703, 0.02583599090576172, 0.026875972747802734, 0.02791595458984375, 0.028955936431884766, 0.02999591827392578, 0.031035900115966797, 0.03207588195800781, 0.03311586380004883, 0.034155845642089844, 0.03519582748413086, 0.036235809326171875, 0.03727579116821289, 0.038315773010253906, 0.03935575485229492, 0.04039573669433594, 0.04143571853637695, 0.04247570037841797, 0.043515682220458984, 0.0445556640625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 23.0, 114.0, 307.0, 354.0, 137.0, 45.0, 10.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8783001899719238, -0.8324673771858215, -0.786634624004364, -0.7408018112182617, -0.6949689984321594, -0.6491361856460571, -0.6033034324645996, -0.5574706196784973, -0.511637806892395, -0.4658050239086151, -0.4199722111225128, -0.3741394281387329, -0.3283066153526306, -0.2824738323688507, -0.2366410493850708, -0.1908082365989685, -0.144975483417511, -0.09914268553256989, -0.05330989509820938, -0.007477104663848877, 0.038355693221092224, 0.08418849110603333, 0.13002127408981323, 0.17585408687591553, 0.22168686985969543, 0.26751965284347534, 0.31335246562957764, 0.35918524861335754, 0.40501803159713745, 0.45085084438323975, 0.49668362736701965, 0.5425164699554443, 0.5883492231369019, 0.6341820359230042, 0.6800147891044617, 0.725847601890564, 0.7716804146766663, 0.8175132274627686, 0.8633459806442261, 0.9091787934303284, 0.9550116062164307, 1.0008443593978882, 1.0466772317886353, 1.0925099849700928, 1.1383427381515503, 1.1841756105422974, 1.2300083637237549, 1.275841236114502, 1.32167387008667, 1.3675066232681274, 1.4133394956588745, 1.459172248840332, 1.5050050020217896, 1.5508378744125366, 1.5966706275939941, 1.6425034999847412, 1.6883362531661987, 1.7341690063476562, 1.7800018787384033, 1.8258346319198608, 1.8716673851013184, 1.9175002574920654, 1.963333010673523, 2.0091657638549805, 2.0549986362457275]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 16.0, 5.0, 11.0, 16.0, 11.0, 21.0, 21.0, 22.0, 20.0, 40.0, 28.0, 47.0, 42.0, 39.0, 58.0, 42.0, 50.0, 52.0, 53.0, 49.0, 52.0, 28.0, 32.0, 21.0, 32.0, 29.0, 32.0, 23.0, 19.0, 14.0, 17.0, 16.0, 8.0, 6.0, 4.0, 4.0, 5.0, 5.0, 6.0, 1.0, 0.0, 2.0], "bins": [-0.7230413556098938, -0.7045522332191467, -0.6860631108283997, -0.6675739288330078, -0.6490848064422607, -0.6305956840515137, -0.6121065616607666, -0.5936174392700195, -0.5751283168792725, -0.5566391944885254, -0.5381500720977783, -0.5196608901023865, -0.5011717677116394, -0.48268264532089233, -0.46419352293014526, -0.4457044005393982, -0.42721521854400635, -0.4087260961532593, -0.3902369439601898, -0.37174782156944275, -0.3532586693763733, -0.3347695469856262, -0.31628042459487915, -0.2977913022041321, -0.2793021500110626, -0.26081302762031555, -0.2423238754272461, -0.22383475303649902, -0.20534561574459076, -0.1868564784526825, -0.16836735606193542, -0.14987821877002716, -0.13138914108276367, -0.11290000379085541, -0.09441087394952774, -0.07592174410820007, -0.05743260681629181, -0.038943469524383545, -0.020454339683055878, -0.0019652098417282104, 0.016523927450180054, 0.03501306101679802, 0.053502194583415985, 0.07199132442474365, 0.09048046171665192, 0.10896959900856018, 0.12745872139930725, 0.14594785869121552, 0.16443699598312378, 0.18292613327503204, 0.2014152705669403, 0.21990439295768738, 0.23839353024959564, 0.2568826675415039, 0.275371789932251, 0.29386091232299805, 0.3123500645160675, 0.3308391869068146, 0.34932833909988403, 0.3678174614906311, 0.3863065838813782, 0.40479573607444763, 0.4232848584651947, 0.44177401065826416, 0.46026313304901123]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 19.0, 32.0, 124.0, 324.0, 1097.0, 10631.0, 4104674.0, 73629.0, 2921.0, 549.0, 156.0, 55.0, 32.0, 17.0, 11.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.14908790588378906, -0.14351272583007812, -0.1379375457763672, -0.13236236572265625, -0.1267871856689453, -0.12121200561523438, -0.11563682556152344, -0.1100616455078125, -0.10448646545410156, -0.09891128540039062, -0.09333610534667969, -0.08776092529296875, -0.08218574523925781, -0.07661056518554688, -0.07103538513183594, -0.065460205078125, -0.05988502502441406, -0.054309844970703125, -0.04873466491699219, -0.04315948486328125, -0.03758430480957031, -0.032009124755859375, -0.026433944702148438, -0.0208587646484375, -0.015283584594726562, -0.009708404541015625, -0.0041332244873046875, 0.00144195556640625, 0.0070171356201171875, 0.012592315673828125, 0.018167495727539062, 0.02374267578125, 0.029317855834960938, 0.034893035888671875, 0.04046821594238281, 0.04604339599609375, 0.05161857604980469, 0.057193756103515625, 0.06276893615722656, 0.0683441162109375, 0.07391929626464844, 0.07949447631835938, 0.08506965637207031, 0.09064483642578125, 0.09622001647949219, 0.10179519653320312, 0.10737037658691406, 0.112945556640625, 0.11852073669433594, 0.12409591674804688, 0.1296710968017578, 0.13524627685546875, 0.1408214569091797, 0.14639663696289062, 0.15197181701660156, 0.1575469970703125, 0.16312217712402344, 0.16869735717773438, 0.1742725372314453, 0.17984771728515625, 0.1854228973388672, 0.19099807739257812, 0.19657325744628906, 0.2021484375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 15.0, 18.0, 25.0, 29.0, 30.0, 43.0, 48.0, 66.0, 64.0, 57.0, 84.0, 73.0, 76.0, 67.0, 68.0, 49.0, 46.0, 31.0, 27.0, 22.0, 19.0, 13.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.06494140625, -0.06331586837768555, -0.061690330505371094, -0.06006479263305664, -0.05843925476074219, -0.056813716888427734, -0.05518817901611328, -0.05356264114379883, -0.051937103271484375, -0.05031156539916992, -0.04868602752685547, -0.047060489654541016, -0.04543495178222656, -0.04380941390991211, -0.042183876037597656, -0.0405583381652832, -0.03893280029296875, -0.0373072624206543, -0.035681724548339844, -0.03405618667602539, -0.03243064880371094, -0.030805110931396484, -0.02917957305908203, -0.027554035186767578, -0.025928497314453125, -0.024302959442138672, -0.02267742156982422, -0.021051883697509766, -0.019426345825195312, -0.01780080795288086, -0.016175270080566406, -0.014549732208251953, -0.0129241943359375, -0.011298656463623047, -0.009673118591308594, -0.00804758071899414, -0.0064220428466796875, -0.004796504974365234, -0.0031709671020507812, -0.0015454292297363281, 8.0108642578125e-05, 0.0017056465148925781, 0.0033311843872070312, 0.004956722259521484, 0.0065822601318359375, 0.00820779800415039, 0.009833335876464844, 0.011458873748779297, 0.01308441162109375, 0.014709949493408203, 0.016335487365722656, 0.01796102523803711, 0.019586563110351562, 0.021212100982666016, 0.02283763885498047, 0.024463176727294922, 0.026088714599609375, 0.027714252471923828, 0.02933979034423828, 0.030965328216552734, 0.03259086608886719, 0.03421640396118164, 0.035841941833496094, 0.03746747970581055, 0.039093017578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 8.0, 10.0, 14.0, 22.0, 33.0, 50.0, 85.0, 136.0, 203.0, 379.0, 644.0, 1436.0, 4001.0, 14035.0, 99833.0, 3913575.0, 135271.0, 16577.0, 4541.0, 1650.0, 758.0, 408.0, 222.0, 132.0, 87.0, 66.0, 34.0, 24.0, 15.0, 12.0, 10.0, 8.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0849609375, -0.0824289321899414, -0.07989692687988281, -0.07736492156982422, -0.07483291625976562, -0.07230091094970703, -0.06976890563964844, -0.06723690032958984, -0.06470489501953125, -0.062172889709472656, -0.05964088439941406, -0.05710887908935547, -0.054576873779296875, -0.05204486846923828, -0.04951286315917969, -0.046980857849121094, -0.0444488525390625, -0.041916847229003906, -0.03938484191894531, -0.03685283660888672, -0.034320831298828125, -0.03178882598876953, -0.029256820678710938, -0.026724815368652344, -0.02419281005859375, -0.021660804748535156, -0.019128799438476562, -0.01659679412841797, -0.014064788818359375, -0.011532783508300781, -0.009000778198242188, -0.006468772888183594, -0.003936767578125, -0.0014047622680664062, 0.0011272430419921875, 0.0036592483520507812, 0.006191253662109375, 0.008723258972167969, 0.011255264282226562, 0.013787269592285156, 0.01631927490234375, 0.018851280212402344, 0.021383285522460938, 0.02391529083251953, 0.026447296142578125, 0.02897930145263672, 0.03151130676269531, 0.034043312072753906, 0.0365753173828125, 0.039107322692871094, 0.04163932800292969, 0.04417133331298828, 0.046703338623046875, 0.04923534393310547, 0.05176734924316406, 0.054299354553222656, 0.05683135986328125, 0.059363365173339844, 0.06189537048339844, 0.06442737579345703, 0.06695938110351562, 0.06949138641357422, 0.07202339172363281, 0.0745553970336914, 0.07708740234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 4.0, 9.0, 23.0, 50.0, 142.0, 848.0, 2765.0, 141.0, 47.0, 20.0, 14.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0223846435546875, -0.021370649337768555, -0.02035665512084961, -0.019342660903930664, -0.01832866668701172, -0.017314672470092773, -0.016300678253173828, -0.015286684036254883, -0.014272689819335938, -0.013258695602416992, -0.012244701385498047, -0.011230707168579102, -0.010216712951660156, -0.009202718734741211, -0.008188724517822266, -0.00717473030090332, -0.006160736083984375, -0.00514674186706543, -0.004132747650146484, -0.003118753433227539, -0.0021047592163085938, -0.0010907649993896484, -7.677078247070312e-05, 0.0009372234344482422, 0.0019512176513671875, 0.002965211868286133, 0.003979206085205078, 0.0049932003021240234, 0.006007194519042969, 0.007021188735961914, 0.00803518295288086, 0.009049177169799805, 0.01006317138671875, 0.011077165603637695, 0.01209115982055664, 0.013105154037475586, 0.014119148254394531, 0.015133142471313477, 0.016147136688232422, 0.017161130905151367, 0.018175125122070312, 0.019189119338989258, 0.020203113555908203, 0.02121710777282715, 0.022231101989746094, 0.02324509620666504, 0.024259090423583984, 0.02527308464050293, 0.026287078857421875, 0.02730107307434082, 0.028315067291259766, 0.02932906150817871, 0.030343055725097656, 0.0313570499420166, 0.03237104415893555, 0.03338503837585449, 0.03439903259277344, 0.03541302680969238, 0.03642702102661133, 0.03744101524353027, 0.03845500946044922, 0.039469003677368164, 0.04048299789428711, 0.041496992111206055, 0.042510986328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 8.0, 13.0, 34.0, 83.0, 147.0, 200.0, 204.0, 163.0, 75.0, 35.0, 20.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11872594058513641, -0.11467283964157104, -0.11061973869800568, -0.10656663775444031, -0.10251353681087494, -0.09846043586730957, -0.0944073274731636, -0.09035422652959824, -0.08630112558603287, -0.0822480246424675, -0.07819492369890213, -0.07414182275533676, -0.0700887143611908, -0.06603561341762543, -0.06198251247406006, -0.05792941153049469, -0.05387631058692932, -0.04982320964336395, -0.045770108699798584, -0.04171700403094292, -0.03766390308737755, -0.03361080214381218, -0.02955769933760166, -0.025504596531391144, -0.021451495587825775, -0.017398394644260406, -0.013345291838049889, -0.009292189963161945, -0.005239088088274002, -0.0011859871447086334, 0.0028671156615018845, 0.006920218467712402, 0.010973304510116577, 0.01502640638500452, 0.019079508259892464, 0.02313261106610298, 0.02718571200966835, 0.03123881295323372, 0.035291917622089386, 0.039345018565654755, 0.04339811950922012, 0.04745122045278549, 0.05150432139635086, 0.05555742606520653, 0.059610527008771896, 0.06366363167762756, 0.06771673262119293, 0.0717698335647583, 0.07582293450832367, 0.07987603545188904, 0.0839291363954544, 0.08798223733901978, 0.09203533828258514, 0.09608843922615051, 0.10014154762029648, 0.10419464856386185, 0.10824774950742722, 0.11230085045099258, 0.11635395139455795, 0.12040705233812332, 0.12446016073226929, 0.12851326167583466, 0.13256636261940002, 0.1366194635629654, 0.14067256450653076]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 7.0, 1.0, 7.0, 3.0, 7.0, 9.0, 13.0, 4.0, 16.0, 12.0, 16.0, 11.0, 21.0, 32.0, 35.0, 35.0, 40.0, 28.0, 40.0, 46.0, 44.0, 44.0, 42.0, 42.0, 54.0, 48.0, 43.0, 31.0, 36.0, 36.0, 26.0, 19.0, 27.0, 28.0, 16.0, 19.0, 16.0, 17.0, 4.0, 5.0, 8.0, 7.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04854714870452881, -0.04703591763973236, -0.045524682849645615, -0.04401344805955887, -0.04250221699476242, -0.04099098592996597, -0.03947975113987923, -0.03796851634979248, -0.03645728528499603, -0.034946054220199585, -0.03343481943011284, -0.03192358464002609, -0.030412353575229645, -0.028901120647788048, -0.02738988772034645, -0.025878654792904854, -0.024367421865463257, -0.02285618893802166, -0.021344956010580063, -0.019833723083138466, -0.01832249015569687, -0.016811257228255272, -0.015300024300813675, -0.013788791373372078, -0.012277558445930481, -0.010766325518488884, -0.009255092591047287, -0.00774385966360569, -0.006232626736164093, -0.004721393808722496, -0.003210160881280899, -0.001698927953839302, -0.00018769502639770508, 0.001323537901043892, 0.002834770828485489, 0.004346003755927086, 0.005857236683368683, 0.00736846961081028, 0.008879702538251877, 0.010390935465693474, 0.01190216839313507, 0.013413401320576668, 0.014924634248018265, 0.016435867175459862, 0.01794710010290146, 0.019458333030343056, 0.020969565957784653, 0.02248079888522625, 0.023992031812667847, 0.025503264740109444, 0.02701449766755104, 0.028525730594992638, 0.030036963522434235, 0.03154819458723068, 0.03305942937731743, 0.034570664167404175, 0.03608189523220062, 0.03759312629699707, 0.039104361087083817, 0.04061559587717056, 0.04212682694196701, 0.04363805800676346, 0.045149292796850204, 0.04666052758693695, 0.0481717586517334]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 8.0, 7.0, 8.0, 17.0, 23.0, 18.0, 41.0, 58.0, 98.0, 136.0, 236.0, 481.0, 1066.0, 2565.0, 7653.0, 25529.0, 92357.0, 278678.0, 385178.0, 179327.0, 52525.0, 14591.0, 4667.0, 1593.0, 778.0, 339.0, 209.0, 119.0, 80.0, 49.0, 42.0, 18.0, 15.0, 12.0, 11.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.03729248046875, -0.03606081008911133, -0.034829139709472656, -0.033597469329833984, -0.03236579895019531, -0.03113412857055664, -0.02990245819091797, -0.028670787811279297, -0.027439117431640625, -0.026207447052001953, -0.02497577667236328, -0.02374410629272461, -0.022512435913085938, -0.021280765533447266, -0.020049095153808594, -0.018817424774169922, -0.01758575439453125, -0.016354084014892578, -0.015122413635253906, -0.013890743255615234, -0.012659072875976562, -0.01142740249633789, -0.010195732116699219, -0.008964061737060547, -0.007732391357421875, -0.006500720977783203, -0.005269050598144531, -0.004037380218505859, -0.0028057098388671875, -0.0015740394592285156, -0.00034236907958984375, 0.0008893013000488281, 0.0021209716796875, 0.003352642059326172, 0.004584312438964844, 0.005815982818603516, 0.0070476531982421875, 0.00827932357788086, 0.009510993957519531, 0.010742664337158203, 0.011974334716796875, 0.013206005096435547, 0.014437675476074219, 0.01566934585571289, 0.016901016235351562, 0.018132686614990234, 0.019364356994628906, 0.020596027374267578, 0.02182769775390625, 0.023059368133544922, 0.024291038513183594, 0.025522708892822266, 0.026754379272460938, 0.02798604965209961, 0.02921772003173828, 0.030449390411376953, 0.031681060791015625, 0.0329127311706543, 0.03414440155029297, 0.03537607192993164, 0.03660774230957031, 0.037839412689208984, 0.039071083068847656, 0.04030275344848633, 0.041534423828125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 10.0, 5.0, 13.0, 15.0, 23.0, 28.0, 25.0, 52.0, 49.0, 46.0, 74.0, 76.0, 98.0, 78.0, 70.0, 71.0, 62.0, 54.0, 46.0, 35.0, 24.0, 12.0, 17.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06524658203125, -0.06347894668579102, -0.06171131134033203, -0.05994367599487305, -0.05817604064941406, -0.05640840530395508, -0.054640769958496094, -0.05287313461303711, -0.051105499267578125, -0.04933786392211914, -0.047570228576660156, -0.04580259323120117, -0.04403495788574219, -0.0422673225402832, -0.04049968719482422, -0.038732051849365234, -0.03696441650390625, -0.035196781158447266, -0.03342914581298828, -0.0316615104675293, -0.029893875122070312, -0.028126239776611328, -0.026358604431152344, -0.02459096908569336, -0.022823333740234375, -0.02105569839477539, -0.019288063049316406, -0.017520427703857422, -0.015752792358398438, -0.013985157012939453, -0.012217521667480469, -0.010449886322021484, -0.0086822509765625, -0.006914615631103516, -0.005146980285644531, -0.003379344940185547, -0.0016117095947265625, 0.00015592575073242188, 0.0019235610961914062, 0.0036911964416503906, 0.005458831787109375, 0.007226467132568359, 0.008994102478027344, 0.010761737823486328, 0.012529373168945312, 0.014297008514404297, 0.01606464385986328, 0.017832279205322266, 0.01959991455078125, 0.021367549896240234, 0.02313518524169922, 0.024902820587158203, 0.026670455932617188, 0.028438091278076172, 0.030205726623535156, 0.03197336196899414, 0.033740997314453125, 0.03550863265991211, 0.037276268005371094, 0.03904390335083008, 0.04081153869628906, 0.04257917404174805, 0.04434680938720703, 0.046114444732666016, 0.047882080078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 2.0, 8.0, 11.0, 9.0, 22.0, 33.0, 50.0, 58.0, 128.0, 142.0, 313.0, 552.0, 1041.0, 2933.0, 25205.0, 695668.0, 307568.0, 10776.0, 2038.0, 848.0, 474.0, 260.0, 126.0, 109.0, 50.0, 36.0, 27.0, 13.0, 18.0, 13.0, 8.0, 7.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.101318359375, -0.09823417663574219, -0.09514999389648438, -0.09206581115722656, -0.08898162841796875, -0.08589744567871094, -0.08281326293945312, -0.07972908020019531, -0.0766448974609375, -0.07356071472167969, -0.07047653198242188, -0.06739234924316406, -0.06430816650390625, -0.06122398376464844, -0.058139801025390625, -0.05505561828613281, -0.051971435546875, -0.04888725280761719, -0.045803070068359375, -0.04271888732910156, -0.03963470458984375, -0.03655052185058594, -0.033466339111328125, -0.030382156372070312, -0.0272979736328125, -0.024213790893554688, -0.021129608154296875, -0.018045425415039062, -0.01496124267578125, -0.011877059936523438, -0.008792877197265625, -0.0057086944580078125, -0.00262451171875, 0.0004596710205078125, 0.003543853759765625, 0.0066280364990234375, 0.00971221923828125, 0.012796401977539062, 0.015880584716796875, 0.018964767456054688, 0.0220489501953125, 0.025133132934570312, 0.028217315673828125, 0.03130149841308594, 0.03438568115234375, 0.03746986389160156, 0.040554046630859375, 0.04363822937011719, 0.046722412109375, 0.04980659484863281, 0.052890777587890625, 0.05597496032714844, 0.05905914306640625, 0.06214332580566406, 0.06522750854492188, 0.06831169128417969, 0.0713958740234375, 0.07448005676269531, 0.07756423950195312, 0.08064842224121094, 0.08373260498046875, 0.08681678771972656, 0.08990097045898438, 0.09298515319824219, 0.0960693359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 7.0, 2.0, 8.0, 8.0, 19.0, 8.0, 19.0, 21.0, 24.0, 26.0, 26.0, 31.0, 27.0, 32.0, 40.0, 26.0, 33.0, 53.0, 35.0, 38.0, 31.0, 38.0, 42.0, 43.0, 45.0, 40.0, 24.0, 31.0, 30.0, 15.0, 29.0, 17.0, 15.0, 26.0, 14.0, 12.0, 11.0, 9.0, 7.0, 14.0, 6.0, 7.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.12359619140625, -0.11987113952636719, -0.11614608764648438, -0.11242103576660156, -0.10869598388671875, -0.10497093200683594, -0.10124588012695312, -0.09752082824707031, -0.0937957763671875, -0.09007072448730469, -0.08634567260742188, -0.08262062072753906, -0.07889556884765625, -0.07517051696777344, -0.07144546508789062, -0.06772041320800781, -0.063995361328125, -0.06027030944824219, -0.056545257568359375, -0.05282020568847656, -0.04909515380859375, -0.04537010192871094, -0.041645050048828125, -0.03791999816894531, -0.0341949462890625, -0.030469894409179688, -0.026744842529296875, -0.023019790649414062, -0.01929473876953125, -0.015569686889648438, -0.011844635009765625, -0.008119583129882812, -0.00439453125, -0.0006694793701171875, 0.003055572509765625, 0.0067806243896484375, 0.01050567626953125, 0.014230728149414062, 0.017955780029296875, 0.021680831909179688, 0.0254058837890625, 0.029130935668945312, 0.032855987548828125, 0.03658103942871094, 0.04030609130859375, 0.04403114318847656, 0.047756195068359375, 0.05148124694824219, 0.055206298828125, 0.05893135070800781, 0.06265640258789062, 0.06638145446777344, 0.07010650634765625, 0.07383155822753906, 0.07755661010742188, 0.08128166198730469, 0.0850067138671875, 0.08873176574707031, 0.09245681762695312, 0.09618186950683594, 0.09990692138671875, 0.10363197326660156, 0.10735702514648438, 0.11108207702636719, 0.11480712890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 7.0, 5.0, 13.0, 17.0, 26.0, 33.0, 42.0, 80.0, 137.0, 248.0, 432.0, 1027.0, 3214.0, 20402.0, 494755.0, 501831.0, 20924.0, 3253.0, 1063.0, 449.0, 233.0, 133.0, 73.0, 57.0, 26.0, 18.0, 19.0, 6.0, 15.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.049652099609375, -0.0482335090637207, -0.046814918518066406, -0.04539632797241211, -0.04397773742675781, -0.042559146881103516, -0.04114055633544922, -0.03972196578979492, -0.038303375244140625, -0.03688478469848633, -0.03546619415283203, -0.034047603607177734, -0.03262901306152344, -0.03121042251586914, -0.029791831970214844, -0.028373241424560547, -0.02695465087890625, -0.025536060333251953, -0.024117469787597656, -0.02269887924194336, -0.021280288696289062, -0.019861698150634766, -0.01844310760498047, -0.017024517059326172, -0.015605926513671875, -0.014187335968017578, -0.012768745422363281, -0.011350154876708984, -0.009931564331054688, -0.00851297378540039, -0.007094383239746094, -0.005675792694091797, -0.0042572021484375, -0.002838611602783203, -0.0014200210571289062, -1.430511474609375e-06, 0.0014171600341796875, 0.0028357505798339844, 0.004254341125488281, 0.005672931671142578, 0.007091522216796875, 0.008510112762451172, 0.009928703308105469, 0.011347293853759766, 0.012765884399414062, 0.01418447494506836, 0.015603065490722656, 0.017021656036376953, 0.01844024658203125, 0.019858837127685547, 0.021277427673339844, 0.02269601821899414, 0.024114608764648438, 0.025533199310302734, 0.02695178985595703, 0.028370380401611328, 0.029788970947265625, 0.031207561492919922, 0.03262615203857422, 0.034044742584228516, 0.03546333312988281, 0.03688192367553711, 0.038300514221191406, 0.0397191047668457, 0.0411376953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 13.0, 8.0, 14.0, 15.0, 32.0, 31.0, 39.0, 66.0, 63.0, 77.0, 107.0, 84.0, 82.0, 81.0, 61.0, 58.0, 40.0, 21.0, 31.0, 18.0, 13.0, 17.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.123283386230469e-05, -2.984795719385147e-05, -2.8463080525398254e-05, -2.7078203856945038e-05, -2.569332718849182e-05, -2.4308450520038605e-05, -2.2923573851585388e-05, -2.153869718313217e-05, -2.0153820514678955e-05, -1.876894384622574e-05, -1.7384067177772522e-05, -1.5999190509319305e-05, -1.4614313840866089e-05, -1.3229437172412872e-05, -1.1844560503959656e-05, -1.045968383550644e-05, -9.074807167053223e-06, -7.689930498600006e-06, -6.3050538301467896e-06, -4.920177161693573e-06, -3.5353004932403564e-06, -2.15042382478714e-06, -7.655471563339233e-07, 6.193295121192932e-07, 2.0042061805725098e-06, 3.3890828490257263e-06, 4.773959517478943e-06, 6.1588361859321594e-06, 7.543712854385376e-06, 8.928589522838593e-06, 1.0313466191291809e-05, 1.1698342859745026e-05, 1.3083219528198242e-05, 1.4468096196651459e-05, 1.5852972865104675e-05, 1.7237849533557892e-05, 1.862272620201111e-05, 2.0007602870464325e-05, 2.139247953891754e-05, 2.2777356207370758e-05, 2.4162232875823975e-05, 2.554710954427719e-05, 2.6931986212730408e-05, 2.8316862881183624e-05, 2.970173954963684e-05, 3.108661621809006e-05, 3.2471492886543274e-05, 3.385636955499649e-05, 3.524124622344971e-05, 3.6626122891902924e-05, 3.801099956035614e-05, 3.939587622880936e-05, 4.078075289726257e-05, 4.216562956571579e-05, 4.3550506234169006e-05, 4.493538290262222e-05, 4.632025957107544e-05, 4.7705136239528656e-05, 4.909001290798187e-05, 5.047488957643509e-05, 5.1859766244888306e-05, 5.324464291334152e-05, 5.462951958179474e-05, 5.6014396250247955e-05, 5.739927291870117e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 13.0, 24.0, 14.0, 25.0, 44.0, 55.0, 96.0, 140.0, 252.0, 458.0, 802.0, 1780.0, 4577.0, 21178.0, 193732.0, 710551.0, 95594.0, 12852.0, 3404.0, 1357.0, 626.0, 385.0, 216.0, 137.0, 78.0, 47.0, 31.0, 23.0, 16.0, 15.0, 9.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.037384033203125, -0.03629589080810547, -0.03520774841308594, -0.034119606018066406, -0.033031463623046875, -0.031943321228027344, -0.030855178833007812, -0.02976703643798828, -0.02867889404296875, -0.02759075164794922, -0.026502609252929688, -0.025414466857910156, -0.024326324462890625, -0.023238182067871094, -0.022150039672851562, -0.02106189727783203, -0.0199737548828125, -0.01888561248779297, -0.017797470092773438, -0.016709327697753906, -0.015621185302734375, -0.014533042907714844, -0.013444900512695312, -0.012356758117675781, -0.01126861572265625, -0.010180473327636719, -0.009092330932617188, -0.008004188537597656, -0.006916046142578125, -0.005827903747558594, -0.0047397613525390625, -0.0036516189575195312, -0.0025634765625, -0.0014753341674804688, -0.0003871917724609375, 0.0007009506225585938, 0.001789093017578125, 0.0028772354125976562, 0.0039653778076171875, 0.005053520202636719, 0.00614166259765625, 0.007229804992675781, 0.008317947387695312, 0.009406089782714844, 0.010494232177734375, 0.011582374572753906, 0.012670516967773438, 0.013758659362792969, 0.0148468017578125, 0.01593494415283203, 0.017023086547851562, 0.018111228942871094, 0.019199371337890625, 0.020287513732910156, 0.021375656127929688, 0.02246379852294922, 0.02355194091796875, 0.02464008331298828, 0.025728225708007812, 0.026816368103027344, 0.027904510498046875, 0.028992652893066406, 0.030080795288085938, 0.03116893768310547, 0.032257080078125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 8.0, 10.0, 11.0, 26.0, 31.0, 50.0, 79.0, 77.0, 115.0, 115.0, 100.0, 103.0, 70.0, 62.0, 43.0, 34.0, 17.0, 18.0, 8.0, 2.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.054046630859375, -0.052813053131103516, -0.05157947540283203, -0.05034589767456055, -0.04911231994628906, -0.04787874221801758, -0.046645164489746094, -0.04541158676147461, -0.044178009033203125, -0.04294443130493164, -0.041710853576660156, -0.04047727584838867, -0.03924369812011719, -0.0380101203918457, -0.03677654266357422, -0.035542964935302734, -0.03430938720703125, -0.033075809478759766, -0.03184223175048828, -0.030608654022216797, -0.029375076293945312, -0.028141498565673828, -0.026907920837402344, -0.02567434310913086, -0.024440765380859375, -0.02320718765258789, -0.021973609924316406, -0.020740032196044922, -0.019506454467773438, -0.018272876739501953, -0.01703929901123047, -0.015805721282958984, -0.0145721435546875, -0.013338565826416016, -0.012104988098144531, -0.010871410369873047, -0.009637832641601562, -0.008404254913330078, -0.007170677185058594, -0.005937099456787109, -0.004703521728515625, -0.0034699440002441406, -0.0022363662719726562, -0.0010027885437011719, 0.0002307891845703125, 0.0014643669128417969, 0.0026979446411132812, 0.003931522369384766, 0.00516510009765625, 0.006398677825927734, 0.007632255554199219, 0.008865833282470703, 0.010099411010742188, 0.011332988739013672, 0.012566566467285156, 0.01380014419555664, 0.015033721923828125, 0.01626729965209961, 0.017500877380371094, 0.018734455108642578, 0.019968032836914062, 0.021201610565185547, 0.02243518829345703, 0.023668766021728516, 0.02490234375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 49.0, 209.0, 414.0, 235.0, 66.0, 11.0, 6.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3151347637176514, -1.274859070777893, -1.2345833778381348, -1.1943076848983765, -1.1540319919586182, -1.1137561798095703, -1.0734806060791016, -1.0332047939300537, -0.9929291009902954, -0.9526534080505371, -0.9123777151107788, -0.8721020221710205, -0.8318262696266174, -0.7915505766868591, -0.7512748837471008, -0.7109991312026978, -0.6707234978675842, -0.6304478049278259, -0.5901721119880676, -0.5498963594436646, -0.5096206665039062, -0.46934497356414795, -0.42906928062438965, -0.38879355788230896, -0.34851786494255066, -0.30824217200279236, -0.26796644926071167, -0.22769075632095337, -0.18741504848003387, -0.14713934063911438, -0.10686364769935608, -0.06658792495727539, -0.02631223201751709, 0.013963472098112106, 0.0542391762137413, 0.0945148766040802, 0.1347905844449997, 0.1750662922859192, 0.2153419852256775, 0.2556177079677582, 0.2958934009075165, 0.3361690938472748, 0.37644481658935547, 0.41672050952911377, 0.45699620246887207, 0.49727192521095276, 0.5375475883483887, 0.5778233408927917, 0.61809903383255, 0.6583747267723083, 0.6986504197120667, 0.7389261722564697, 0.779201865196228, 0.8194775581359863, 0.8597532510757446, 0.9000289440155029, 0.9403046369552612, 0.9805803298950195, 1.0208560228347778, 1.0611317157745361, 1.1014074087142944, 1.1416831016540527, 1.1819589138031006, 1.2222346067428589, 1.2625102996826172]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 11.0, 8.0, 10.0, 14.0, 11.0, 16.0, 20.0, 27.0, 20.0, 29.0, 45.0, 58.0, 36.0, 46.0, 55.0, 52.0, 63.0, 56.0, 48.0, 44.0, 45.0, 40.0, 31.0, 23.0, 36.0, 23.0, 27.0, 21.0, 10.0, 15.0, 8.0, 11.0, 10.0, 8.0, 4.0, 5.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.6857761740684509, -0.6652608513832092, -0.6447454690933228, -0.624230146408081, -0.6037148237228394, -0.5831995010375977, -0.5626841187477112, -0.5421687960624695, -0.5216534733772278, -0.5011381506919861, -0.480622798204422, -0.4601074457168579, -0.4395921230316162, -0.4190767705440521, -0.39856141805648804, -0.37804609537124634, -0.35753074288368225, -0.33701539039611816, -0.31650006771087646, -0.2959847152233124, -0.2754693925380707, -0.2549540400505066, -0.2344387024641037, -0.2139233648777008, -0.1934080272912979, -0.17289268970489502, -0.15237735211849213, -0.13186201453208923, -0.11134666949510574, -0.09083133190870285, -0.07031598687171936, -0.04980064928531647, -0.029285311698913574, -0.008769972249865532, 0.01174536719918251, 0.0322607085108757, 0.052776046097278595, 0.07329138368368149, 0.09380672872066498, 0.11432206630706787, 0.13483740389347076, 0.15535274147987366, 0.17586807906627655, 0.19638341665267944, 0.21689876914024353, 0.23741409182548523, 0.2579294443130493, 0.278444766998291, 0.2989601194858551, 0.3194754719734192, 0.3399907946586609, 0.360506147146225, 0.3810214698314667, 0.40153682231903076, 0.42205214500427246, 0.44256749749183655, 0.46308284997940063, 0.4835982024669647, 0.5041135549545288, 0.5246288776397705, 0.5451442003250122, 0.5656595230102539, 0.5861749053001404, 0.6066902279853821, 0.6272055506706238]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 8.0, 10.0, 13.0, 28.0, 36.0, 62.0, 106.0, 189.0, 316.0, 702.0, 1648.0, 4609.0, 17390.0, 142462.0, 3889246.0, 115008.0, 15116.0, 4280.0, 1579.0, 672.0, 323.0, 184.0, 105.0, 70.0, 39.0, 20.0, 16.0, 9.0, 5.0, 6.0, 9.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.051544189453125, -0.049596309661865234, -0.04764842987060547, -0.0457005500793457, -0.04375267028808594, -0.04180479049682617, -0.039856910705566406, -0.03790903091430664, -0.035961151123046875, -0.03401327133178711, -0.032065391540527344, -0.030117511749267578, -0.028169631958007812, -0.026221752166748047, -0.02427387237548828, -0.022325992584228516, -0.02037811279296875, -0.018430233001708984, -0.01648235321044922, -0.014534473419189453, -0.012586593627929688, -0.010638713836669922, -0.008690834045410156, -0.006742954254150391, -0.004795074462890625, -0.0028471946716308594, -0.0008993148803710938, 0.0010485649108886719, 0.0029964447021484375, 0.004944324493408203, 0.006892204284667969, 0.008840084075927734, 0.0107879638671875, 0.012735843658447266, 0.014683723449707031, 0.016631603240966797, 0.018579483032226562, 0.020527362823486328, 0.022475242614746094, 0.02442312240600586, 0.026371002197265625, 0.02831888198852539, 0.030266761779785156, 0.03221464157104492, 0.03416252136230469, 0.03611040115356445, 0.03805828094482422, 0.040006160736083984, 0.04195404052734375, 0.043901920318603516, 0.04584980010986328, 0.04779767990112305, 0.04974555969238281, 0.05169343948364258, 0.053641319274902344, 0.05558919906616211, 0.057537078857421875, 0.05948495864868164, 0.061432838439941406, 0.06338071823120117, 0.06532859802246094, 0.0672764778137207, 0.06922435760498047, 0.07117223739624023, 0.0731201171875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 7.0, 10.0, 19.0, 14.0, 16.0, 31.0, 30.0, 28.0, 56.0, 56.0, 61.0, 65.0, 79.0, 83.0, 75.0, 70.0, 62.0, 53.0, 46.0, 32.0, 27.0, 22.0, 21.0, 10.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.057647705078125, -0.05605316162109375, -0.0544586181640625, -0.05286407470703125, -0.05126953125, -0.04967498779296875, -0.0480804443359375, -0.04648590087890625, -0.044891357421875, -0.04329681396484375, -0.0417022705078125, -0.04010772705078125, -0.03851318359375, -0.03691864013671875, -0.0353240966796875, -0.03372955322265625, -0.032135009765625, -0.03054046630859375, -0.0289459228515625, -0.02735137939453125, -0.0257568359375, -0.02416229248046875, -0.0225677490234375, -0.02097320556640625, -0.019378662109375, -0.01778411865234375, -0.0161895751953125, -0.01459503173828125, -0.01300048828125, -0.01140594482421875, -0.0098114013671875, -0.00821685791015625, -0.006622314453125, -0.00502777099609375, -0.0034332275390625, -0.00183868408203125, -0.000244140625, 0.00135040283203125, 0.0029449462890625, 0.00453948974609375, 0.006134033203125, 0.00772857666015625, 0.0093231201171875, 0.01091766357421875, 0.01251220703125, 0.01410675048828125, 0.0157012939453125, 0.01729583740234375, 0.018890380859375, 0.02048492431640625, 0.0220794677734375, 0.02367401123046875, 0.0252685546875, 0.02686309814453125, 0.0284576416015625, 0.03005218505859375, 0.031646728515625, 0.03324127197265625, 0.0348358154296875, 0.03643035888671875, 0.03802490234375, 0.03961944580078125, 0.0412139892578125, 0.04280853271484375, 0.044403076171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 10.0, 8.0, 13.0, 21.0, 36.0, 65.0, 80.0, 120.0, 197.0, 347.0, 735.0, 1755.0, 5926.0, 25530.0, 253545.0, 3761605.0, 120472.0, 16729.0, 4218.0, 1481.0, 598.0, 276.0, 160.0, 111.0, 66.0, 42.0, 39.0, 18.0, 28.0, 12.0, 15.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052581787109375, -0.05042409896850586, -0.04826641082763672, -0.04610872268676758, -0.04395103454589844, -0.0417933464050293, -0.039635658264160156, -0.037477970123291016, -0.035320281982421875, -0.033162593841552734, -0.031004905700683594, -0.028847217559814453, -0.026689529418945312, -0.024531841278076172, -0.02237415313720703, -0.02021646499633789, -0.01805877685546875, -0.01590108871459961, -0.013743400573730469, -0.011585712432861328, -0.009428024291992188, -0.007270336151123047, -0.005112648010253906, -0.0029549598693847656, -0.000797271728515625, 0.0013604164123535156, 0.0035181045532226562, 0.005675792694091797, 0.007833480834960938, 0.009991168975830078, 0.012148857116699219, 0.01430654525756836, 0.0164642333984375, 0.01862192153930664, 0.02077960968017578, 0.022937297821044922, 0.025094985961914062, 0.027252674102783203, 0.029410362243652344, 0.031568050384521484, 0.033725738525390625, 0.035883426666259766, 0.038041114807128906, 0.04019880294799805, 0.04235649108886719, 0.04451417922973633, 0.04667186737060547, 0.04882955551147461, 0.05098724365234375, 0.05314493179321289, 0.05530261993408203, 0.05746030807495117, 0.05961799621582031, 0.06177568435668945, 0.0639333724975586, 0.06609106063842773, 0.06824874877929688, 0.07040643692016602, 0.07256412506103516, 0.0747218132019043, 0.07687950134277344, 0.07903718948364258, 0.08119487762451172, 0.08335256576538086, 0.08551025390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 13.0, 23.0, 34.0, 70.0, 188.0, 518.0, 2428.0, 475.0, 148.0, 71.0, 40.0, 20.0, 13.0, 11.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0226898193359375, -0.02146172523498535, -0.020233631134033203, -0.019005537033081055, -0.017777442932128906, -0.016549348831176758, -0.01532125473022461, -0.014093160629272461, -0.012865066528320312, -0.011636972427368164, -0.010408878326416016, -0.009180784225463867, -0.007952690124511719, -0.00672459602355957, -0.005496501922607422, -0.0042684078216552734, -0.003040313720703125, -0.0018122196197509766, -0.0005841255187988281, 0.0006439685821533203, 0.0018720626831054688, 0.003100156784057617, 0.004328250885009766, 0.005556344985961914, 0.0067844390869140625, 0.008012533187866211, 0.00924062728881836, 0.010468721389770508, 0.011696815490722656, 0.012924909591674805, 0.014153003692626953, 0.015381097793579102, 0.01660919189453125, 0.0178372859954834, 0.019065380096435547, 0.020293474197387695, 0.021521568298339844, 0.022749662399291992, 0.02397775650024414, 0.02520585060119629, 0.026433944702148438, 0.027662038803100586, 0.028890132904052734, 0.030118227005004883, 0.03134632110595703, 0.03257441520690918, 0.03380250930786133, 0.03503060340881348, 0.036258697509765625, 0.03748679161071777, 0.03871488571166992, 0.03994297981262207, 0.04117107391357422, 0.04239916801452637, 0.043627262115478516, 0.044855356216430664, 0.04608345031738281, 0.04731154441833496, 0.04853963851928711, 0.04976773262023926, 0.050995826721191406, 0.052223920822143555, 0.0534520149230957, 0.05468010902404785, 0.055908203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 13.0, 26.0, 57.0, 183.0, 318.0, 238.0, 103.0, 42.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34272754192352295, -0.33314183354377747, -0.323556125164032, -0.3139704465866089, -0.3043847382068634, -0.2947990298271179, -0.28521332144737244, -0.27562761306762695, -0.26604193449020386, -0.2564562261104584, -0.24687053263187408, -0.2372848242521286, -0.2276991307735443, -0.21811342239379883, -0.20852771401405334, -0.19894200563430786, -0.18935629725456238, -0.1797705888748169, -0.1701848953962326, -0.16059918701648712, -0.15101349353790283, -0.14142778515815735, -0.13184207677841187, -0.12225637584924698, -0.11267067492008209, -0.1030849739909172, -0.09349927306175232, -0.08391356468200684, -0.07432786375284195, -0.06474216282367706, -0.05515645816922188, -0.04557075351476669, -0.03598505258560181, -0.02639934979379177, -0.016813647001981735, -0.0072279442101716995, 0.002357758581638336, 0.011943459510803223, 0.021529164165258408, 0.031114868819713593, 0.04070056974887848, 0.050286270678043365, 0.05987197533249855, 0.06945767998695374, 0.07904338091611862, 0.08862908184528351, 0.09821479022502899, 0.10780049115419388, 0.11738619208335876, 0.12697190046310425, 0.13655759394168854, 0.14614330232143402, 0.1557289958000183, 0.1653147041797638, 0.17490041255950928, 0.18448612093925476, 0.19407181441783905, 0.20365752279758453, 0.21324321627616882, 0.2228289246559143, 0.2324146330356598, 0.24200032651424408, 0.25158601999282837, 0.26117172837257385, 0.27075743675231934]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 3.0, 3.0, 7.0, 10.0, 13.0, 7.0, 10.0, 11.0, 15.0, 12.0, 24.0, 33.0, 25.0, 35.0, 33.0, 33.0, 40.0, 34.0, 46.0, 47.0, 39.0, 40.0, 43.0, 53.0, 48.0, 46.0, 34.0, 39.0, 22.0, 30.0, 20.0, 29.0, 17.0, 16.0, 18.0, 11.0, 12.0, 7.0, 9.0, 12.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.06841188669204712, -0.06619738042354584, -0.06398288160562515, -0.06176837533712387, -0.05955387279391289, -0.057339370250701904, -0.05512486398220062, -0.05291036143898964, -0.050695858895778656, -0.04848135635256767, -0.04626685380935669, -0.04405234754085541, -0.041837844997644424, -0.03962334245443344, -0.03740883618593216, -0.035194333642721176, -0.03297983109951019, -0.03076532855629921, -0.028550824150443077, -0.026336319744586945, -0.02412181720137596, -0.021907314658164978, -0.019692810252308846, -0.017478305846452713, -0.01526380330324173, -0.013049299828708172, -0.010834796354174614, -0.008620292879641056, -0.006405789405107498, -0.00419128593057394, -0.0019767824560403824, 0.0002377210184931755, 0.0024522244930267334, 0.004666727967560291, 0.006881231442093849, 0.009095734916627407, 0.011310238391160965, 0.013524741865694523, 0.01573924534022808, 0.017953749746084213, 0.020168252289295197, 0.02238275483250618, 0.024597259238362312, 0.026811763644218445, 0.029026266187429428, 0.03124076873064041, 0.03345527499914169, 0.035669777542352676, 0.03788428008556366, 0.04009878262877464, 0.042313285171985626, 0.04452779144048691, 0.04674229398369789, 0.048956796526908875, 0.051171302795410156, 0.05338580533862114, 0.05560030788183212, 0.057814810425043106, 0.06002931296825409, 0.06224381923675537, 0.06445832550525665, 0.06667282432317734, 0.06888733059167862, 0.0711018294095993, 0.07331633567810059]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 10.0, 5.0, 6.0, 15.0, 19.0, 32.0, 47.0, 68.0, 116.0, 179.0, 352.0, 687.0, 1648.0, 4407.0, 15807.0, 74925.0, 355926.0, 452292.0, 109728.0, 22506.0, 5919.0, 2016.0, 844.0, 401.0, 238.0, 123.0, 72.0, 49.0, 39.0, 29.0, 18.0, 9.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058258056640625, -0.05644416809082031, -0.054630279541015625, -0.05281639099121094, -0.05100250244140625, -0.04918861389160156, -0.047374725341796875, -0.04556083679199219, -0.0437469482421875, -0.04193305969238281, -0.040119171142578125, -0.03830528259277344, -0.03649139404296875, -0.03467750549316406, -0.032863616943359375, -0.031049728393554688, -0.02923583984375, -0.027421951293945312, -0.025608062744140625, -0.023794174194335938, -0.02198028564453125, -0.020166397094726562, -0.018352508544921875, -0.016538619995117188, -0.0147247314453125, -0.012910842895507812, -0.011096954345703125, -0.009283065795898438, -0.00746917724609375, -0.0056552886962890625, -0.003841400146484375, -0.0020275115966796875, -0.000213623046875, 0.0016002655029296875, 0.003414154052734375, 0.0052280426025390625, 0.00704193115234375, 0.008855819702148438, 0.010669708251953125, 0.012483596801757812, 0.0142974853515625, 0.016111373901367188, 0.017925262451171875, 0.019739151000976562, 0.02155303955078125, 0.023366928100585938, 0.025180816650390625, 0.026994705200195312, 0.02880859375, 0.030622482299804688, 0.032436370849609375, 0.03425025939941406, 0.03606414794921875, 0.03787803649902344, 0.039691925048828125, 0.04150581359863281, 0.0433197021484375, 0.04513359069824219, 0.046947479248046875, 0.04876136779785156, 0.05057525634765625, 0.05238914489746094, 0.054203033447265625, 0.05601692199707031, 0.057830810546875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 16.0, 19.0, 23.0, 31.0, 46.0, 39.0, 59.0, 61.0, 74.0, 57.0, 68.0, 89.0, 61.0, 71.0, 49.0, 52.0, 39.0, 25.0, 28.0, 19.0, 10.0, 11.0, 11.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0537109375, -0.05210685729980469, -0.050502777099609375, -0.04889869689941406, -0.04729461669921875, -0.04569053649902344, -0.044086456298828125, -0.04248237609863281, -0.0408782958984375, -0.03927421569824219, -0.037670135498046875, -0.03606605529785156, -0.03446197509765625, -0.03285789489746094, -0.031253814697265625, -0.029649734497070312, -0.028045654296875, -0.026441574096679688, -0.024837493896484375, -0.023233413696289062, -0.02162933349609375, -0.020025253295898438, -0.018421173095703125, -0.016817092895507812, -0.0152130126953125, -0.013608932495117188, -0.012004852294921875, -0.010400772094726562, -0.00879669189453125, -0.0071926116943359375, -0.005588531494140625, -0.0039844512939453125, -0.00238037109375, -0.0007762908935546875, 0.000827789306640625, 0.0024318695068359375, 0.00403594970703125, 0.0056400299072265625, 0.007244110107421875, 0.008848190307617188, 0.0104522705078125, 0.012056350708007812, 0.013660430908203125, 0.015264511108398438, 0.01686859130859375, 0.018472671508789062, 0.020076751708984375, 0.021680831909179688, 0.023284912109375, 0.024888992309570312, 0.026493072509765625, 0.028097152709960938, 0.02970123291015625, 0.03130531311035156, 0.032909393310546875, 0.03451347351074219, 0.0361175537109375, 0.03772163391113281, 0.039325714111328125, 0.04092979431152344, 0.04253387451171875, 0.04413795471191406, 0.045742034912109375, 0.04734611511230469, 0.0489501953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 13.0, 19.0, 28.0, 37.0, 52.0, 72.0, 101.0, 156.0, 237.0, 423.0, 682.0, 1214.0, 2698.0, 10614.0, 117274.0, 786551.0, 112165.0, 10509.0, 2741.0, 1180.0, 617.0, 365.0, 260.0, 163.0, 122.0, 66.0, 60.0, 34.0, 27.0, 24.0, 9.0, 6.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.069091796875, -0.06638145446777344, -0.06367111206054688, -0.06096076965332031, -0.05825042724609375, -0.05554008483886719, -0.052829742431640625, -0.05011940002441406, -0.0474090576171875, -0.04469871520996094, -0.041988372802734375, -0.03927803039550781, -0.03656768798828125, -0.03385734558105469, -0.031147003173828125, -0.028436660766601562, -0.025726318359375, -0.023015975952148438, -0.020305633544921875, -0.017595291137695312, -0.01488494873046875, -0.012174606323242188, -0.009464263916015625, -0.0067539215087890625, -0.0040435791015625, -0.0013332366943359375, 0.001377105712890625, 0.0040874481201171875, 0.00679779052734375, 0.009508132934570312, 0.012218475341796875, 0.014928817749023438, 0.01763916015625, 0.020349502563476562, 0.023059844970703125, 0.025770187377929688, 0.02848052978515625, 0.031190872192382812, 0.033901214599609375, 0.03661155700683594, 0.0393218994140625, 0.04203224182128906, 0.044742584228515625, 0.04745292663574219, 0.05016326904296875, 0.05287361145019531, 0.055583953857421875, 0.05829429626464844, 0.061004638671875, 0.06371498107910156, 0.06642532348632812, 0.06913566589355469, 0.07184600830078125, 0.07455635070800781, 0.07726669311523438, 0.07997703552246094, 0.0826873779296875, 0.08539772033691406, 0.08810806274414062, 0.09081840515136719, 0.09352874755859375, 0.09623908996582031, 0.09894943237304688, 0.10165977478027344, 0.1043701171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 11.0, 3.0, 5.0, 13.0, 7.0, 11.0, 19.0, 12.0, 22.0, 20.0, 20.0, 17.0, 28.0, 37.0, 25.0, 38.0, 31.0, 44.0, 33.0, 36.0, 48.0, 47.0, 43.0, 34.0, 33.0, 47.0, 43.0, 28.0, 38.0, 26.0, 16.0, 24.0, 20.0, 23.0, 14.0, 18.0, 6.0, 12.0, 5.0, 10.0, 10.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.11749267578125, -0.11390972137451172, -0.11032676696777344, -0.10674381256103516, -0.10316085815429688, -0.0995779037475586, -0.09599494934082031, -0.09241199493408203, -0.08882904052734375, -0.08524608612060547, -0.08166313171386719, -0.0780801773071289, -0.07449722290039062, -0.07091426849365234, -0.06733131408691406, -0.06374835968017578, -0.0601654052734375, -0.05658245086669922, -0.05299949645996094, -0.049416542053222656, -0.045833587646484375, -0.042250633239746094, -0.03866767883300781, -0.03508472442626953, -0.03150177001953125, -0.02791881561279297, -0.024335861206054688, -0.020752906799316406, -0.017169952392578125, -0.013586997985839844, -0.010004043579101562, -0.006421089172363281, -0.002838134765625, 0.0007448196411132812, 0.0043277740478515625, 0.007910728454589844, 0.011493682861328125, 0.015076637268066406, 0.018659591674804688, 0.02224254608154297, 0.02582550048828125, 0.02940845489501953, 0.03299140930175781, 0.036574363708496094, 0.040157318115234375, 0.043740272521972656, 0.04732322692871094, 0.05090618133544922, 0.0544891357421875, 0.05807209014892578, 0.06165504455566406, 0.06523799896240234, 0.06882095336914062, 0.0724039077758789, 0.07598686218261719, 0.07956981658935547, 0.08315277099609375, 0.08673572540283203, 0.09031867980957031, 0.0939016342163086, 0.09748458862304688, 0.10106754302978516, 0.10465049743652344, 0.10823345184326172, 0.11181640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 20.0, 27.0, 53.0, 108.0, 224.0, 598.0, 1778.0, 11270.0, 282832.0, 726540.0, 21256.0, 2552.0, 730.0, 297.0, 120.0, 50.0, 35.0, 17.0, 15.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046478271484375, -0.04482555389404297, -0.04317283630371094, -0.041520118713378906, -0.039867401123046875, -0.038214683532714844, -0.03656196594238281, -0.03490924835205078, -0.03325653076171875, -0.03160381317138672, -0.029951095581054688, -0.028298377990722656, -0.026645660400390625, -0.024992942810058594, -0.023340225219726562, -0.02168750762939453, -0.0200347900390625, -0.01838207244873047, -0.016729354858398438, -0.015076637268066406, -0.013423919677734375, -0.011771202087402344, -0.010118484497070312, -0.008465766906738281, -0.00681304931640625, -0.005160331726074219, -0.0035076141357421875, -0.0018548965454101562, -0.000202178955078125, 0.0014505386352539062, 0.0031032562255859375, 0.004755973815917969, 0.00640869140625, 0.008061408996582031, 0.009714126586914062, 0.011366844177246094, 0.013019561767578125, 0.014672279357910156, 0.016324996948242188, 0.01797771453857422, 0.01963043212890625, 0.02128314971923828, 0.022935867309570312, 0.024588584899902344, 0.026241302490234375, 0.027894020080566406, 0.029546737670898438, 0.03119945526123047, 0.0328521728515625, 0.03450489044189453, 0.03615760803222656, 0.037810325622558594, 0.039463043212890625, 0.041115760803222656, 0.04276847839355469, 0.04442119598388672, 0.04607391357421875, 0.04772663116455078, 0.04937934875488281, 0.051032066345214844, 0.052684783935546875, 0.054337501525878906, 0.05599021911621094, 0.05764293670654297, 0.059295654296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 9.0, 3.0, 4.0, 9.0, 8.0, 11.0, 16.0, 16.0, 20.0, 17.0, 39.0, 46.0, 47.0, 47.0, 70.0, 77.0, 96.0, 73.0, 76.0, 43.0, 52.0, 39.0, 30.0, 28.0, 16.0, 18.0, 18.0, 17.0, 16.0, 6.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-4.6312808990478516e-05, -4.511140286922455e-05, -4.390999674797058e-05, -4.2708590626716614e-05, -4.1507184505462646e-05, -4.030577838420868e-05, -3.910437226295471e-05, -3.7902966141700745e-05, -3.670156002044678e-05, -3.550015389919281e-05, -3.429874777793884e-05, -3.3097341656684875e-05, -3.189593553543091e-05, -3.069452941417694e-05, -2.9493123292922974e-05, -2.8291717171669006e-05, -2.709031105041504e-05, -2.5888904929161072e-05, -2.4687498807907104e-05, -2.3486092686653137e-05, -2.228468656539917e-05, -2.1083280444145203e-05, -1.9881874322891235e-05, -1.8680468201637268e-05, -1.74790620803833e-05, -1.6277655959129333e-05, -1.5076249837875366e-05, -1.3874843716621399e-05, -1.2673437595367432e-05, -1.1472031474113464e-05, -1.0270625352859497e-05, -9.06921923160553e-06, -7.867813110351562e-06, -6.666406989097595e-06, -5.465000867843628e-06, -4.263594746589661e-06, -3.0621886253356934e-06, -1.860782504081726e-06, -6.593763828277588e-07, 5.420297384262085e-07, 1.7434358596801758e-06, 2.944841980934143e-06, 4.14624810218811e-06, 5.347654223442078e-06, 6.549060344696045e-06, 7.750466465950012e-06, 8.95187258720398e-06, 1.0153278708457947e-05, 1.1354684829711914e-05, 1.2556090950965881e-05, 1.3757497072219849e-05, 1.4958903193473816e-05, 1.6160309314727783e-05, 1.736171543598175e-05, 1.8563121557235718e-05, 1.9764527678489685e-05, 2.0965933799743652e-05, 2.216733992099762e-05, 2.3368746042251587e-05, 2.4570152163505554e-05, 2.577155828475952e-05, 2.697296440601349e-05, 2.8174370527267456e-05, 2.9375776648521423e-05, 3.057718276977539e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 6.0, 27.0, 30.0, 54.0, 106.0, 243.0, 497.0, 1212.0, 4064.0, 32298.0, 772389.0, 221378.0, 12286.0, 2431.0, 809.0, 357.0, 161.0, 88.0, 40.0, 37.0, 12.0, 5.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.073974609375, -0.07228565216064453, -0.07059669494628906, -0.0689077377319336, -0.06721878051757812, -0.06552982330322266, -0.06384086608886719, -0.06215190887451172, -0.06046295166015625, -0.05877399444580078, -0.05708503723144531, -0.055396080017089844, -0.053707122802734375, -0.052018165588378906, -0.05032920837402344, -0.04864025115966797, -0.0469512939453125, -0.04526233673095703, -0.04357337951660156, -0.041884422302246094, -0.040195465087890625, -0.038506507873535156, -0.03681755065917969, -0.03512859344482422, -0.03343963623046875, -0.03175067901611328, -0.030061721801757812, -0.028372764587402344, -0.026683807373046875, -0.024994850158691406, -0.023305892944335938, -0.02161693572998047, -0.019927978515625, -0.01823902130126953, -0.016550064086914062, -0.014861106872558594, -0.013172149658203125, -0.011483192443847656, -0.009794235229492188, -0.008105278015136719, -0.00641632080078125, -0.004727363586425781, -0.0030384063720703125, -0.0013494491577148438, 0.000339508056640625, 0.0020284652709960938, 0.0037174224853515625, 0.005406379699707031, 0.0070953369140625, 0.008784294128417969, 0.010473251342773438, 0.012162208557128906, 0.013851165771484375, 0.015540122985839844, 0.017229080200195312, 0.01891803741455078, 0.02060699462890625, 0.02229595184326172, 0.023984909057617188, 0.025673866271972656, 0.027362823486328125, 0.029051780700683594, 0.030740737915039062, 0.03242969512939453, 0.03411865234375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 6.0, 10.0, 10.0, 17.0, 25.0, 23.0, 32.0, 41.0, 49.0, 72.0, 69.0, 89.0, 101.0, 91.0, 85.0, 69.0, 47.0, 36.0, 24.0, 24.0, 14.0, 8.0, 19.0, 7.0, 11.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0277252197265625, -0.02681255340576172, -0.025899887084960938, -0.024987220764160156, -0.024074554443359375, -0.023161888122558594, -0.022249221801757812, -0.02133655548095703, -0.02042388916015625, -0.01951122283935547, -0.018598556518554688, -0.017685890197753906, -0.016773223876953125, -0.015860557556152344, -0.014947891235351562, -0.014035224914550781, -0.01312255859375, -0.012209892272949219, -0.011297225952148438, -0.010384559631347656, -0.009471893310546875, -0.008559226989746094, -0.0076465606689453125, -0.006733894348144531, -0.00582122802734375, -0.004908561706542969, -0.0039958953857421875, -0.0030832290649414062, -0.002170562744140625, -0.0012578964233398438, -0.0003452301025390625, 0.0005674362182617188, 0.0014801025390625, 0.0023927688598632812, 0.0033054351806640625, 0.004218101501464844, 0.005130767822265625, 0.006043434143066406, 0.0069561004638671875, 0.007868766784667969, 0.00878143310546875, 0.009694099426269531, 0.010606765747070312, 0.011519432067871094, 0.012432098388671875, 0.013344764709472656, 0.014257431030273438, 0.015170097351074219, 0.016082763671875, 0.01699542999267578, 0.017908096313476562, 0.018820762634277344, 0.019733428955078125, 0.020646095275878906, 0.021558761596679688, 0.02247142791748047, 0.02338409423828125, 0.02429676055908203, 0.025209426879882812, 0.026122093200683594, 0.027034759521484375, 0.027947425842285156, 0.028860092163085938, 0.02977275848388672, 0.0306854248046875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 16.0, 22.0, 33.0, 91.0, 156.0, 207.0, 175.0, 141.0, 62.0, 35.0, 25.0, 9.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8469991683959961, -0.8262155055999756, -0.8054319024085999, -0.7846482396125793, -0.7638646364212036, -0.7430809736251831, -0.7222973704338074, -0.7015137076377869, -0.6807301044464111, -0.6599464416503906, -0.6391628384590149, -0.6183791756629944, -0.5975955724716187, -0.5768119096755981, -0.5560283064842224, -0.5352446436882019, -0.5144609808921814, -0.4936773478984833, -0.47289371490478516, -0.45211008191108704, -0.4313264489173889, -0.4105427861213684, -0.3897591531276703, -0.36897552013397217, -0.34819188714027405, -0.3274082541465759, -0.3066246211528778, -0.2858409881591797, -0.2650573253631592, -0.24427370727062225, -0.22349005937576294, -0.20270642638206482, -0.1819227933883667, -0.16113916039466858, -0.14035552740097046, -0.11957187950611115, -0.09878824651241302, -0.0780046135187149, -0.05722097307443619, -0.03643733263015747, -0.01565369963645935, 0.005129937082529068, 0.025913573801517487, 0.046697210520505905, 0.06748084723949432, 0.08826448023319244, 0.10904812067747116, 0.12983176112174988, 0.150615394115448, 0.17139902710914612, 0.19218266010284424, 0.21296630799770355, 0.23374994099140167, 0.254533588886261, 0.2753172218799591, 0.2961008548736572, 0.31688448786735535, 0.33766812086105347, 0.3584517538547516, 0.3792353868484497, 0.4000190496444702, 0.42080265283584595, 0.44158631563186646, 0.4623699486255646, 0.4831535816192627]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 2.0, 9.0, 5.0, 17.0, 13.0, 17.0, 25.0, 35.0, 20.0, 49.0, 51.0, 57.0, 59.0, 67.0, 51.0, 58.0, 58.0, 71.0, 51.0, 43.0, 42.0, 42.0, 36.0, 26.0, 24.0, 21.0, 13.0, 8.0, 10.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7940049171447754, -0.7720876336097717, -0.7501704096794128, -0.7282531261444092, -0.7063358426094055, -0.6844185590744019, -0.662501335144043, -0.6405840516090393, -0.6186667680740356, -0.596749484539032, -0.5748322606086731, -0.5529149770736694, -0.5309976935386658, -0.5090804100036621, -0.4871631860733032, -0.46524590253829956, -0.4433286488056183, -0.421411395072937, -0.39949411153793335, -0.3775768578052521, -0.3556595742702484, -0.33374232053756714, -0.3118250370025635, -0.2899077832698822, -0.2679905295372009, -0.24607326090335846, -0.224155992269516, -0.20223873853683472, -0.18032145500183105, -0.15840420126914978, -0.1364869326353073, -0.11456966400146484, -0.09265238046646118, -0.07073511183261871, -0.048817846924066544, -0.026900582015514374, -0.0049833133816719055, 0.016933955252170563, 0.038851216435432434, 0.0607684850692749, 0.08268575370311737, 0.10460302233695984, 0.1265202909708023, 0.14843755960464478, 0.17035481333732605, 0.1922720968723297, 0.214189350605011, 0.23610661923885345, 0.2580238878726959, 0.2799411416053772, 0.30185842514038086, 0.32377567887306213, 0.3456929624080658, 0.36761021614074707, 0.38952749967575073, 0.411444753408432, 0.4333620071411133, 0.45527926087379456, 0.4771965444087982, 0.4991137981414795, 0.5210310816764832, 0.5429483652114868, 0.5648655891418457, 0.5867828726768494, 0.608700156211853]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 9.0, 3.0, 12.0, 16.0, 17.0, 31.0, 30.0, 39.0, 79.0, 147.0, 204.0, 359.0, 575.0, 1044.0, 2041.0, 4351.0, 10370.0, 32415.0, 174063.0, 2167367.0, 1612992.0, 141956.0, 28622.0, 9581.0, 3874.0, 1776.0, 957.0, 524.0, 287.0, 199.0, 104.0, 72.0, 56.0, 43.0, 21.0, 11.0, 11.0, 8.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.046173095703125, -0.04477119445800781, -0.043369293212890625, -0.04196739196777344, -0.04056549072265625, -0.03916358947753906, -0.037761688232421875, -0.03635978698730469, -0.0349578857421875, -0.03355598449707031, -0.032154083251953125, -0.030752182006835938, -0.02935028076171875, -0.027948379516601562, -0.026546478271484375, -0.025144577026367188, -0.02374267578125, -0.022340774536132812, -0.020938873291015625, -0.019536972045898438, -0.01813507080078125, -0.016733169555664062, -0.015331268310546875, -0.013929367065429688, -0.0125274658203125, -0.011125564575195312, -0.009723663330078125, -0.008321762084960938, -0.00691986083984375, -0.0055179595947265625, -0.004116058349609375, -0.0027141571044921875, -0.001312255859375, 8.96453857421875e-05, 0.001491546630859375, 0.0028934478759765625, 0.00429534912109375, 0.0056972503662109375, 0.007099151611328125, 0.008501052856445312, 0.0099029541015625, 0.011304855346679688, 0.012706756591796875, 0.014108657836914062, 0.01551055908203125, 0.016912460327148438, 0.018314361572265625, 0.019716262817382812, 0.0211181640625, 0.022520065307617188, 0.023921966552734375, 0.025323867797851562, 0.02672576904296875, 0.028127670288085938, 0.029529571533203125, 0.030931472778320312, 0.0323333740234375, 0.03373527526855469, 0.035137176513671875, 0.03653907775878906, 0.03794097900390625, 0.03934288024902344, 0.040744781494140625, 0.04214668273925781, 0.043548583984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 18.0, 11.0, 17.0, 14.0, 27.0, 36.0, 39.0, 45.0, 62.0, 57.0, 58.0, 82.0, 76.0, 59.0, 72.0, 56.0, 58.0, 58.0, 32.0, 30.0, 16.0, 19.0, 13.0, 10.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.055572509765625, -0.05407524108886719, -0.052577972412109375, -0.05108070373535156, -0.04958343505859375, -0.04808616638183594, -0.046588897705078125, -0.04509162902832031, -0.0435943603515625, -0.04209709167480469, -0.040599822998046875, -0.03910255432128906, -0.03760528564453125, -0.03610801696777344, -0.034610748291015625, -0.03311347961425781, -0.0316162109375, -0.030118942260742188, -0.028621673583984375, -0.027124404907226562, -0.02562713623046875, -0.024129867553710938, -0.022632598876953125, -0.021135330200195312, -0.0196380615234375, -0.018140792846679688, -0.016643524169921875, -0.015146255493164062, -0.01364898681640625, -0.012151718139648438, -0.010654449462890625, -0.009157180786132812, -0.007659912109375, -0.0061626434326171875, -0.004665374755859375, -0.0031681060791015625, -0.00167083740234375, -0.0001735687255859375, 0.001323699951171875, 0.0028209686279296875, 0.0043182373046875, 0.0058155059814453125, 0.007312774658203125, 0.008810043334960938, 0.01030731201171875, 0.011804580688476562, 0.013301849365234375, 0.014799118041992188, 0.01629638671875, 0.017793655395507812, 0.019290924072265625, 0.020788192749023438, 0.02228546142578125, 0.023782730102539062, 0.025279998779296875, 0.026777267456054688, 0.0282745361328125, 0.029771804809570312, 0.031269073486328125, 0.03276634216308594, 0.03426361083984375, 0.03576087951660156, 0.037258148193359375, 0.03875541687011719, 0.040252685546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 6.0, 12.0, 18.0, 22.0, 33.0, 55.0, 77.0, 188.0, 559.0, 2612.0, 17085.0, 297292.0, 3783271.0, 82466.0, 8264.0, 1538.0, 393.0, 169.0, 69.0, 37.0, 27.0, 13.0, 23.0, 10.0, 4.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.113525390625, -0.11031150817871094, -0.10709762573242188, -0.10388374328613281, -0.10066986083984375, -0.09745597839355469, -0.09424209594726562, -0.09102821350097656, -0.0878143310546875, -0.08460044860839844, -0.08138656616210938, -0.07817268371582031, -0.07495880126953125, -0.07174491882324219, -0.06853103637695312, -0.06531715393066406, -0.062103271484375, -0.05888938903808594, -0.055675506591796875, -0.05246162414550781, -0.04924774169921875, -0.04603385925292969, -0.042819976806640625, -0.03960609436035156, -0.0363922119140625, -0.03317832946777344, -0.029964447021484375, -0.026750564575195312, -0.02353668212890625, -0.020322799682617188, -0.017108917236328125, -0.013895034790039062, -0.01068115234375, -0.0074672698974609375, -0.004253387451171875, -0.0010395050048828125, 0.00217437744140625, 0.0053882598876953125, 0.008602142333984375, 0.011816024780273438, 0.0150299072265625, 0.018243789672851562, 0.021457672119140625, 0.024671554565429688, 0.02788543701171875, 0.031099319458007812, 0.034313201904296875, 0.03752708435058594, 0.040740966796875, 0.04395484924316406, 0.047168731689453125, 0.05038261413574219, 0.05359649658203125, 0.05681037902832031, 0.060024261474609375, 0.06323814392089844, 0.0664520263671875, 0.06966590881347656, 0.07287979125976562, 0.07609367370605469, 0.07930755615234375, 0.08252143859863281, 0.08573532104492188, 0.08894920349121094, 0.0921630859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 9.0, 9.0, 14.0, 16.0, 23.0, 29.0, 61.0, 100.0, 159.0, 342.0, 666.0, 969.0, 764.0, 416.0, 207.0, 92.0, 58.0, 39.0, 26.0, 12.0, 12.0, 14.0, 7.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06787109375, -0.06557655334472656, -0.06328201293945312, -0.06098747253417969, -0.05869293212890625, -0.05639839172363281, -0.054103851318359375, -0.05180931091308594, -0.0495147705078125, -0.04722023010253906, -0.044925689697265625, -0.04263114929199219, -0.04033660888671875, -0.03804206848144531, -0.035747528076171875, -0.03345298767089844, -0.031158447265625, -0.028863906860351562, -0.026569366455078125, -0.024274826049804688, -0.02198028564453125, -0.019685745239257812, -0.017391204833984375, -0.015096664428710938, -0.0128021240234375, -0.010507583618164062, -0.008213043212890625, -0.0059185028076171875, -0.00362396240234375, -0.0013294219970703125, 0.000965118408203125, 0.0032596588134765625, 0.00555419921875, 0.007848739624023438, 0.010143280029296875, 0.012437820434570312, 0.01473236083984375, 0.017026901245117188, 0.019321441650390625, 0.021615982055664062, 0.0239105224609375, 0.026205062866210938, 0.028499603271484375, 0.030794143676757812, 0.03308868408203125, 0.03538322448730469, 0.037677764892578125, 0.03997230529785156, 0.042266845703125, 0.04456138610839844, 0.046855926513671875, 0.04915046691894531, 0.05144500732421875, 0.05373954772949219, 0.056034088134765625, 0.05832862854003906, 0.0606231689453125, 0.06291770935058594, 0.06521224975585938, 0.06750679016113281, 0.06980133056640625, 0.07209587097167969, 0.07439041137695312, 0.07668495178222656, 0.0789794921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 23.0, 49.0, 106.0, 203.0, 239.0, 178.0, 101.0, 36.0, 18.0, 13.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.8902294039726257, -0.8677390813827515, -0.8452487587928772, -0.8227584362030029, -0.8002681732177734, -0.7777778506278992, -0.7552875280380249, -0.7327972054481506, -0.7103068828582764, -0.6878165602684021, -0.6653262376785278, -0.6428359746932983, -0.6203456521034241, -0.5978553295135498, -0.5753650069236755, -0.5528746843338013, -0.5303844213485718, -0.5078940987586975, -0.48540380597114563, -0.46291348338127136, -0.4404231905937195, -0.4179328680038452, -0.39544254541397095, -0.3729522228240967, -0.3504619300365448, -0.32797160744667053, -0.30548131465911865, -0.2829909920692444, -0.2605006694793701, -0.23801037669181824, -0.21552005410194397, -0.1930297464132309, -0.17053937911987305, -0.14804907143115997, -0.1255587637424469, -0.10306844115257263, -0.08057813346385956, -0.058087825775146484, -0.03559750318527222, -0.013107195496559143, 0.00938311219215393, 0.0318734236061573, 0.054363735020160675, 0.07685405015945435, 0.09934435784816742, 0.1218346655368805, 0.14432498812675476, 0.16681529581546783, 0.1893056035041809, 0.21179591119289398, 0.23428621888160706, 0.2567765414714813, 0.2792668342590332, 0.30175715684890747, 0.32424747943878174, 0.346737802028656, 0.3692280948162079, 0.39171841740608215, 0.41420871019363403, 0.4366990327835083, 0.45918935537338257, 0.48167964816093445, 0.5041699409484863, 0.5266602635383606, 0.5491505861282349]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 12.0, 10.0, 11.0, 17.0, 18.0, 17.0, 18.0, 16.0, 34.0, 27.0, 34.0, 51.0, 40.0, 54.0, 36.0, 55.0, 45.0, 53.0, 47.0, 40.0, 36.0, 34.0, 37.0, 39.0, 33.0, 28.0, 25.0, 26.0, 18.0, 17.0, 16.0, 11.0, 5.0, 7.0, 3.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.26301419734954834, -0.25473424792289734, -0.24645428359508514, -0.23817431926727295, -0.22989436984062195, -0.22161442041397095, -0.21333445608615875, -0.20505449175834656, -0.19677454233169556, -0.18849459290504456, -0.18021462857723236, -0.17193466424942017, -0.16365471482276917, -0.15537476539611816, -0.14709480106830597, -0.13881483674049377, -0.13053488731384277, -0.12225493043661118, -0.11397497355937958, -0.10569501668214798, -0.09741505980491638, -0.08913510292768478, -0.08085514605045319, -0.07257518917322159, -0.06429523229598999, -0.05601527541875839, -0.047735318541526794, -0.0394553616642952, -0.0311754047870636, -0.022895447909832, -0.014615491032600403, -0.006335534155368805, 0.001944422721862793, 0.010224379599094391, 0.01850433647632599, 0.026784293353557587, 0.035064250230789185, 0.04334420710802078, 0.05162416398525238, 0.05990412086248398, 0.06818407773971558, 0.07646403461694717, 0.08474399149417877, 0.09302394837141037, 0.10130390524864197, 0.10958386212587357, 0.11786381900310516, 0.12614378333091736, 0.13442373275756836, 0.14270368218421936, 0.15098364651203156, 0.15926361083984375, 0.16754356026649475, 0.17582350969314575, 0.18410347402095795, 0.19238343834877014, 0.20066338777542114, 0.20894333720207214, 0.21722330152988434, 0.22550326585769653, 0.23378321528434753, 0.24206316471099854, 0.2503431439399719, 0.2586230933666229, 0.2669030427932739]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 8.0, 14.0, 14.0, 16.0, 25.0, 49.0, 83.0, 133.0, 256.0, 446.0, 819.0, 1752.0, 3690.0, 8537.0, 21707.0, 58868.0, 167955.0, 373043.0, 261374.0, 92899.0, 33826.0, 12747.0, 5381.0, 2407.0, 1171.0, 594.0, 288.0, 182.0, 100.0, 66.0, 33.0, 30.0, 11.0, 6.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.041534423828125, -0.04030275344848633, -0.039071083068847656, -0.037839412689208984, -0.03660774230957031, -0.03537607192993164, -0.03414440155029297, -0.0329127311706543, -0.031681060791015625, -0.030449390411376953, -0.02921772003173828, -0.02798604965209961, -0.026754379272460938, -0.025522708892822266, -0.024291038513183594, -0.023059368133544922, -0.02182769775390625, -0.020596027374267578, -0.019364356994628906, -0.018132686614990234, -0.016901016235351562, -0.01566934585571289, -0.014437675476074219, -0.013206005096435547, -0.011974334716796875, -0.010742664337158203, -0.009510993957519531, -0.00827932357788086, -0.0070476531982421875, -0.005815982818603516, -0.004584312438964844, -0.003352642059326172, -0.0021209716796875, -0.0008893013000488281, 0.00034236907958984375, 0.0015740394592285156, 0.0028057098388671875, 0.004037380218505859, 0.005269050598144531, 0.006500720977783203, 0.007732391357421875, 0.008964061737060547, 0.010195732116699219, 0.01142740249633789, 0.012659072875976562, 0.013890743255615234, 0.015122413635253906, 0.016354084014892578, 0.01758575439453125, 0.018817424774169922, 0.020049095153808594, 0.021280765533447266, 0.022512435913085938, 0.02374410629272461, 0.02497577667236328, 0.026207447052001953, 0.027439117431640625, 0.028670787811279297, 0.02990245819091797, 0.03113412857055664, 0.03236579895019531, 0.033597469329833984, 0.034829139709472656, 0.03606081008911133, 0.03729248046875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 9.0, 8.0, 6.0, 13.0, 16.0, 30.0, 25.0, 49.0, 40.0, 45.0, 65.0, 61.0, 72.0, 65.0, 72.0, 65.0, 77.0, 52.0, 52.0, 48.0, 35.0, 26.0, 23.0, 13.0, 8.0, 8.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0545654296875, -0.052991390228271484, -0.05141735076904297, -0.04984331130981445, -0.04826927185058594, -0.04669523239135742, -0.045121192932128906, -0.04354715347290039, -0.041973114013671875, -0.04039907455444336, -0.038825035095214844, -0.03725099563598633, -0.03567695617675781, -0.0341029167175293, -0.03252887725830078, -0.030954837799072266, -0.02938079833984375, -0.027806758880615234, -0.02623271942138672, -0.024658679962158203, -0.023084640502929688, -0.021510601043701172, -0.019936561584472656, -0.01836252212524414, -0.016788482666015625, -0.01521444320678711, -0.013640403747558594, -0.012066364288330078, -0.010492324829101562, -0.008918285369873047, -0.007344245910644531, -0.005770206451416016, -0.0041961669921875, -0.0026221275329589844, -0.0010480880737304688, 0.0005259513854980469, 0.0020999908447265625, 0.003674030303955078, 0.005248069763183594, 0.006822109222412109, 0.008396148681640625, 0.00997018814086914, 0.011544227600097656, 0.013118267059326172, 0.014692306518554688, 0.016266345977783203, 0.01784038543701172, 0.019414424896240234, 0.02098846435546875, 0.022562503814697266, 0.02413654327392578, 0.025710582733154297, 0.027284622192382812, 0.028858661651611328, 0.030432701110839844, 0.03200674057006836, 0.033580780029296875, 0.03515481948852539, 0.036728858947753906, 0.03830289840698242, 0.03987693786621094, 0.04145097732543945, 0.04302501678466797, 0.044599056243896484, 0.046173095703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 6.0, 12.0, 19.0, 25.0, 43.0, 72.0, 91.0, 110.0, 186.0, 334.0, 554.0, 981.0, 2113.0, 6782.0, 61892.0, 834674.0, 125327.0, 9968.0, 2526.0, 1150.0, 603.0, 375.0, 228.0, 150.0, 103.0, 71.0, 38.0, 30.0, 27.0, 14.0, 7.0, 10.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10186767578125, -0.0985403060913086, -0.09521293640136719, -0.09188556671142578, -0.08855819702148438, -0.08523082733154297, -0.08190345764160156, -0.07857608795166016, -0.07524871826171875, -0.07192134857177734, -0.06859397888183594, -0.06526660919189453, -0.061939239501953125, -0.05861186981201172, -0.05528450012207031, -0.051957130432128906, -0.0486297607421875, -0.045302391052246094, -0.04197502136230469, -0.03864765167236328, -0.035320281982421875, -0.03199291229248047, -0.028665542602539062, -0.025338172912597656, -0.02201080322265625, -0.018683433532714844, -0.015356063842773438, -0.012028694152832031, -0.008701324462890625, -0.005373954772949219, -0.0020465850830078125, 0.0012807846069335938, 0.004608154296875, 0.007935523986816406, 0.011262893676757812, 0.014590263366699219, 0.017917633056640625, 0.02124500274658203, 0.024572372436523438, 0.027899742126464844, 0.03122711181640625, 0.034554481506347656, 0.03788185119628906, 0.04120922088623047, 0.044536590576171875, 0.04786396026611328, 0.05119132995605469, 0.054518699645996094, 0.0578460693359375, 0.061173439025878906, 0.06450080871582031, 0.06782817840576172, 0.07115554809570312, 0.07448291778564453, 0.07781028747558594, 0.08113765716552734, 0.08446502685546875, 0.08779239654541016, 0.09111976623535156, 0.09444713592529297, 0.09777450561523438, 0.10110187530517578, 0.10442924499511719, 0.1077566146850586, 0.111083984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 6.0, 3.0, 8.0, 3.0, 7.0, 12.0, 10.0, 7.0, 13.0, 22.0, 13.0, 28.0, 23.0, 28.0, 36.0, 44.0, 35.0, 39.0, 40.0, 34.0, 41.0, 44.0, 39.0, 41.0, 43.0, 36.0, 36.0, 37.0, 32.0, 28.0, 25.0, 29.0, 27.0, 17.0, 21.0, 13.0, 22.0, 11.0, 6.0, 10.0, 7.0, 9.0, 3.0, 4.0, 4.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11492919921875, -0.11123085021972656, -0.10753250122070312, -0.10383415222167969, -0.10013580322265625, -0.09643745422363281, -0.09273910522460938, -0.08904075622558594, -0.0853424072265625, -0.08164405822753906, -0.07794570922851562, -0.07424736022949219, -0.07054901123046875, -0.06685066223144531, -0.06315231323242188, -0.05945396423339844, -0.055755615234375, -0.05205726623535156, -0.048358917236328125, -0.04466056823730469, -0.04096221923828125, -0.03726387023925781, -0.033565521240234375, -0.029867172241210938, -0.0261688232421875, -0.022470474243164062, -0.018772125244140625, -0.015073776245117188, -0.01137542724609375, -0.0076770782470703125, -0.003978729248046875, -0.0002803802490234375, 0.00341796875, 0.0071163177490234375, 0.010814666748046875, 0.014513015747070312, 0.01821136474609375, 0.021909713745117188, 0.025608062744140625, 0.029306411743164062, 0.0330047607421875, 0.03670310974121094, 0.040401458740234375, 0.04409980773925781, 0.04779815673828125, 0.05149650573730469, 0.055194854736328125, 0.05889320373535156, 0.062591552734375, 0.06628990173339844, 0.06998825073242188, 0.07368659973144531, 0.07738494873046875, 0.08108329772949219, 0.08478164672851562, 0.08847999572753906, 0.0921783447265625, 0.09587669372558594, 0.09957504272460938, 0.10327339172363281, 0.10697174072265625, 0.11067008972167969, 0.11436843872070312, 0.11806678771972656, 0.12176513671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 13.0, 23.0, 16.0, 46.0, 76.0, 161.0, 360.0, 835.0, 3006.0, 30680.0, 947437.0, 59866.0, 4160.0, 1044.0, 406.0, 183.0, 89.0, 38.0, 36.0, 26.0, 15.0, 7.0, 7.0, 4.0, 2.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08575439453125, -0.08295154571533203, -0.08014869689941406, -0.0773458480834961, -0.07454299926757812, -0.07174015045166016, -0.06893730163574219, -0.06613445281982422, -0.06333160400390625, -0.06052875518798828, -0.05772590637207031, -0.054923057556152344, -0.052120208740234375, -0.049317359924316406, -0.04651451110839844, -0.04371166229248047, -0.0409088134765625, -0.03810596466064453, -0.03530311584472656, -0.032500267028808594, -0.029697418212890625, -0.026894569396972656, -0.024091720581054688, -0.02128887176513672, -0.01848602294921875, -0.01568317413330078, -0.012880325317382812, -0.010077476501464844, -0.007274627685546875, -0.004471778869628906, -0.0016689300537109375, 0.0011339187622070312, 0.003936767578125, 0.006739616394042969, 0.009542465209960938, 0.012345314025878906, 0.015148162841796875, 0.017951011657714844, 0.020753860473632812, 0.02355670928955078, 0.02635955810546875, 0.02916240692138672, 0.03196525573730469, 0.034768104553222656, 0.037570953369140625, 0.040373802185058594, 0.04317665100097656, 0.04597949981689453, 0.0487823486328125, 0.05158519744873047, 0.05438804626464844, 0.057190895080566406, 0.059993743896484375, 0.06279659271240234, 0.06559944152832031, 0.06840229034423828, 0.07120513916015625, 0.07400798797607422, 0.07681083679199219, 0.07961368560791016, 0.08241653442382812, 0.0852193832397461, 0.08802223205566406, 0.09082508087158203, 0.0936279296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 10.0, 9.0, 15.0, 13.0, 18.0, 31.0, 34.0, 40.0, 51.0, 70.0, 78.0, 104.0, 91.0, 83.0, 66.0, 64.0, 47.0, 34.0, 23.0, 14.0, 13.0, 16.0, 7.0, 15.0, 7.0, 5.0, 9.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.398822784423828e-05, -4.256516695022583e-05, -4.114210605621338e-05, -3.971904516220093e-05, -3.8295984268188477e-05, -3.6872923374176025e-05, -3.5449862480163574e-05, -3.402680158615112e-05, -3.260374069213867e-05, -3.118067979812622e-05, -2.975761890411377e-05, -2.833455801010132e-05, -2.6911497116088867e-05, -2.5488436222076416e-05, -2.4065375328063965e-05, -2.2642314434051514e-05, -2.1219253540039062e-05, -1.979619264602661e-05, -1.837313175201416e-05, -1.695007085800171e-05, -1.5527009963989258e-05, -1.4103949069976807e-05, -1.2680888175964355e-05, -1.1257827281951904e-05, -9.834766387939453e-06, -8.411705493927002e-06, -6.988644599914551e-06, -5.5655837059021e-06, -4.1425228118896484e-06, -2.7194619178771973e-06, -1.296401023864746e-06, 1.2665987014770508e-07, 1.5497207641601562e-06, 2.9727816581726074e-06, 4.395842552185059e-06, 5.81890344619751e-06, 7.241964340209961e-06, 8.665025234222412e-06, 1.0088086128234863e-05, 1.1511147022247314e-05, 1.2934207916259766e-05, 1.4357268810272217e-05, 1.5780329704284668e-05, 1.720339059829712e-05, 1.862645149230957e-05, 2.004951238632202e-05, 2.1472573280334473e-05, 2.2895634174346924e-05, 2.4318695068359375e-05, 2.5741755962371826e-05, 2.7164816856384277e-05, 2.858787775039673e-05, 3.001093864440918e-05, 3.143399953842163e-05, 3.285706043243408e-05, 3.428012132644653e-05, 3.5703182220458984e-05, 3.7126243114471436e-05, 3.854930400848389e-05, 3.997236490249634e-05, 4.139542579650879e-05, 4.281848669052124e-05, 4.424154758453369e-05, 4.566460847854614e-05, 4.7087669372558594e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 8.0, 9.0, 16.0, 12.0, 18.0, 31.0, 52.0, 59.0, 134.0, 238.0, 431.0, 915.0, 2583.0, 10524.0, 91204.0, 874246.0, 56551.0, 7639.0, 2135.0, 789.0, 377.0, 232.0, 125.0, 71.0, 54.0, 28.0, 24.0, 11.0, 17.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057647705078125, -0.0554652214050293, -0.053282737731933594, -0.05110025405883789, -0.04891777038574219, -0.046735286712646484, -0.04455280303955078, -0.04237031936645508, -0.040187835693359375, -0.03800535202026367, -0.03582286834716797, -0.033640384674072266, -0.03145790100097656, -0.02927541732788086, -0.027092933654785156, -0.024910449981689453, -0.02272796630859375, -0.020545482635498047, -0.018362998962402344, -0.01618051528930664, -0.013998031616210938, -0.011815547943115234, -0.009633064270019531, -0.007450580596923828, -0.005268096923828125, -0.003085613250732422, -0.0009031295776367188, 0.0012793540954589844, 0.0034618377685546875, 0.005644321441650391, 0.007826805114746094, 0.010009288787841797, 0.0121917724609375, 0.014374256134033203, 0.016556739807128906, 0.01873922348022461, 0.020921707153320312, 0.023104190826416016, 0.02528667449951172, 0.027469158172607422, 0.029651641845703125, 0.03183412551879883, 0.03401660919189453, 0.036199092864990234, 0.03838157653808594, 0.04056406021118164, 0.042746543884277344, 0.04492902755737305, 0.04711151123046875, 0.04929399490356445, 0.051476478576660156, 0.05365896224975586, 0.05584144592285156, 0.058023929595947266, 0.06020641326904297, 0.06238889694213867, 0.06457138061523438, 0.06675386428833008, 0.06893634796142578, 0.07111883163452148, 0.07330131530761719, 0.07548379898071289, 0.0776662826538086, 0.0798487663269043, 0.08203125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 5.0, 2.0, 8.0, 8.0, 4.0, 14.0, 12.0, 15.0, 15.0, 25.0, 24.0, 25.0, 37.0, 37.0, 43.0, 57.0, 76.0, 78.0, 67.0, 69.0, 57.0, 55.0, 49.0, 30.0, 25.0, 28.0, 22.0, 21.0, 18.0, 15.0, 12.0, 5.0, 4.0, 5.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0258636474609375, -0.024947404861450195, -0.02403116226196289, -0.023114919662475586, -0.02219867706298828, -0.021282434463500977, -0.020366191864013672, -0.019449949264526367, -0.018533706665039062, -0.017617464065551758, -0.016701221466064453, -0.01578497886657715, -0.014868736267089844, -0.013952493667602539, -0.013036251068115234, -0.01212000846862793, -0.011203765869140625, -0.01028752326965332, -0.009371280670166016, -0.008455038070678711, -0.007538795471191406, -0.0066225528717041016, -0.005706310272216797, -0.004790067672729492, -0.0038738250732421875, -0.002957582473754883, -0.002041339874267578, -0.0011250972747802734, -0.00020885467529296875, 0.0007073879241943359, 0.0016236305236816406, 0.0025398731231689453, 0.00345611572265625, 0.004372358322143555, 0.005288600921630859, 0.006204843521118164, 0.007121086120605469, 0.008037328720092773, 0.008953571319580078, 0.009869813919067383, 0.010786056518554688, 0.011702299118041992, 0.012618541717529297, 0.013534784317016602, 0.014451026916503906, 0.015367269515991211, 0.016283512115478516, 0.01719975471496582, 0.018115997314453125, 0.01903223991394043, 0.019948482513427734, 0.02086472511291504, 0.021780967712402344, 0.02269721031188965, 0.023613452911376953, 0.024529695510864258, 0.025445938110351562, 0.026362180709838867, 0.027278423309326172, 0.028194665908813477, 0.02911090850830078, 0.030027151107788086, 0.03094339370727539, 0.031859636306762695, 0.03277587890625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 15.0, 76.0, 155.0, 276.0, 278.0, 102.0, 43.0, 11.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7093920707702637, -0.6796869039535522, -0.6499817967414856, -0.6202766299247742, -0.5905714631080627, -0.5608663558959961, -0.5311611890792847, -0.5014560222625732, -0.4717508852481842, -0.44204574823379517, -0.41234058141708374, -0.3826354444026947, -0.35293030738830566, -0.32322514057159424, -0.2935200035572052, -0.26381486654281616, -0.23410969972610474, -0.2044045478105545, -0.17469939589500427, -0.14499425888061523, -0.115289106965065, -0.08558395504951477, -0.05587881803512573, -0.0261736661195755, 0.0035314857959747314, 0.033236633986234665, 0.0629417821764946, 0.09264692664146423, 0.12235207855701447, 0.1520572304725647, 0.18176236748695374, 0.21146751940250397, 0.2411726713180542, 0.27087780833244324, 0.30058297514915466, 0.3302881121635437, 0.3599932789802551, 0.38969841599464417, 0.4194035530090332, 0.44910871982574463, 0.47881385684013367, 0.5085189938545227, 0.5382241606712341, 0.5679292678833008, 0.5976344347000122, 0.6273396015167236, 0.6570447683334351, 0.6867498755455017, 0.7164550423622131, 0.7461602091789246, 0.7758653163909912, 0.8055704832077026, 0.8352756500244141, 0.8649808168411255, 0.8946859240531921, 0.9243910908699036, 0.9540961980819702, 0.9838013648986816, 1.013506531715393, 1.0432116985321045, 1.0729167461395264, 1.1026219129562378, 1.1323270797729492, 1.1620322465896606, 1.191737413406372]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 7.0, 5.0, 8.0, 10.0, 12.0, 13.0, 18.0, 14.0, 21.0, 20.0, 34.0, 33.0, 18.0, 27.0, 29.0, 34.0, 52.0, 59.0, 45.0, 42.0, 49.0, 44.0, 61.0, 41.0, 36.0, 35.0, 21.0, 15.0, 26.0, 25.0, 15.0, 26.0, 10.0, 20.0, 10.0, 11.0, 7.0, 11.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.5077877044677734, -0.49288874864578247, -0.4779898226261139, -0.4630908668041229, -0.44819191098213196, -0.4332929849624634, -0.4183940291404724, -0.40349507331848145, -0.38859614729881287, -0.3736971914768219, -0.3587982654571533, -0.34389930963516235, -0.3290003538131714, -0.3141014277935028, -0.29920247197151184, -0.28430354595184326, -0.2694045901298523, -0.25450563430786133, -0.23960669338703156, -0.22470775246620178, -0.209808811545372, -0.19490987062454224, -0.18001091480255127, -0.1651119738817215, -0.15021300315856934, -0.13531406223773956, -0.1204151138663292, -0.10551616549491882, -0.09061722457408905, -0.07571827620267868, -0.06081932783126831, -0.04592038691043854, -0.031021445989608765, -0.016122501343488693, -0.0012235548347234726, 0.013675391674041748, 0.02857433632016182, 0.04347328096628189, 0.05837222933769226, 0.07327117025852203, 0.0881701186299324, 0.10306906700134277, 0.11796800792217255, 0.13286694884300232, 0.1477659046649933, 0.16266484558582306, 0.17756378650665283, 0.1924627423286438, 0.20736168324947357, 0.22226062417030334, 0.2371595799922943, 0.2520585060119629, 0.26695746183395386, 0.2818564176559448, 0.2967553734779358, 0.31165429949760437, 0.32655325531959534, 0.3414522111415863, 0.3563511371612549, 0.37125009298324585, 0.3861490488052368, 0.4010479748249054, 0.41594693064689636, 0.43084585666656494, 0.4457448124885559]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 19.0, 33.0, 92.0, 246.0, 859.0, 4191475.0, 1083.0, 287.0, 104.0, 45.0, 16.0, 15.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.4248046875, -1.3981895446777344, -1.3715744018554688, -1.3449592590332031, -1.3183441162109375, -1.2917289733886719, -1.2651138305664062, -1.2384986877441406, -1.211883544921875, -1.1852684020996094, -1.1586532592773438, -1.1320381164550781, -1.1054229736328125, -1.0788078308105469, -1.0521926879882812, -1.0255775451660156, -0.99896240234375, -0.9723472595214844, -0.9457321166992188, -0.9191169738769531, -0.8925018310546875, -0.8658866882324219, -0.8392715454101562, -0.8126564025878906, -0.786041259765625, -0.7594261169433594, -0.7328109741210938, -0.7061958312988281, -0.6795806884765625, -0.6529655456542969, -0.6263504028320312, -0.5997352600097656, -0.5731201171875, -0.5465049743652344, -0.5198898315429688, -0.4932746887207031, -0.4666595458984375, -0.4400444030761719, -0.41342926025390625, -0.3868141174316406, -0.360198974609375, -0.3335838317871094, -0.30696868896484375, -0.2803535461425781, -0.2537384033203125, -0.22712326049804688, -0.20050811767578125, -0.17389297485351562, -0.14727783203125, -0.12066268920898438, -0.09404754638671875, -0.06743240356445312, -0.0408172607421875, -0.014202117919921875, 0.01241302490234375, 0.039028167724609375, 0.065643310546875, 0.09225845336914062, 0.11887359619140625, 0.14548873901367188, 0.1721038818359375, 0.19871902465820312, 0.22533416748046875, 0.2519493103027344, 0.278564453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 11.0, 8.0, 14.0, 22.0, 34.0, 47.0, 48.0, 52.0, 50.0, 63.0, 67.0, 58.0, 71.0, 70.0, 64.0, 63.0, 57.0, 37.0, 38.0, 24.0, 31.0, 20.0, 18.0, 10.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.055328369140625, -0.05379629135131836, -0.05226421356201172, -0.05073213577270508, -0.04920005798339844, -0.0476679801940918, -0.046135902404785156, -0.044603824615478516, -0.043071746826171875, -0.041539669036865234, -0.040007591247558594, -0.03847551345825195, -0.03694343566894531, -0.03541135787963867, -0.03387928009033203, -0.03234720230102539, -0.03081512451171875, -0.02928304672241211, -0.02775096893310547, -0.026218891143798828, -0.024686813354492188, -0.023154735565185547, -0.021622657775878906, -0.020090579986572266, -0.018558502197265625, -0.017026424407958984, -0.015494346618652344, -0.013962268829345703, -0.012430191040039062, -0.010898113250732422, -0.009366035461425781, -0.00783395767211914, -0.0063018798828125, -0.004769802093505859, -0.0032377243041992188, -0.0017056465148925781, -0.0001735687255859375, 0.0013585090637207031, 0.0028905868530273438, 0.004422664642333984, 0.005954742431640625, 0.007486820220947266, 0.009018898010253906, 0.010550975799560547, 0.012083053588867188, 0.013615131378173828, 0.015147209167480469, 0.01667928695678711, 0.01821136474609375, 0.01974344253540039, 0.02127552032470703, 0.022807598114013672, 0.024339675903320312, 0.025871753692626953, 0.027403831481933594, 0.028935909271240234, 0.030467987060546875, 0.032000064849853516, 0.033532142639160156, 0.0350642204284668, 0.03659629821777344, 0.03812837600708008, 0.03966045379638672, 0.04119253158569336, 0.042724609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 9.0, 10.0, 5.0, 32.0, 44.0, 93.0, 154.0, 309.0, 908.0, 2844.0, 9800.0, 48698.0, 886283.0, 3097363.0, 122445.0, 18096.0, 4596.0, 1503.0, 517.0, 236.0, 120.0, 74.0, 44.0, 36.0, 20.0, 18.0, 9.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0865478515625, -0.08434009552001953, -0.08213233947753906, -0.0799245834350586, -0.07771682739257812, -0.07550907135009766, -0.07330131530761719, -0.07109355926513672, -0.06888580322265625, -0.06667804718017578, -0.06447029113769531, -0.062262535095214844, -0.060054779052734375, -0.057847023010253906, -0.05563926696777344, -0.05343151092529297, -0.0512237548828125, -0.04901599884033203, -0.04680824279785156, -0.044600486755371094, -0.042392730712890625, -0.040184974670410156, -0.03797721862792969, -0.03576946258544922, -0.03356170654296875, -0.03135395050048828, -0.029146194458007812, -0.026938438415527344, -0.024730682373046875, -0.022522926330566406, -0.020315170288085938, -0.01810741424560547, -0.015899658203125, -0.013691902160644531, -0.011484146118164062, -0.009276390075683594, -0.007068634033203125, -0.004860877990722656, -0.0026531219482421875, -0.00044536590576171875, 0.00176239013671875, 0.003970146179199219, 0.0061779022216796875, 0.008385658264160156, 0.010593414306640625, 0.012801170349121094, 0.015008926391601562, 0.01721668243408203, 0.0194244384765625, 0.02163219451904297, 0.023839950561523438, 0.026047706604003906, 0.028255462646484375, 0.030463218688964844, 0.03267097473144531, 0.03487873077392578, 0.03708648681640625, 0.03929424285888672, 0.04150199890136719, 0.043709754943847656, 0.045917510986328125, 0.048125267028808594, 0.05033302307128906, 0.05254077911376953, 0.05474853515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 19.0, 23.0, 40.0, 62.0, 132.0, 292.0, 611.0, 1089.0, 818.0, 472.0, 228.0, 97.0, 48.0, 42.0, 15.0, 17.0, 11.0, 13.0, 4.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055877685546875, -0.0534205436706543, -0.050963401794433594, -0.04850625991821289, -0.04604911804199219, -0.043591976165771484, -0.04113483428955078, -0.03867769241333008, -0.036220550537109375, -0.03376340866088867, -0.03130626678466797, -0.028849124908447266, -0.026391983032226562, -0.02393484115600586, -0.021477699279785156, -0.019020557403564453, -0.01656341552734375, -0.014106273651123047, -0.011649131774902344, -0.00919198989868164, -0.0067348480224609375, -0.004277706146240234, -0.0018205642700195312, 0.0006365776062011719, 0.003093719482421875, 0.005550861358642578, 0.008008003234863281, 0.010465145111083984, 0.012922286987304688, 0.01537942886352539, 0.017836570739746094, 0.020293712615966797, 0.0227508544921875, 0.025207996368408203, 0.027665138244628906, 0.03012228012084961, 0.03257942199707031, 0.035036563873291016, 0.03749370574951172, 0.03995084762573242, 0.042407989501953125, 0.04486513137817383, 0.04732227325439453, 0.049779415130615234, 0.05223655700683594, 0.05469369888305664, 0.057150840759277344, 0.05960798263549805, 0.06206512451171875, 0.06452226638793945, 0.06697940826416016, 0.06943655014038086, 0.07189369201660156, 0.07435083389282227, 0.07680797576904297, 0.07926511764526367, 0.08172225952148438, 0.08417940139770508, 0.08663654327392578, 0.08909368515014648, 0.09155082702636719, 0.09400796890258789, 0.0964651107788086, 0.0989222526550293, 0.10137939453125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 17.0, 31.0, 55.0, 93.0, 184.0, 247.0, 150.0, 105.0, 53.0, 22.0, 7.0, 7.0, 4.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7416550517082214, -0.7236423492431641, -0.7056297063827515, -0.6876170635223389, -0.6696043610572815, -0.6515916585922241, -0.6335790157318115, -0.6155663728713989, -0.5975536704063416, -0.5795409679412842, -0.5615283250808716, -0.543515682220459, -0.5255029797554016, -0.5074902772903442, -0.48947763442993164, -0.47146496176719666, -0.45345228910446167, -0.4354396164417267, -0.4174269437789917, -0.3994142711162567, -0.38140159845352173, -0.36338892579078674, -0.34537625312805176, -0.3273635804653168, -0.3093509078025818, -0.2913382351398468, -0.2733255624771118, -0.25531288981437683, -0.23730021715164185, -0.21928754448890686, -0.20127487182617188, -0.1832621991634369, -0.16524949669837952, -0.14723682403564453, -0.12922415137290955, -0.11121147871017456, -0.09319880604743958, -0.07518613338470459, -0.057173460721969604, -0.03916078805923462, -0.021148115396499634, -0.0031354427337646484, 0.014877229928970337, 0.03288990259170532, 0.05090257525444031, 0.06891524791717529, 0.08692792057991028, 0.10494059324264526, 0.12295326590538025, 0.14096593856811523, 0.15897861123085022, 0.1769912838935852, 0.1950039565563202, 0.21301662921905518, 0.23102930188179016, 0.24904197454452515, 0.26705464720726013, 0.2850673198699951, 0.3030799925327301, 0.3210926651954651, 0.3391053378582001, 0.35711801052093506, 0.37513068318367004, 0.39314335584640503, 0.41115602850914]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 7.0, 13.0, 12.0, 8.0, 16.0, 19.0, 25.0, 27.0, 35.0, 29.0, 41.0, 58.0, 47.0, 46.0, 59.0, 49.0, 60.0, 54.0, 49.0, 54.0, 51.0, 45.0, 35.0, 30.0, 33.0, 15.0, 18.0, 10.0, 13.0, 9.0, 7.0, 6.0, 9.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200320303440094, -0.19193285703659058, -0.18354542553424835, -0.17515797913074493, -0.1667705476284027, -0.1583831012248993, -0.14999565482139587, -0.14160820841789246, -0.13322077691555023, -0.12483333796262741, -0.11644589900970459, -0.10805845260620117, -0.09967101365327835, -0.09128357470035553, -0.08289612829685211, -0.07450868934392929, -0.06612125039100647, -0.05773381143808365, -0.04934636875987053, -0.04095892608165741, -0.03257148712873459, -0.024184048175811768, -0.015796605497598648, -0.0074091628193855286, 0.0009782761335372925, 0.009365716949105263, 0.017753157764673233, 0.026140598580241203, 0.034528039395809174, 0.042915478348731995, 0.051302921026945114, 0.059690363705158234, 0.06807780265808105, 0.07646524161100388, 0.0848526805639267, 0.09324012696743011, 0.10162756592035294, 0.11001500487327576, 0.11840245127677917, 0.1267898976802826, 0.13517732918262482, 0.14356477558612823, 0.15195220708847046, 0.16033965349197388, 0.1687270998954773, 0.17711453139781952, 0.18550197780132294, 0.19388940930366516, 0.20227685570716858, 0.210664302110672, 0.21905173361301422, 0.22743918001651764, 0.23582661151885986, 0.24421405792236328, 0.2526015043258667, 0.2609889507293701, 0.26937639713287354, 0.27776384353637695, 0.28615128993988037, 0.2945387065410614, 0.3029261529445648, 0.31131359934806824, 0.31970104575157166, 0.3280884921550751, 0.3364759087562561]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 10.0, 24.0, 15.0, 26.0, 38.0, 70.0, 94.0, 150.0, 266.0, 492.0, 885.0, 1854.0, 3997.0, 10774.0, 30063.0, 93373.0, 312146.0, 396909.0, 132660.0, 40469.0, 14089.0, 5347.0, 2350.0, 1072.0, 549.0, 326.0, 186.0, 111.0, 70.0, 39.0, 36.0, 19.0, 13.0, 9.0, 5.0, 2.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0450439453125, -0.043642520904541016, -0.04224109649658203, -0.04083967208862305, -0.03943824768066406, -0.03803682327270508, -0.036635398864746094, -0.03523397445678711, -0.033832550048828125, -0.03243112564086914, -0.031029701232910156, -0.029628276824951172, -0.028226852416992188, -0.026825428009033203, -0.02542400360107422, -0.024022579193115234, -0.02262115478515625, -0.021219730377197266, -0.01981830596923828, -0.018416881561279297, -0.017015457153320312, -0.015614032745361328, -0.014212608337402344, -0.01281118392944336, -0.011409759521484375, -0.01000833511352539, -0.008606910705566406, -0.007205486297607422, -0.0058040618896484375, -0.004402637481689453, -0.0030012130737304688, -0.0015997886657714844, -0.0001983642578125, 0.0012030601501464844, 0.0026044845581054688, 0.004005908966064453, 0.0054073333740234375, 0.006808757781982422, 0.008210182189941406, 0.00961160659790039, 0.011013031005859375, 0.01241445541381836, 0.013815879821777344, 0.015217304229736328, 0.016618728637695312, 0.018020153045654297, 0.01942157745361328, 0.020823001861572266, 0.02222442626953125, 0.023625850677490234, 0.02502727508544922, 0.026428699493408203, 0.027830123901367188, 0.029231548309326172, 0.030632972717285156, 0.03203439712524414, 0.033435821533203125, 0.03483724594116211, 0.036238670349121094, 0.03764009475708008, 0.03904151916503906, 0.04044294357299805, 0.04184436798095703, 0.043245792388916016, 0.044647216796875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 13.0, 10.0, 10.0, 8.0, 17.0, 26.0, 23.0, 31.0, 48.0, 51.0, 35.0, 56.0, 55.0, 64.0, 61.0, 69.0, 56.0, 66.0, 56.0, 47.0, 50.0, 24.0, 24.0, 31.0, 17.0, 22.0, 9.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.047454833984375, -0.04600095748901367, -0.044547080993652344, -0.043093204498291016, -0.04163932800292969, -0.04018545150756836, -0.03873157501220703, -0.0372776985168457, -0.035823822021484375, -0.03436994552612305, -0.03291606903076172, -0.03146219253540039, -0.030008316040039062, -0.028554439544677734, -0.027100563049316406, -0.025646686553955078, -0.02419281005859375, -0.022738933563232422, -0.021285057067871094, -0.019831180572509766, -0.018377304077148438, -0.01692342758178711, -0.015469551086425781, -0.014015674591064453, -0.012561798095703125, -0.011107921600341797, -0.009654045104980469, -0.00820016860961914, -0.0067462921142578125, -0.005292415618896484, -0.0038385391235351562, -0.002384662628173828, -0.0009307861328125, 0.0005230903625488281, 0.0019769668579101562, 0.0034308433532714844, 0.0048847198486328125, 0.006338596343994141, 0.007792472839355469, 0.009246349334716797, 0.010700225830078125, 0.012154102325439453, 0.013607978820800781, 0.01506185531616211, 0.016515731811523438, 0.017969608306884766, 0.019423484802246094, 0.020877361297607422, 0.02233123779296875, 0.023785114288330078, 0.025238990783691406, 0.026692867279052734, 0.028146743774414062, 0.02960062026977539, 0.03105449676513672, 0.03250837326049805, 0.033962249755859375, 0.0354161262512207, 0.03687000274658203, 0.03832387924194336, 0.03977775573730469, 0.041231632232666016, 0.042685508728027344, 0.04413938522338867, 0.04559326171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 11.0, 16.0, 18.0, 25.0, 36.0, 72.0, 95.0, 152.0, 314.0, 583.0, 1262.0, 4206.0, 28909.0, 672022.0, 318216.0, 17108.0, 3191.0, 1114.0, 538.0, 276.0, 138.0, 92.0, 53.0, 28.0, 25.0, 17.0, 11.0, 5.0, 11.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1226806640625, -0.11916446685791016, -0.11564826965332031, -0.11213207244873047, -0.10861587524414062, -0.10509967803955078, -0.10158348083496094, -0.0980672836303711, -0.09455108642578125, -0.0910348892211914, -0.08751869201660156, -0.08400249481201172, -0.08048629760742188, -0.07697010040283203, -0.07345390319824219, -0.06993770599365234, -0.0664215087890625, -0.06290531158447266, -0.05938911437988281, -0.05587291717529297, -0.052356719970703125, -0.04884052276611328, -0.04532432556152344, -0.041808128356933594, -0.03829193115234375, -0.034775733947753906, -0.03125953674316406, -0.02774333953857422, -0.024227142333984375, -0.02071094512939453, -0.017194747924804688, -0.013678550720214844, -0.010162353515625, -0.006646156311035156, -0.0031299591064453125, 0.00038623809814453125, 0.003902435302734375, 0.007418632507324219, 0.010934829711914062, 0.014451026916503906, 0.01796722412109375, 0.021483421325683594, 0.024999618530273438, 0.02851581573486328, 0.032032012939453125, 0.03554821014404297, 0.03906440734863281, 0.042580604553222656, 0.0460968017578125, 0.049612998962402344, 0.05312919616699219, 0.05664539337158203, 0.060161590576171875, 0.06367778778076172, 0.06719398498535156, 0.0707101821899414, 0.07422637939453125, 0.0777425765991211, 0.08125877380371094, 0.08477497100830078, 0.08829116821289062, 0.09180736541748047, 0.09532356262207031, 0.09883975982666016, 0.10235595703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 8.0, 13.0, 9.0, 16.0, 17.0, 22.0, 17.0, 21.0, 32.0, 30.0, 38.0, 32.0, 37.0, 44.0, 38.0, 49.0, 40.0, 44.0, 43.0, 32.0, 40.0, 42.0, 47.0, 32.0, 26.0, 29.0, 26.0, 17.0, 23.0, 20.0, 13.0, 10.0, 19.0, 11.0, 6.0, 10.0, 6.0, 5.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10345458984375, -0.09997940063476562, -0.09650421142578125, -0.09302902221679688, -0.0895538330078125, -0.08607864379882812, -0.08260345458984375, -0.07912826538085938, -0.075653076171875, -0.07217788696289062, -0.06870269775390625, -0.06522750854492188, -0.0617523193359375, -0.058277130126953125, -0.05480194091796875, -0.051326751708984375, -0.0478515625, -0.044376373291015625, -0.04090118408203125, -0.037425994873046875, -0.0339508056640625, -0.030475616455078125, -0.02700042724609375, -0.023525238037109375, -0.020050048828125, -0.016574859619140625, -0.01309967041015625, -0.009624481201171875, -0.0061492919921875, -0.002674102783203125, 0.00080108642578125, 0.004276275634765625, 0.00775146484375, 0.011226654052734375, 0.01470184326171875, 0.018177032470703125, 0.0216522216796875, 0.025127410888671875, 0.02860260009765625, 0.032077789306640625, 0.035552978515625, 0.039028167724609375, 0.04250335693359375, 0.045978546142578125, 0.0494537353515625, 0.052928924560546875, 0.05640411376953125, 0.059879302978515625, 0.0633544921875, 0.06682968139648438, 0.07030487060546875, 0.07378005981445312, 0.0772552490234375, 0.08073043823242188, 0.08420562744140625, 0.08768081665039062, 0.091156005859375, 0.09463119506835938, 0.09810638427734375, 0.10158157348632812, 0.1050567626953125, 0.10853195190429688, 0.11200714111328125, 0.11548233032226562, 0.11895751953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 12.0, 16.0, 21.0, 32.0, 73.0, 122.0, 211.0, 545.0, 1601.0, 7889.0, 109260.0, 895448.0, 27918.0, 3697.0, 947.0, 346.0, 171.0, 79.0, 41.0, 28.0, 22.0, 18.0, 13.0, 7.0, 2.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07891845703125, -0.07639598846435547, -0.07387351989746094, -0.0713510513305664, -0.06882858276367188, -0.06630611419677734, -0.06378364562988281, -0.06126117706298828, -0.05873870849609375, -0.05621623992919922, -0.05369377136230469, -0.051171302795410156, -0.048648834228515625, -0.046126365661621094, -0.04360389709472656, -0.04108142852783203, -0.0385589599609375, -0.03603649139404297, -0.03351402282714844, -0.030991554260253906, -0.028469085693359375, -0.025946617126464844, -0.023424148559570312, -0.02090167999267578, -0.01837921142578125, -0.01585674285888672, -0.013334274291992188, -0.010811805725097656, -0.008289337158203125, -0.005766868591308594, -0.0032444000244140625, -0.0007219314575195312, 0.001800537109375, 0.004323005676269531, 0.0068454742431640625, 0.009367942810058594, 0.011890411376953125, 0.014412879943847656, 0.016935348510742188, 0.01945781707763672, 0.02198028564453125, 0.02450275421142578, 0.027025222778320312, 0.029547691345214844, 0.032070159912109375, 0.034592628479003906, 0.03711509704589844, 0.03963756561279297, 0.0421600341796875, 0.04468250274658203, 0.04720497131347656, 0.049727439880371094, 0.052249908447265625, 0.054772377014160156, 0.05729484558105469, 0.05981731414794922, 0.06233978271484375, 0.06486225128173828, 0.06738471984863281, 0.06990718841552734, 0.07242965698242188, 0.0749521255493164, 0.07747459411621094, 0.07999706268310547, 0.08251953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 11.0, 6.0, 11.0, 12.0, 23.0, 16.0, 30.0, 39.0, 65.0, 65.0, 120.0, 111.0, 116.0, 96.0, 79.0, 44.0, 33.0, 36.0, 17.0, 15.0, 14.0, 11.0, 7.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.514787673950195e-05, -6.342492997646332e-05, -6.170198321342468e-05, -5.997903645038605e-05, -5.825608968734741e-05, -5.653314292430878e-05, -5.481019616127014e-05, -5.3087249398231506e-05, -5.136430263519287e-05, -4.9641355872154236e-05, -4.79184091091156e-05, -4.6195462346076965e-05, -4.447251558303833e-05, -4.2749568819999695e-05, -4.102662205696106e-05, -3.9303675293922424e-05, -3.758072853088379e-05, -3.5857781767845154e-05, -3.413483500480652e-05, -3.241188824176788e-05, -3.068894147872925e-05, -2.8965994715690613e-05, -2.7243047952651978e-05, -2.5520101189613342e-05, -2.3797154426574707e-05, -2.2074207663536072e-05, -2.0351260900497437e-05, -1.86283141374588e-05, -1.6905367374420166e-05, -1.518242061138153e-05, -1.3459473848342896e-05, -1.173652708530426e-05, -1.0013580322265625e-05, -8.29063355922699e-06, -6.5676867961883545e-06, -4.844740033149719e-06, -3.121793270111084e-06, -1.3988465070724487e-06, 3.241002559661865e-07, 2.0470470190048218e-06, 3.769993782043457e-06, 5.492940545082092e-06, 7.2158873081207275e-06, 8.938834071159363e-06, 1.0661780834197998e-05, 1.2384727597236633e-05, 1.4107674360275269e-05, 1.5830621123313904e-05, 1.755356788635254e-05, 1.9276514649391174e-05, 2.099946141242981e-05, 2.2722408175468445e-05, 2.444535493850708e-05, 2.6168301701545715e-05, 2.789124846458435e-05, 2.9614195227622986e-05, 3.133714199066162e-05, 3.3060088753700256e-05, 3.478303551673889e-05, 3.650598227977753e-05, 3.822892904281616e-05, 3.99518758058548e-05, 4.167482256889343e-05, 4.339776933193207e-05, 4.51207160949707e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 10.0, 9.0, 13.0, 12.0, 21.0, 26.0, 33.0, 35.0, 62.0, 111.0, 152.0, 258.0, 438.0, 806.0, 1850.0, 4504.0, 12845.0, 58013.0, 693036.0, 234751.0, 27700.0, 7916.0, 3073.0, 1287.0, 630.0, 345.0, 204.0, 126.0, 84.0, 66.0, 37.0, 30.0, 22.0, 11.0, 11.0, 9.0, 12.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.042633056640625, -0.041248321533203125, -0.03986358642578125, -0.038478851318359375, -0.0370941162109375, -0.035709381103515625, -0.03432464599609375, -0.032939910888671875, -0.03155517578125, -0.030170440673828125, -0.02878570556640625, -0.027400970458984375, -0.0260162353515625, -0.024631500244140625, -0.02324676513671875, -0.021862030029296875, -0.020477294921875, -0.019092559814453125, -0.01770782470703125, -0.016323089599609375, -0.0149383544921875, -0.013553619384765625, -0.01216888427734375, -0.010784149169921875, -0.0093994140625, -0.008014678955078125, -0.00662994384765625, -0.005245208740234375, -0.0038604736328125, -0.002475738525390625, -0.00109100341796875, 0.000293731689453125, 0.001678466796875, 0.003063201904296875, 0.00444793701171875, 0.005832672119140625, 0.0072174072265625, 0.008602142333984375, 0.00998687744140625, 0.011371612548828125, 0.01275634765625, 0.014141082763671875, 0.01552581787109375, 0.016910552978515625, 0.0182952880859375, 0.019680023193359375, 0.02106475830078125, 0.022449493408203125, 0.023834228515625, 0.025218963623046875, 0.02660369873046875, 0.027988433837890625, 0.0293731689453125, 0.030757904052734375, 0.03214263916015625, 0.033527374267578125, 0.034912109375, 0.036296844482421875, 0.03768157958984375, 0.039066314697265625, 0.0404510498046875, 0.041835784912109375, 0.04322052001953125, 0.044605255126953125, 0.045989990234375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 13.0, 10.0, 17.0, 32.0, 30.0, 65.0, 97.0, 95.0, 115.0, 116.0, 106.0, 84.0, 59.0, 45.0, 27.0, 19.0, 13.0, 3.0, 5.0, 12.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.034210205078125, -0.0328974723815918, -0.031584739685058594, -0.03027200698852539, -0.028959274291992188, -0.027646541595458984, -0.02633380889892578, -0.025021076202392578, -0.023708343505859375, -0.022395610809326172, -0.02108287811279297, -0.019770145416259766, -0.018457412719726562, -0.01714468002319336, -0.015831947326660156, -0.014519214630126953, -0.01320648193359375, -0.011893749237060547, -0.010581016540527344, -0.00926828384399414, -0.007955551147460938, -0.006642818450927734, -0.005330085754394531, -0.004017353057861328, -0.002704620361328125, -0.0013918876647949219, -7.915496826171875e-05, 0.0012335777282714844, 0.0025463104248046875, 0.0038590431213378906, 0.005171775817871094, 0.006484508514404297, 0.0077972412109375, 0.009109973907470703, 0.010422706604003906, 0.01173543930053711, 0.013048171997070312, 0.014360904693603516, 0.01567363739013672, 0.016986370086669922, 0.018299102783203125, 0.019611835479736328, 0.02092456817626953, 0.022237300872802734, 0.023550033569335938, 0.02486276626586914, 0.026175498962402344, 0.027488231658935547, 0.02880096435546875, 0.030113697052001953, 0.031426429748535156, 0.03273916244506836, 0.03405189514160156, 0.035364627838134766, 0.03667736053466797, 0.03799009323120117, 0.039302825927734375, 0.04061555862426758, 0.04192829132080078, 0.043241024017333984, 0.04455375671386719, 0.04586648941040039, 0.047179222106933594, 0.0484919548034668, 0.0498046875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 10.0, 11.0, 32.0, 180.0, 563.0, 174.0, 19.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.9239914417266846, -2.8637728691101074, -2.8035542964935303, -2.7433359622955322, -2.683117389678955, -2.622898817062378, -2.562680244445801, -2.5024619102478027, -2.4422433376312256, -2.3820247650146484, -2.3218061923980713, -2.2615878582000732, -2.201369285583496, -2.141150712966919, -2.080932140350342, -2.0207138061523438, -1.960495114326477, -1.9002765417099, -1.8400580883026123, -1.7798395156860352, -1.7196210622787476, -1.6594024896621704, -1.5991840362548828, -1.5389654636383057, -1.4787468910217285, -1.4185283184051514, -1.3583098649978638, -1.2980912923812866, -1.237872838973999, -1.1776542663574219, -1.1174356937408447, -1.0572172403335571, -0.9969988465309143, -0.9367803335189819, -0.8765618205070496, -0.8163433074951172, -0.75612473487854, -0.6959062814712524, -0.6356877088546753, -0.5754691958427429, -0.5152506828308105, -0.4550321698188782, -0.3948136568069458, -0.33459511399269104, -0.27437660098075867, -0.2141580879688263, -0.15393954515457153, -0.09372103214263916, -0.03350251913070679, 0.026716001331806183, 0.08693452179431915, 0.14715304970741272, 0.2073715627193451, 0.26759007573127747, 0.3278086185455322, 0.3880271315574646, 0.448245644569397, 0.5084641575813293, 0.5686826705932617, 0.6289012432098389, 0.6891196966171265, 0.7493382692337036, 0.809556782245636, 0.8697752952575684, 0.9299938082695007]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 6.0, 11.0, 12.0, 21.0, 15.0, 28.0, 26.0, 25.0, 39.0, 39.0, 30.0, 41.0, 41.0, 42.0, 55.0, 60.0, 72.0, 50.0, 41.0, 39.0, 38.0, 39.0, 32.0, 26.0, 35.0, 16.0, 20.0, 13.0, 14.0, 16.0, 9.0, 7.0, 12.0, 2.0, 2.0, 7.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5337928533554077, -0.5174675583839417, -0.5011422634124756, -0.4848169684410095, -0.46849164366722107, -0.452166348695755, -0.43584105372428894, -0.4195157587528229, -0.4031904339790344, -0.38686513900756836, -0.3705398440361023, -0.35421454906463623, -0.3378892242908478, -0.3215639293193817, -0.30523863434791565, -0.2889133393764496, -0.2725880444049835, -0.25626274943351746, -0.2399374395608902, -0.22361214458942413, -0.20728683471679688, -0.1909615397453308, -0.17463624477386475, -0.15831094980239868, -0.14198563992977142, -0.12566034495830536, -0.1093350350856781, -0.09300974011421204, -0.07668443769216537, -0.06035913527011871, -0.04403384029865265, -0.027708537876605988, -0.011383235454559326, 0.004942065104842186, 0.021267365664243698, 0.03759266436100006, 0.05391796678304672, 0.07024326920509338, 0.08656856417655945, 0.10289386659860611, 0.11921916902065277, 0.13554446399211884, 0.1518697738647461, 0.16819506883621216, 0.18452036380767822, 0.20084567368030548, 0.21717096865177155, 0.2334962785243988, 0.24982157349586487, 0.26614686846733093, 0.282472163438797, 0.29879748821258545, 0.3151227831840515, 0.3314480781555176, 0.34777337312698364, 0.3640986680984497, 0.38042396306991577, 0.39674925804138184, 0.4130745530128479, 0.42939984798431396, 0.4457251727581024, 0.4620504677295685, 0.47837576270103455, 0.4947010576725006, 0.5110263824462891]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 9.0, 14.0, 12.0, 31.0, 62.0, 129.0, 247.0, 639.0, 2158.0, 9580.0, 107489.0, 3074932.0, 960990.0, 31561.0, 4497.0, 1224.0, 393.0, 173.0, 70.0, 36.0, 21.0, 9.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10400390625, -0.10125160217285156, -0.09849929809570312, -0.09574699401855469, -0.09299468994140625, -0.09024238586425781, -0.08749008178710938, -0.08473777770996094, -0.0819854736328125, -0.07923316955566406, -0.07648086547851562, -0.07372856140136719, -0.07097625732421875, -0.06822395324707031, -0.06547164916992188, -0.06271934509277344, -0.059967041015625, -0.05721473693847656, -0.054462432861328125, -0.05171012878417969, -0.04895782470703125, -0.04620552062988281, -0.043453216552734375, -0.04070091247558594, -0.0379486083984375, -0.03519630432128906, -0.032444000244140625, -0.029691696166992188, -0.02693939208984375, -0.024187088012695312, -0.021434783935546875, -0.018682479858398438, -0.01593017578125, -0.013177871704101562, -0.010425567626953125, -0.0076732635498046875, -0.00492095947265625, -0.0021686553955078125, 0.000583648681640625, 0.0033359527587890625, 0.0060882568359375, 0.008840560913085938, 0.011592864990234375, 0.014345169067382812, 0.01709747314453125, 0.019849777221679688, 0.022602081298828125, 0.025354385375976562, 0.028106689453125, 0.030858993530273438, 0.033611297607421875, 0.03636360168457031, 0.03911590576171875, 0.04186820983886719, 0.044620513916015625, 0.04737281799316406, 0.0501251220703125, 0.05287742614746094, 0.055629730224609375, 0.05838203430175781, 0.06113433837890625, 0.06388664245605469, 0.06663894653320312, 0.06939125061035156, 0.0721435546875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 10.0, 10.0, 14.0, 16.0, 21.0, 20.0, 14.0, 23.0, 26.0, 44.0, 43.0, 52.0, 58.0, 60.0, 59.0, 66.0, 67.0, 61.0, 51.0, 60.0, 34.0, 47.0, 34.0, 28.0, 15.0, 18.0, 14.0, 9.0, 5.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.047271728515625, -0.045889854431152344, -0.04450798034667969, -0.04312610626220703, -0.041744232177734375, -0.04036235809326172, -0.03898048400878906, -0.037598609924316406, -0.03621673583984375, -0.034834861755371094, -0.03345298767089844, -0.03207111358642578, -0.030689239501953125, -0.02930736541748047, -0.027925491333007812, -0.026543617248535156, -0.0251617431640625, -0.023779869079589844, -0.022397994995117188, -0.02101612091064453, -0.019634246826171875, -0.01825237274169922, -0.016870498657226562, -0.015488624572753906, -0.01410675048828125, -0.012724876403808594, -0.011343002319335938, -0.009961128234863281, -0.008579254150390625, -0.007197380065917969, -0.0058155059814453125, -0.004433631896972656, -0.0030517578125, -0.0016698837280273438, -0.0002880096435546875, 0.0010938644409179688, 0.002475738525390625, 0.0038576126098632812, 0.0052394866943359375, 0.006621360778808594, 0.00800323486328125, 0.009385108947753906, 0.010766983032226562, 0.012148857116699219, 0.013530731201171875, 0.014912605285644531, 0.016294479370117188, 0.017676353454589844, 0.0190582275390625, 0.020440101623535156, 0.021821975708007812, 0.02320384979248047, 0.024585723876953125, 0.02596759796142578, 0.027349472045898438, 0.028731346130371094, 0.03011322021484375, 0.031495094299316406, 0.03287696838378906, 0.03425884246826172, 0.035640716552734375, 0.03702259063720703, 0.03840446472167969, 0.039786338806152344, 0.041168212890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 13.0, 16.0, 22.0, 54.0, 77.0, 166.0, 293.0, 676.0, 1743.0, 6396.0, 35368.0, 466974.0, 3451413.0, 199912.0, 23020.0, 5148.0, 1560.0, 671.0, 313.0, 166.0, 95.0, 58.0, 40.0, 15.0, 17.0, 14.0, 8.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.091552734375, -0.08910274505615234, -0.08665275573730469, -0.08420276641845703, -0.08175277709960938, -0.07930278778076172, -0.07685279846191406, -0.0744028091430664, -0.07195281982421875, -0.0695028305053711, -0.06705284118652344, -0.06460285186767578, -0.062152862548828125, -0.05970287322998047, -0.05725288391113281, -0.054802894592285156, -0.0523529052734375, -0.049902915954589844, -0.04745292663574219, -0.04500293731689453, -0.042552947998046875, -0.04010295867919922, -0.03765296936035156, -0.035202980041503906, -0.03275299072265625, -0.030303001403808594, -0.027853012084960938, -0.02540302276611328, -0.022953033447265625, -0.02050304412841797, -0.018053054809570312, -0.015603065490722656, -0.013153076171875, -0.010703086853027344, -0.008253097534179688, -0.005803108215332031, -0.003353118896484375, -0.0009031295776367188, 0.0015468597412109375, 0.003996849060058594, 0.00644683837890625, 0.008896827697753906, 0.011346817016601562, 0.013796806335449219, 0.016246795654296875, 0.01869678497314453, 0.021146774291992188, 0.023596763610839844, 0.0260467529296875, 0.028496742248535156, 0.030946731567382812, 0.03339672088623047, 0.035846710205078125, 0.03829669952392578, 0.04074668884277344, 0.043196678161621094, 0.04564666748046875, 0.048096656799316406, 0.05054664611816406, 0.05299663543701172, 0.055446624755859375, 0.05789661407470703, 0.06034660339355469, 0.06279659271240234, 0.06524658203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 9.0, 12.0, 19.0, 23.0, 48.0, 45.0, 76.0, 147.0, 250.0, 502.0, 786.0, 823.0, 620.0, 295.0, 160.0, 89.0, 51.0, 20.0, 30.0, 15.0, 14.0, 8.0, 5.0, 5.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06378173828125, -0.06101512908935547, -0.05824851989746094, -0.055481910705566406, -0.052715301513671875, -0.049948692321777344, -0.04718208312988281, -0.04441547393798828, -0.04164886474609375, -0.03888225555419922, -0.03611564636230469, -0.033349037170410156, -0.030582427978515625, -0.027815818786621094, -0.025049209594726562, -0.02228260040283203, -0.0195159912109375, -0.01674938201904297, -0.013982772827148438, -0.011216163635253906, -0.008449554443359375, -0.005682945251464844, -0.0029163360595703125, -0.00014972686767578125, 0.00261688232421875, 0.005383491516113281, 0.008150100708007812, 0.010916709899902344, 0.013683319091796875, 0.016449928283691406, 0.019216537475585938, 0.02198314666748047, 0.024749755859375, 0.02751636505126953, 0.030282974243164062, 0.033049583435058594, 0.035816192626953125, 0.038582801818847656, 0.04134941101074219, 0.04411602020263672, 0.04688262939453125, 0.04964923858642578, 0.05241584777832031, 0.055182456970214844, 0.057949066162109375, 0.060715675354003906, 0.06348228454589844, 0.06624889373779297, 0.0690155029296875, 0.07178211212158203, 0.07454872131347656, 0.0773153305053711, 0.08008193969726562, 0.08284854888916016, 0.08561515808105469, 0.08838176727294922, 0.09114837646484375, 0.09391498565673828, 0.09668159484863281, 0.09944820404052734, 0.10221481323242188, 0.1049814224243164, 0.10774803161621094, 0.11051464080810547, 0.11328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 11.0, 15.0, 26.0, 60.0, 94.0, 231.0, 261.0, 162.0, 75.0, 29.0, 14.0, 9.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0696187019348145, -1.0415470600128174, -1.0134752988815308, -0.9854035973548889, -0.9573318958282471, -0.9292601943016052, -0.9011884927749634, -0.8731168508529663, -0.8450450897216797, -0.8169733881950378, -0.788901686668396, -0.7608299851417542, -0.7327582836151123, -0.7046865820884705, -0.6766148805618286, -0.6485432386398315, -0.6204715371131897, -0.5923998355865479, -0.564328134059906, -0.5362564325332642, -0.5081847310066223, -0.48011302947998047, -0.452041357755661, -0.42396965622901917, -0.3958979547023773, -0.3678262531757355, -0.33975455164909363, -0.31168287992477417, -0.2836111783981323, -0.2555394768714905, -0.22746777534484863, -0.1993960738182068, -0.17132437229156494, -0.1432526707649231, -0.11518097668886185, -0.0871092826128006, -0.05903758108615875, -0.030965879559516907, -0.002894192934036255, 0.02517750859260559, 0.053249210119247437, 0.08132091164588928, 0.10939260572195053, 0.13746429979801178, 0.16553600132465363, 0.19360770285129547, 0.22167938947677612, 0.24975109100341797, 0.2778227925300598, 0.30589449405670166, 0.3339661955833435, 0.36203789710998535, 0.3901095986366272, 0.41818130016326904, 0.4462529718875885, 0.47432467341423035, 0.5023963451385498, 0.5304680466651917, 0.5585397481918335, 0.5866114497184753, 0.6146831512451172, 0.642754852771759, 0.6708265542984009, 0.698898196220398, 0.7269699573516846]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 5.0, 3.0, 5.0, 8.0, 8.0, 8.0, 9.0, 14.0, 13.0, 12.0, 19.0, 22.0, 27.0, 27.0, 38.0, 34.0, 42.0, 42.0, 35.0, 42.0, 48.0, 55.0, 49.0, 42.0, 41.0, 41.0, 35.0, 38.0, 38.0, 34.0, 38.0, 24.0, 19.0, 16.0, 10.0, 10.0, 10.0, 10.0, 8.0, 6.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.35849255323410034, -0.34809526801109314, -0.3376980125904083, -0.3273007273674011, -0.3169034421443939, -0.3065061569213867, -0.2961089015007019, -0.2857116162776947, -0.2753143310546875, -0.2649170458316803, -0.2545197904109955, -0.24412250518798828, -0.23372521996498108, -0.22332794964313507, -0.21293067932128906, -0.20253339409828186, -0.19213612377643585, -0.18173885345458984, -0.17134156823158264, -0.16094429790973663, -0.15054701268672943, -0.14014974236488342, -0.12975245714187622, -0.11935518682003021, -0.10895790904760361, -0.098560631275177, -0.0881633535027504, -0.07776607573032379, -0.06736880540847778, -0.05697152391076088, -0.04657424986362457, -0.03617697209119797, -0.025779694318771362, -0.015382417477667332, -0.004985140636563301, 0.005412135273218155, 0.01580941304564476, 0.026206690818071365, 0.03660396486520767, 0.04700124263763428, 0.05739852041006088, 0.06779579818248749, 0.07819307595491409, 0.0885903537273407, 0.0989876240491867, 0.10938490927219391, 0.11978217959403992, 0.13017946481704712, 0.14057673513889313, 0.15097400546073914, 0.16137129068374634, 0.17176856100559235, 0.18216584622859955, 0.19256311655044556, 0.20296040177345276, 0.21335767209529877, 0.22375494241714478, 0.23415221273899078, 0.24454949796199799, 0.254946768283844, 0.2653440535068512, 0.2757413387298584, 0.2861385941505432, 0.2965358793735504, 0.3069331645965576]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 1.0, 16.0, 17.0, 17.0, 29.0, 36.0, 68.0, 102.0, 153.0, 295.0, 535.0, 1160.0, 2718.0, 7814.0, 26202.0, 95782.0, 344369.0, 401334.0, 119833.0, 32652.0, 9424.0, 3189.0, 1336.0, 635.0, 344.0, 177.0, 123.0, 62.0, 45.0, 20.0, 21.0, 7.0, 13.0, 6.0, 3.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.061737060546875, -0.06002616882324219, -0.058315277099609375, -0.05660438537597656, -0.05489349365234375, -0.05318260192871094, -0.051471710205078125, -0.04976081848144531, -0.0480499267578125, -0.04633903503417969, -0.044628143310546875, -0.04291725158691406, -0.04120635986328125, -0.03949546813964844, -0.037784576416015625, -0.03607368469238281, -0.03436279296875, -0.03265190124511719, -0.030941009521484375, -0.029230117797851562, -0.02751922607421875, -0.025808334350585938, -0.024097442626953125, -0.022386550903320312, -0.0206756591796875, -0.018964767456054688, -0.017253875732421875, -0.015542984008789062, -0.01383209228515625, -0.012121200561523438, -0.010410308837890625, -0.008699417114257812, -0.006988525390625, -0.0052776336669921875, -0.003566741943359375, -0.0018558502197265625, -0.00014495849609375, 0.0015659332275390625, 0.003276824951171875, 0.0049877166748046875, 0.0066986083984375, 0.008409500122070312, 0.010120391845703125, 0.011831283569335938, 0.01354217529296875, 0.015253067016601562, 0.016963958740234375, 0.018674850463867188, 0.0203857421875, 0.022096633911132812, 0.023807525634765625, 0.025518417358398438, 0.02722930908203125, 0.028940200805664062, 0.030651092529296875, 0.03236198425292969, 0.0340728759765625, 0.03578376770019531, 0.037494659423828125, 0.03920555114746094, 0.04091644287109375, 0.04262733459472656, 0.044338226318359375, 0.04604911804199219, 0.047760009765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 9.0, 7.0, 10.0, 9.0, 14.0, 28.0, 19.0, 28.0, 43.0, 47.0, 45.0, 68.0, 60.0, 61.0, 78.0, 84.0, 68.0, 66.0, 50.0, 45.0, 34.0, 31.0, 22.0, 23.0, 11.0, 13.0, 10.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.054046630859375, -0.05252408981323242, -0.051001548767089844, -0.049479007720947266, -0.04795646667480469, -0.04643392562866211, -0.04491138458251953, -0.04338884353637695, -0.041866302490234375, -0.0403437614440918, -0.03882122039794922, -0.03729867935180664, -0.03577613830566406, -0.034253597259521484, -0.032731056213378906, -0.031208515167236328, -0.02968597412109375, -0.028163433074951172, -0.026640892028808594, -0.025118350982666016, -0.023595809936523438, -0.02207326889038086, -0.02055072784423828, -0.019028186798095703, -0.017505645751953125, -0.015983104705810547, -0.014460563659667969, -0.01293802261352539, -0.011415481567382812, -0.009892940521240234, -0.008370399475097656, -0.006847858428955078, -0.0053253173828125, -0.003802776336669922, -0.0022802352905273438, -0.0007576942443847656, 0.0007648468017578125, 0.0022873878479003906, 0.0038099288940429688, 0.005332469940185547, 0.006855010986328125, 0.008377552032470703, 0.009900093078613281, 0.01142263412475586, 0.012945175170898438, 0.014467716217041016, 0.015990257263183594, 0.017512798309326172, 0.01903533935546875, 0.020557880401611328, 0.022080421447753906, 0.023602962493896484, 0.025125503540039062, 0.02664804458618164, 0.02817058563232422, 0.029693126678466797, 0.031215667724609375, 0.03273820877075195, 0.03426074981689453, 0.03578329086303711, 0.03730583190917969, 0.038828372955322266, 0.040350914001464844, 0.04187345504760742, 0.04339599609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 12.0, 13.0, 21.0, 30.0, 49.0, 84.0, 117.0, 166.0, 260.0, 477.0, 863.0, 1754.0, 4804.0, 27731.0, 774621.0, 218723.0, 12619.0, 3148.0, 1282.0, 705.0, 407.0, 230.0, 162.0, 87.0, 54.0, 44.0, 21.0, 21.0, 18.0, 9.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1695556640625, -0.1646862030029297, -0.15981674194335938, -0.15494728088378906, -0.15007781982421875, -0.14520835876464844, -0.14033889770507812, -0.1354694366455078, -0.1305999755859375, -0.1257305145263672, -0.12086105346679688, -0.11599159240722656, -0.11112213134765625, -0.10625267028808594, -0.10138320922851562, -0.09651374816894531, -0.091644287109375, -0.08677482604980469, -0.08190536499023438, -0.07703590393066406, -0.07216644287109375, -0.06729698181152344, -0.062427520751953125, -0.05755805969238281, -0.0526885986328125, -0.04781913757324219, -0.042949676513671875, -0.03808021545410156, -0.03321075439453125, -0.028341293334960938, -0.023471832275390625, -0.018602371215820312, -0.01373291015625, -0.008863449096679688, -0.003993988037109375, 0.0008754730224609375, 0.00574493408203125, 0.010614395141601562, 0.015483856201171875, 0.020353317260742188, 0.0252227783203125, 0.030092239379882812, 0.034961700439453125, 0.03983116149902344, 0.04470062255859375, 0.04957008361816406, 0.054439544677734375, 0.05930900573730469, 0.064178466796875, 0.06904792785644531, 0.07391738891601562, 0.07878684997558594, 0.08365631103515625, 0.08852577209472656, 0.09339523315429688, 0.09826469421386719, 0.1031341552734375, 0.10800361633300781, 0.11287307739257812, 0.11774253845214844, 0.12261199951171875, 0.12748146057128906, 0.13235092163085938, 0.1372203826904297, 0.14208984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 6.0, 4.0, 9.0, 10.0, 15.0, 15.0, 16.0, 19.0, 24.0, 23.0, 27.0, 32.0, 53.0, 47.0, 56.0, 37.0, 54.0, 58.0, 55.0, 47.0, 56.0, 55.0, 55.0, 42.0, 30.0, 31.0, 25.0, 26.0, 21.0, 11.0, 9.0, 12.0, 6.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.178955078125, -0.17345619201660156, -0.16795730590820312, -0.1624584197998047, -0.15695953369140625, -0.1514606475830078, -0.14596176147460938, -0.14046287536621094, -0.1349639892578125, -0.12946510314941406, -0.12396621704101562, -0.11846733093261719, -0.11296844482421875, -0.10746955871582031, -0.10197067260742188, -0.09647178649902344, -0.090972900390625, -0.08547401428222656, -0.07997512817382812, -0.07447624206542969, -0.06897735595703125, -0.06347846984863281, -0.057979583740234375, -0.05248069763183594, -0.0469818115234375, -0.04148292541503906, -0.035984039306640625, -0.030485153198242188, -0.02498626708984375, -0.019487380981445312, -0.013988494873046875, -0.008489608764648438, -0.00299072265625, 0.0025081634521484375, 0.008007049560546875, 0.013505935668945312, 0.01900482177734375, 0.024503707885742188, 0.030002593994140625, 0.03550148010253906, 0.0410003662109375, 0.04649925231933594, 0.051998138427734375, 0.05749702453613281, 0.06299591064453125, 0.06849479675292969, 0.07399368286132812, 0.07949256896972656, 0.084991455078125, 0.09049034118652344, 0.09598922729492188, 0.10148811340332031, 0.10698699951171875, 0.11248588562011719, 0.11798477172851562, 0.12348365783691406, 0.1289825439453125, 0.13448143005371094, 0.13998031616210938, 0.1454792022705078, 0.15097808837890625, 0.1564769744873047, 0.16197586059570312, 0.16747474670410156, 0.1729736328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 7.0, 10.0, 11.0, 22.0, 34.0, 31.0, 48.0, 70.0, 103.0, 157.0, 213.0, 343.0, 550.0, 918.0, 1697.0, 3678.0, 9169.0, 27882.0, 119331.0, 694966.0, 139433.0, 31663.0, 9918.0, 3814.0, 1845.0, 977.0, 574.0, 320.0, 238.0, 165.0, 103.0, 59.0, 51.0, 46.0, 43.0, 19.0, 15.0, 7.0, 13.0, 8.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.04107666015625, -0.039852142333984375, -0.03862762451171875, -0.037403106689453125, -0.0361785888671875, -0.034954071044921875, -0.03372955322265625, -0.032505035400390625, -0.031280517578125, -0.030055999755859375, -0.02883148193359375, -0.027606964111328125, -0.0263824462890625, -0.025157928466796875, -0.02393341064453125, -0.022708892822265625, -0.021484375, -0.020259857177734375, -0.01903533935546875, -0.017810821533203125, -0.0165863037109375, -0.015361785888671875, -0.01413726806640625, -0.012912750244140625, -0.011688232421875, -0.010463714599609375, -0.00923919677734375, -0.008014678955078125, -0.0067901611328125, -0.005565643310546875, -0.00434112548828125, -0.003116607666015625, -0.00189208984375, -0.000667572021484375, 0.00055694580078125, 0.001781463623046875, 0.0030059814453125, 0.004230499267578125, 0.00545501708984375, 0.006679534912109375, 0.007904052734375, 0.009128570556640625, 0.01035308837890625, 0.011577606201171875, 0.0128021240234375, 0.014026641845703125, 0.01525115966796875, 0.016475677490234375, 0.0177001953125, 0.018924713134765625, 0.02014923095703125, 0.021373748779296875, 0.0225982666015625, 0.023822784423828125, 0.02504730224609375, 0.026271820068359375, 0.027496337890625, 0.028720855712890625, 0.02994537353515625, 0.031169891357421875, 0.0323944091796875, 0.033618927001953125, 0.03484344482421875, 0.036067962646484375, 0.03729248046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 2.0, 6.0, 9.0, 4.0, 5.0, 5.0, 15.0, 15.0, 17.0, 16.0, 20.0, 37.0, 39.0, 50.0, 75.0, 102.0, 111.0, 106.0, 78.0, 60.0, 39.0, 30.0, 33.0, 22.0, 16.0, 18.0, 15.0, 5.0, 7.0, 10.0, 10.0, 5.0, 5.0, 4.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.40614128112793e-05, -5.222950130701065e-05, -5.0397589802742004e-05, -4.856567829847336e-05, -4.673376679420471e-05, -4.4901855289936066e-05, -4.306994378566742e-05, -4.123803228139877e-05, -3.940612077713013e-05, -3.757420927286148e-05, -3.5742297768592834e-05, -3.391038626432419e-05, -3.207847476005554e-05, -3.0246563255786896e-05, -2.841465175151825e-05, -2.6582740247249603e-05, -2.4750828742980957e-05, -2.291891723871231e-05, -2.1087005734443665e-05, -1.925509423017502e-05, -1.7423182725906372e-05, -1.5591271221637726e-05, -1.375935971736908e-05, -1.1927448213100433e-05, -1.0095536708831787e-05, -8.263625204563141e-06, -6.431713700294495e-06, -4.599802196025848e-06, -2.767890691757202e-06, -9.359791874885559e-07, 8.959323167800903e-07, 2.7278438210487366e-06, 4.559755325317383e-06, 6.391666829586029e-06, 8.223578333854675e-06, 1.0055489838123322e-05, 1.1887401342391968e-05, 1.3719312846660614e-05, 1.555122435092926e-05, 1.7383135855197906e-05, 1.9215047359466553e-05, 2.10469588637352e-05, 2.2878870368003845e-05, 2.471078187227249e-05, 2.6542693376541138e-05, 2.8374604880809784e-05, 3.020651638507843e-05, 3.2038427889347076e-05, 3.387033939361572e-05, 3.570225089788437e-05, 3.7534162402153015e-05, 3.936607390642166e-05, 4.119798541069031e-05, 4.3029896914958954e-05, 4.48618084192276e-05, 4.6693719923496246e-05, 4.852563142776489e-05, 5.035754293203354e-05, 5.2189454436302185e-05, 5.402136594057083e-05, 5.585327744483948e-05, 5.7685188949108124e-05, 5.951710045337677e-05, 6.134901195764542e-05, 6.318092346191406e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 10.0, 8.0, 8.0, 21.0, 21.0, 38.0, 49.0, 76.0, 102.0, 150.0, 204.0, 360.0, 651.0, 1159.0, 2653.0, 7433.0, 28702.0, 214669.0, 716758.0, 55449.0, 12383.0, 3969.0, 1568.0, 819.0, 433.0, 283.0, 180.0, 120.0, 69.0, 61.0, 49.0, 28.0, 14.0, 17.0, 9.0, 11.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052337646484375, -0.05054521560668945, -0.048752784729003906, -0.04696035385131836, -0.04516792297363281, -0.043375492095947266, -0.04158306121826172, -0.03979063034057617, -0.037998199462890625, -0.03620576858520508, -0.03441333770751953, -0.032620906829833984, -0.030828475952148438, -0.02903604507446289, -0.027243614196777344, -0.025451183319091797, -0.02365875244140625, -0.021866321563720703, -0.020073890686035156, -0.01828145980834961, -0.016489028930664062, -0.014696598052978516, -0.012904167175292969, -0.011111736297607422, -0.009319305419921875, -0.007526874542236328, -0.005734443664550781, -0.003942012786865234, -0.0021495819091796875, -0.0003571510314941406, 0.0014352798461914062, 0.003227710723876953, 0.0050201416015625, 0.006812572479248047, 0.008605003356933594, 0.01039743423461914, 0.012189865112304688, 0.013982295989990234, 0.01577472686767578, 0.017567157745361328, 0.019359588623046875, 0.021152019500732422, 0.02294445037841797, 0.024736881256103516, 0.026529312133789062, 0.02832174301147461, 0.030114173889160156, 0.0319066047668457, 0.03369903564453125, 0.0354914665222168, 0.037283897399902344, 0.03907632827758789, 0.04086875915527344, 0.042661190032958984, 0.04445362091064453, 0.04624605178833008, 0.048038482666015625, 0.04983091354370117, 0.05162334442138672, 0.053415775299072266, 0.05520820617675781, 0.05700063705444336, 0.058793067932128906, 0.06058549880981445, 0.0623779296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 14.0, 9.0, 10.0, 13.0, 22.0, 12.0, 30.0, 44.0, 65.0, 109.0, 154.0, 137.0, 101.0, 67.0, 61.0, 36.0, 23.0, 14.0, 19.0, 15.0, 5.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055572509765625, -0.053713321685791016, -0.05185413360595703, -0.04999494552612305, -0.04813575744628906, -0.04627656936645508, -0.044417381286621094, -0.04255819320678711, -0.040699005126953125, -0.03883981704711914, -0.036980628967285156, -0.03512144088745117, -0.03326225280761719, -0.0314030647277832, -0.02954387664794922, -0.027684688568115234, -0.02582550048828125, -0.023966312408447266, -0.02210712432861328, -0.020247936248779297, -0.018388748168945312, -0.016529560089111328, -0.014670372009277344, -0.01281118392944336, -0.010951995849609375, -0.00909280776977539, -0.007233619689941406, -0.005374431610107422, -0.0035152435302734375, -0.0016560554504394531, 0.00020313262939453125, 0.0020623207092285156, 0.0039215087890625, 0.005780696868896484, 0.007639884948730469, 0.009499073028564453, 0.011358261108398438, 0.013217449188232422, 0.015076637268066406, 0.01693582534790039, 0.018795013427734375, 0.02065420150756836, 0.022513389587402344, 0.024372577667236328, 0.026231765747070312, 0.028090953826904297, 0.02995014190673828, 0.031809329986572266, 0.03366851806640625, 0.035527706146240234, 0.03738689422607422, 0.0392460823059082, 0.04110527038574219, 0.04296445846557617, 0.044823646545410156, 0.04668283462524414, 0.048542022705078125, 0.05040121078491211, 0.052260398864746094, 0.05411958694458008, 0.05597877502441406, 0.05783796310424805, 0.05969715118408203, 0.061556339263916016, 0.06341552734375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 5.0, 6.0, 1.0, 3.0, 9.0, 14.0, 30.0, 108.0, 203.0, 326.0, 172.0, 70.0, 27.0, 14.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.3807121515274048, -1.3415590524673462, -1.3024060726165771, -1.2632529735565186, -1.22409987449646, -1.184946894645691, -1.1457937955856323, -1.1066408157348633, -1.0674877166748047, -1.028334617614746, -0.989181637763977, -0.9500285387039185, -0.9108754992485046, -0.8717224597930908, -0.8325693607330322, -0.7934163212776184, -0.7542632818222046, -0.7151102423667908, -0.675957202911377, -0.6368041038513184, -0.5976510643959045, -0.5584980249404907, -0.5193449258804321, -0.4801918864250183, -0.4410388469696045, -0.4018858075141907, -0.36273273825645447, -0.32357966899871826, -0.28442662954330444, -0.24527357518672943, -0.20612052083015442, -0.1669674515724182, -0.12781453132629395, -0.08866147696971893, -0.04950842261314392, -0.010355368256568909, 0.028797686100006104, 0.06795074045658112, 0.10710379481315613, 0.14625686407089233, 0.18540990352630615, 0.22456295788288116, 0.2637160122394562, 0.3028690814971924, 0.3420221209526062, 0.38117516040802, 0.4203282296657562, 0.45948129892349243, 0.49863433837890625, 0.5377873778343201, 0.5769404172897339, 0.6160935163497925, 0.6552465558052063, 0.6943995952606201, 0.7335526943206787, 0.7727057337760925, 0.8118587732315063, 0.8510118126869202, 0.890164852142334, 0.9293179512023926, 0.9684709906578064, 1.0076240301132202, 1.0467771291732788, 1.0859301090240479, 1.1250832080841064]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 13.0, 14.0, 12.0, 9.0, 10.0, 13.0, 17.0, 24.0, 31.0, 28.0, 31.0, 39.0, 33.0, 45.0, 53.0, 43.0, 60.0, 77.0, 39.0, 34.0, 47.0, 42.0, 31.0, 29.0, 32.0, 17.0, 24.0, 11.0, 21.0, 19.0, 18.0, 18.0, 16.0, 10.0, 6.0, 9.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48582279682159424, -0.4690149128437042, -0.4522070288658142, -0.4353991746902466, -0.41859129071235657, -0.40178340673446655, -0.3849755525588989, -0.3681676685810089, -0.3513597846031189, -0.3345519006252289, -0.31774401664733887, -0.30093616247177124, -0.2841282784938812, -0.2673203945159912, -0.2505125403404236, -0.23370465636253357, -0.21689677238464355, -0.20008888840675354, -0.18328101933002472, -0.1664731502532959, -0.14966526627540588, -0.13285738229751587, -0.11604951322078705, -0.09924163669347763, -0.08243376016616821, -0.0656258836388588, -0.04881800711154938, -0.03201013058423996, -0.015202254056930542, 0.0016056224703788757, 0.018413498997688293, 0.03522137552499771, 0.052029192447662354, 0.06883706897497177, 0.08564494550228119, 0.1024528220295906, 0.11926069855690002, 0.13606858253479004, 0.15287645161151886, 0.16968432068824768, 0.1864922046661377, 0.2033000886440277, 0.22010795772075653, 0.23691582679748535, 0.25372371077537537, 0.2705315947532654, 0.287339448928833, 0.304147332906723, 0.32095521688461304, 0.33776310086250305, 0.35457098484039307, 0.3713788390159607, 0.3881867229938507, 0.4049946069717407, 0.42180246114730835, 0.43861034512519836, 0.4554182291030884, 0.4722261130809784, 0.4890339970588684, 0.505841851234436, 0.5226497650146484, 0.5394576191902161, 0.5562654733657837, 0.5730733871459961, 0.5898812413215637]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 13.0, 8.0, 8.0, 12.0, 21.0, 23.0, 38.0, 47.0, 83.0, 75.0, 173.0, 280.0, 451.0, 775.0, 1679.0, 3848.0, 11021.0, 41852.0, 248251.0, 1876117.0, 1732844.0, 223226.0, 36094.0, 10286.0, 3647.0, 1526.0, 720.0, 427.0, 257.0, 138.0, 88.0, 56.0, 51.0, 43.0, 21.0, 21.0, 11.0, 11.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0496826171875, -0.048175811767578125, -0.04666900634765625, -0.045162200927734375, -0.0436553955078125, -0.042148590087890625, -0.04064178466796875, -0.039134979248046875, -0.037628173828125, -0.036121368408203125, -0.03461456298828125, -0.033107757568359375, -0.0316009521484375, -0.030094146728515625, -0.02858734130859375, -0.027080535888671875, -0.02557373046875, -0.024066925048828125, -0.02256011962890625, -0.021053314208984375, -0.0195465087890625, -0.018039703369140625, -0.01653289794921875, -0.015026092529296875, -0.013519287109375, -0.012012481689453125, -0.01050567626953125, -0.008998870849609375, -0.0074920654296875, -0.005985260009765625, -0.00447845458984375, -0.002971649169921875, -0.00146484375, 4.1961669921875e-05, 0.00154876708984375, 0.003055572509765625, 0.0045623779296875, 0.006069183349609375, 0.00757598876953125, 0.009082794189453125, 0.010589599609375, 0.012096405029296875, 0.01360321044921875, 0.015110015869140625, 0.0166168212890625, 0.018123626708984375, 0.01963043212890625, 0.021137237548828125, 0.02264404296875, 0.024150848388671875, 0.02565765380859375, 0.027164459228515625, 0.0286712646484375, 0.030178070068359375, 0.03168487548828125, 0.033191680908203125, 0.034698486328125, 0.036205291748046875, 0.03771209716796875, 0.039218902587890625, 0.0407257080078125, 0.042232513427734375, 0.04373931884765625, 0.045246124267578125, 0.0467529296875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 13.0, 15.0, 16.0, 29.0, 34.0, 51.0, 53.0, 57.0, 69.0, 67.0, 82.0, 88.0, 78.0, 70.0, 59.0, 54.0, 36.0, 39.0, 31.0, 15.0, 11.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.06878662109375, -0.06701517105102539, -0.06524372100830078, -0.06347227096557617, -0.06170082092285156, -0.05992937088012695, -0.058157920837402344, -0.056386470794677734, -0.054615020751953125, -0.052843570709228516, -0.051072120666503906, -0.0493006706237793, -0.04752922058105469, -0.04575777053833008, -0.04398632049560547, -0.04221487045288086, -0.04044342041015625, -0.03867197036743164, -0.03690052032470703, -0.03512907028198242, -0.03335762023925781, -0.0315861701965332, -0.029814720153808594, -0.028043270111083984, -0.026271820068359375, -0.024500370025634766, -0.022728919982910156, -0.020957469940185547, -0.019186019897460938, -0.017414569854736328, -0.01564311981201172, -0.01387166976928711, -0.0121002197265625, -0.01032876968383789, -0.008557319641113281, -0.006785869598388672, -0.0050144195556640625, -0.003242969512939453, -0.0014715194702148438, 0.0002999305725097656, 0.002071380615234375, 0.0038428306579589844, 0.005614280700683594, 0.007385730743408203, 0.009157180786132812, 0.010928630828857422, 0.012700080871582031, 0.01447153091430664, 0.01624298095703125, 0.01801443099975586, 0.01978588104248047, 0.021557331085205078, 0.023328781127929688, 0.025100231170654297, 0.026871681213378906, 0.028643131256103516, 0.030414581298828125, 0.032186031341552734, 0.033957481384277344, 0.03572893142700195, 0.03750038146972656, 0.03927183151245117, 0.04104328155517578, 0.04281473159790039, 0.044586181640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 9.0, 22.0, 28.0, 55.0, 94.0, 173.0, 582.0, 3737.0, 2515251.0, 1668503.0, 4323.0, 678.0, 291.0, 178.0, 132.0, 67.0, 57.0, 44.0, 22.0, 16.0, 9.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267578125, -0.2597026824951172, -0.2518272399902344, -0.24395179748535156, -0.23607635498046875, -0.22820091247558594, -0.22032546997070312, -0.2124500274658203, -0.2045745849609375, -0.1966991424560547, -0.18882369995117188, -0.18094825744628906, -0.17307281494140625, -0.16519737243652344, -0.15732192993164062, -0.1494464874267578, -0.141571044921875, -0.1336956024169922, -0.12582015991210938, -0.11794471740722656, -0.11006927490234375, -0.10219383239746094, -0.09431838989257812, -0.08644294738769531, -0.0785675048828125, -0.07069206237792969, -0.06281661987304688, -0.05494117736816406, -0.04706573486328125, -0.03919029235839844, -0.031314849853515625, -0.023439407348632812, -0.01556396484375, -0.0076885223388671875, 0.000186920166015625, 0.008062362670898438, 0.01593780517578125, 0.023813247680664062, 0.031688690185546875, 0.03956413269042969, 0.0474395751953125, 0.05531501770019531, 0.06319046020507812, 0.07106590270996094, 0.07894134521484375, 0.08681678771972656, 0.09469223022460938, 0.10256767272949219, 0.110443115234375, 0.11831855773925781, 0.12619400024414062, 0.13406944274902344, 0.14194488525390625, 0.14982032775878906, 0.15769577026367188, 0.1655712127685547, 0.1734466552734375, 0.1813220977783203, 0.18919754028320312, 0.19707298278808594, 0.20494842529296875, 0.21282386779785156, 0.22069931030273438, 0.2285747528076172, 0.2364501953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 8.0, 7.0, 13.0, 18.0, 23.0, 58.0, 178.0, 563.0, 1159.0, 1183.0, 490.0, 181.0, 100.0, 34.0, 27.0, 12.0, 11.0, 5.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0513916015625, -0.046688079833984375, -0.04198455810546875, -0.037281036376953125, -0.0325775146484375, -0.027873992919921875, -0.02317047119140625, -0.018466949462890625, -0.013763427734375, -0.009059906005859375, -0.00435638427734375, 0.000347137451171875, 0.0050506591796875, 0.009754180908203125, 0.01445770263671875, 0.019161224365234375, 0.02386474609375, 0.028568267822265625, 0.03327178955078125, 0.037975311279296875, 0.0426788330078125, 0.047382354736328125, 0.05208587646484375, 0.056789398193359375, 0.061492919921875, 0.06619644165039062, 0.07089996337890625, 0.07560348510742188, 0.0803070068359375, 0.08501052856445312, 0.08971405029296875, 0.09441757202148438, 0.09912109375, 0.10382461547851562, 0.10852813720703125, 0.11323165893554688, 0.1179351806640625, 0.12263870239257812, 0.12734222412109375, 0.13204574584960938, 0.136749267578125, 0.14145278930664062, 0.14615631103515625, 0.15085983276367188, 0.1555633544921875, 0.16026687622070312, 0.16497039794921875, 0.16967391967773438, 0.17437744140625, 0.17908096313476562, 0.18378448486328125, 0.18848800659179688, 0.1931915283203125, 0.19789505004882812, 0.20259857177734375, 0.20730209350585938, 0.212005615234375, 0.21670913696289062, 0.22141265869140625, 0.22611618041992188, 0.2308197021484375, 0.23552322387695312, 0.24022674560546875, 0.24493026733398438, 0.2496337890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 9.0, 12.0, 29.0, 102.0, 269.0, 291.0, 160.0, 56.0, 30.0, 18.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4173469543457031, -1.3728350400924683, -1.3283231258392334, -1.2838112115859985, -1.2392992973327637, -1.1947872638702393, -1.1502753496170044, -1.1057634353637695, -1.0612515211105347, -1.0167396068572998, -0.9722276926040649, -0.9277157187461853, -0.8832038044929504, -0.8386918902397156, -0.7941799163818359, -0.7496680021286011, -0.7051560878753662, -0.6606441736221313, -0.6161322593688965, -0.5716202855110168, -0.527108371257782, -0.4825964570045471, -0.43808451294898987, -0.3935725688934326, -0.34906065464019775, -0.3045487403869629, -0.26003679633140564, -0.21552486717700958, -0.17101293802261353, -0.12650100886821747, -0.08198907971382141, -0.03747713565826416, 0.007034778594970703, 0.05154670774936676, 0.09605863690376282, 0.14057056605815887, 0.18508249521255493, 0.229594424366951, 0.27410635352134705, 0.3186182975769043, 0.36313021183013916, 0.407642126083374, 0.4521540701389313, 0.4966660141944885, 0.5411779284477234, 0.5856898427009583, 0.6302018165588379, 0.6747137308120728, 0.7192256450653076, 0.7637375593185425, 0.8082494735717773, 0.852761447429657, 0.8972733616828918, 0.9417852759361267, 0.9862972497940063, 1.0308091640472412, 1.075321078300476, 1.119832992553711, 1.1643449068069458, 1.2088568210601807, 1.253368854522705, 1.29788076877594, 1.3423926830291748, 1.3869045972824097, 1.4314165115356445]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 8.0, 3.0, 11.0, 11.0, 6.0, 10.0, 21.0, 38.0, 30.0, 45.0, 47.0, 32.0, 56.0, 48.0, 47.0, 48.0, 58.0, 44.0, 42.0, 34.0, 47.0, 46.0, 37.0, 40.0, 22.0, 30.0, 17.0, 24.0, 20.0, 12.0, 7.0, 13.0, 12.0, 2.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5206177830696106, -0.5041826963424683, -0.48774755001068115, -0.47131243348121643, -0.4548773169517517, -0.4384422302246094, -0.42200711369514465, -0.40557199716567993, -0.3891368806362152, -0.3727017641067505, -0.35626664757728577, -0.33983153104782104, -0.3233964443206787, -0.3069612979888916, -0.29052621126174927, -0.27409109473228455, -0.2576559782028198, -0.2412208616733551, -0.22478574514389038, -0.20835064351558685, -0.19191552698612213, -0.1754804104566574, -0.15904530882835388, -0.14261019229888916, -0.12617507576942444, -0.10973995923995972, -0.09330485016107559, -0.07686974108219147, -0.060434624552726746, -0.043999508023262024, -0.0275643989443779, -0.011129289865493774, 0.005305886268615723, 0.021740999072790146, 0.03817611187696457, 0.05461122468113899, 0.07104633748531342, 0.08748145401477814, 0.10391656309366226, 0.12035167217254639, 0.1367867887020111, 0.15322190523147583, 0.16965702176094055, 0.18609212338924408, 0.2025272399187088, 0.21896235644817352, 0.23539745807647705, 0.2518325746059418, 0.2682676911354065, 0.2847028076648712, 0.30113792419433594, 0.31757304072380066, 0.3340081572532654, 0.3504432439804077, 0.36687836050987244, 0.38331347703933716, 0.3997485935688019, 0.4161837100982666, 0.4326188266277313, 0.44905394315719604, 0.4654890298843384, 0.4819241762161255, 0.4983592629432678, 0.5147943496704102, 0.5312294960021973]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 9.0, 5.0, 16.0, 18.0, 26.0, 42.0, 64.0, 118.0, 165.0, 329.0, 675.0, 1415.0, 3672.0, 11053.0, 39606.0, 198435.0, 586923.0, 157411.0, 33206.0, 9407.0, 3317.0, 1259.0, 602.0, 268.0, 142.0, 98.0, 80.0, 53.0, 35.0, 18.0, 19.0, 11.0, 12.0, 4.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09033203125, -0.0877828598022461, -0.08523368835449219, -0.08268451690673828, -0.08013534545898438, -0.07758617401123047, -0.07503700256347656, -0.07248783111572266, -0.06993865966796875, -0.06738948822021484, -0.06484031677246094, -0.06229114532470703, -0.059741973876953125, -0.05719280242919922, -0.05464363098144531, -0.052094459533691406, -0.0495452880859375, -0.046996116638183594, -0.04444694519042969, -0.04189777374267578, -0.039348602294921875, -0.03679943084716797, -0.03425025939941406, -0.031701087951660156, -0.02915191650390625, -0.026602745056152344, -0.024053573608398438, -0.02150440216064453, -0.018955230712890625, -0.01640605926513672, -0.013856887817382812, -0.011307716369628906, -0.008758544921875, -0.006209373474121094, -0.0036602020263671875, -0.0011110305786132812, 0.001438140869140625, 0.003987312316894531, 0.0065364837646484375, 0.009085655212402344, 0.01163482666015625, 0.014183998107910156, 0.016733169555664062, 0.01928234100341797, 0.021831512451171875, 0.02438068389892578, 0.026929855346679688, 0.029479026794433594, 0.0320281982421875, 0.034577369689941406, 0.03712654113769531, 0.03967571258544922, 0.042224884033203125, 0.04477405548095703, 0.04732322692871094, 0.049872398376464844, 0.05242156982421875, 0.054970741271972656, 0.05751991271972656, 0.06006908416748047, 0.06261825561523438, 0.06516742706298828, 0.06771659851074219, 0.0702657699584961, 0.07281494140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 4.0, 13.0, 12.0, 17.0, 24.0, 35.0, 32.0, 38.0, 56.0, 73.0, 49.0, 64.0, 58.0, 65.0, 65.0, 59.0, 59.0, 52.0, 65.0, 32.0, 28.0, 20.0, 21.0, 12.0, 16.0, 7.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056182861328125, -0.05454206466674805, -0.052901268005371094, -0.05126047134399414, -0.04961967468261719, -0.047978878021240234, -0.04633808135986328, -0.04469728469848633, -0.043056488037109375, -0.04141569137573242, -0.03977489471435547, -0.038134098052978516, -0.03649330139160156, -0.03485250473022461, -0.033211708068847656, -0.0315709114074707, -0.02993011474609375, -0.028289318084716797, -0.026648521423339844, -0.02500772476196289, -0.023366928100585938, -0.021726131439208984, -0.02008533477783203, -0.018444538116455078, -0.016803741455078125, -0.015162944793701172, -0.013522148132324219, -0.011881351470947266, -0.010240554809570312, -0.00859975814819336, -0.006958961486816406, -0.005318164825439453, -0.0036773681640625, -0.002036571502685547, -0.00039577484130859375, 0.0012450218200683594, 0.0028858184814453125, 0.004526615142822266, 0.006167411804199219, 0.007808208465576172, 0.009449005126953125, 0.011089801788330078, 0.012730598449707031, 0.014371395111083984, 0.016012191772460938, 0.01765298843383789, 0.019293785095214844, 0.020934581756591797, 0.02257537841796875, 0.024216175079345703, 0.025856971740722656, 0.02749776840209961, 0.029138565063476562, 0.030779361724853516, 0.03242015838623047, 0.03406095504760742, 0.035701751708984375, 0.03734254837036133, 0.03898334503173828, 0.040624141693115234, 0.04226493835449219, 0.04390573501586914, 0.045546531677246094, 0.04718732833862305, 0.048828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 12.0, 10.0, 25.0, 24.0, 37.0, 69.0, 85.0, 162.0, 282.0, 461.0, 765.0, 1606.0, 4091.0, 17494.0, 284704.0, 703355.0, 26029.0, 5148.0, 1897.0, 950.0, 465.0, 281.0, 191.0, 118.0, 81.0, 45.0, 40.0, 37.0, 27.0, 15.0, 8.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.2386474609375, -0.2325439453125, -0.2264404296875, -0.2203369140625, -0.2142333984375, -0.2081298828125, -0.2020263671875, -0.1959228515625, -0.1898193359375, -0.1837158203125, -0.1776123046875, -0.1715087890625, -0.1654052734375, -0.1593017578125, -0.1531982421875, -0.1470947265625, -0.1409912109375, -0.1348876953125, -0.1287841796875, -0.1226806640625, -0.1165771484375, -0.1104736328125, -0.1043701171875, -0.0982666015625, -0.0921630859375, -0.0860595703125, -0.0799560546875, -0.0738525390625, -0.0677490234375, -0.0616455078125, -0.0555419921875, -0.0494384765625, -0.0433349609375, -0.0372314453125, -0.0311279296875, -0.0250244140625, -0.0189208984375, -0.0128173828125, -0.0067138671875, -0.0006103515625, 0.0054931640625, 0.0115966796875, 0.0177001953125, 0.0238037109375, 0.0299072265625, 0.0360107421875, 0.0421142578125, 0.0482177734375, 0.0543212890625, 0.0604248046875, 0.0665283203125, 0.0726318359375, 0.0787353515625, 0.0848388671875, 0.0909423828125, 0.0970458984375, 0.1031494140625, 0.1092529296875, 0.1153564453125, 0.1214599609375, 0.1275634765625, 0.1336669921875, 0.1397705078125, 0.1458740234375, 0.1519775390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 11.0, 7.0, 9.0, 8.0, 15.0, 26.0, 19.0, 25.0, 23.0, 34.0, 32.0, 25.0, 48.0, 50.0, 52.0, 38.0, 51.0, 54.0, 46.0, 55.0, 44.0, 37.0, 33.0, 30.0, 24.0, 22.0, 22.0, 31.0, 16.0, 17.0, 12.0, 12.0, 13.0, 5.0, 6.0, 5.0, 2.0, 7.0, 8.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.14929962158203125, -0.1443023681640625, -0.13930511474609375, -0.134307861328125, -0.12931060791015625, -0.1243133544921875, -0.11931610107421875, -0.11431884765625, -0.10932159423828125, -0.1043243408203125, -0.09932708740234375, -0.094329833984375, -0.08933258056640625, -0.0843353271484375, -0.07933807373046875, -0.0743408203125, -0.06934356689453125, -0.0643463134765625, -0.05934906005859375, -0.054351806640625, -0.04935455322265625, -0.0443572998046875, -0.03936004638671875, -0.03436279296875, -0.02936553955078125, -0.0243682861328125, -0.01937103271484375, -0.014373779296875, -0.00937652587890625, -0.0043792724609375, 0.00061798095703125, 0.005615234375, 0.01061248779296875, 0.0156097412109375, 0.02060699462890625, 0.025604248046875, 0.03060150146484375, 0.0355987548828125, 0.04059600830078125, 0.04559326171875, 0.05059051513671875, 0.0555877685546875, 0.06058502197265625, 0.065582275390625, 0.07057952880859375, 0.0755767822265625, 0.08057403564453125, 0.0855712890625, 0.09056854248046875, 0.0955657958984375, 0.10056304931640625, 0.105560302734375, 0.11055755615234375, 0.1155548095703125, 0.12055206298828125, 0.12554931640625, 0.13054656982421875, 0.1355438232421875, 0.14054107666015625, 0.145538330078125, 0.15053558349609375, 0.1555328369140625, 0.16053009033203125, 0.16552734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 7.0, 7.0, 10.0, 13.0, 18.0, 24.0, 30.0, 42.0, 66.0, 104.0, 170.0, 293.0, 536.0, 1246.0, 3565.0, 15010.0, 104858.0, 827944.0, 76903.0, 12339.0, 3042.0, 1114.0, 482.0, 270.0, 150.0, 83.0, 59.0, 41.0, 32.0, 19.0, 20.0, 11.0, 8.0, 3.0, 5.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.08160400390625, -0.07923412322998047, -0.07686424255371094, -0.0744943618774414, -0.07212448120117188, -0.06975460052490234, -0.06738471984863281, -0.06501483917236328, -0.06264495849609375, -0.06027507781982422, -0.05790519714355469, -0.055535316467285156, -0.053165435791015625, -0.050795555114746094, -0.04842567443847656, -0.04605579376220703, -0.0436859130859375, -0.04131603240966797, -0.03894615173339844, -0.036576271057128906, -0.034206390380859375, -0.031836509704589844, -0.029466629028320312, -0.02709674835205078, -0.02472686767578125, -0.02235698699951172, -0.019987106323242188, -0.017617225646972656, -0.015247344970703125, -0.012877464294433594, -0.010507583618164062, -0.008137702941894531, -0.005767822265625, -0.0033979415893554688, -0.0010280609130859375, 0.0013418197631835938, 0.003711700439453125, 0.006081581115722656, 0.008451461791992188, 0.010821342468261719, 0.01319122314453125, 0.015561103820800781, 0.017930984497070312, 0.020300865173339844, 0.022670745849609375, 0.025040626525878906, 0.027410507202148438, 0.02978038787841797, 0.0321502685546875, 0.03452014923095703, 0.03689002990722656, 0.039259910583496094, 0.041629791259765625, 0.043999671936035156, 0.04636955261230469, 0.04873943328857422, 0.05110931396484375, 0.05347919464111328, 0.05584907531738281, 0.058218955993652344, 0.060588836669921875, 0.0629587173461914, 0.06532859802246094, 0.06769847869873047, 0.070068359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 9.0, 9.0, 10.0, 9.0, 14.0, 26.0, 38.0, 42.0, 60.0, 84.0, 73.0, 95.0, 89.0, 91.0, 55.0, 57.0, 45.0, 39.0, 32.0, 21.0, 29.0, 16.0, 8.0, 6.0, 4.0, 7.0, 7.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.310773849487305e-05, -5.144532769918442e-05, -4.978291690349579e-05, -4.812050610780716e-05, -4.645809531211853e-05, -4.47956845164299e-05, -4.313327372074127e-05, -4.147086292505264e-05, -3.9808452129364014e-05, -3.8146041333675385e-05, -3.6483630537986755e-05, -3.4821219742298126e-05, -3.31588089466095e-05, -3.149639815092087e-05, -2.983398735523224e-05, -2.817157655954361e-05, -2.650916576385498e-05, -2.484675496816635e-05, -2.3184344172477722e-05, -2.1521933376789093e-05, -1.9859522581100464e-05, -1.8197111785411835e-05, -1.6534700989723206e-05, -1.4872290194034576e-05, -1.3209879398345947e-05, -1.1547468602657318e-05, -9.885057806968689e-06, -8.22264701128006e-06, -6.560236215591431e-06, -4.8978254199028015e-06, -3.2354146242141724e-06, -1.5730038285255432e-06, 8.940696716308594e-08, 1.751817762851715e-06, 3.4142285585403442e-06, 5.076639354228973e-06, 6.7390501499176025e-06, 8.401460945606232e-06, 1.006387174129486e-05, 1.172628253698349e-05, 1.3388693332672119e-05, 1.5051104128360748e-05, 1.6713514924049377e-05, 1.8375925719738007e-05, 2.0038336515426636e-05, 2.1700747311115265e-05, 2.3363158106803894e-05, 2.5025568902492523e-05, 2.6687979698181152e-05, 2.835039049386978e-05, 3.001280128955841e-05, 3.167521208524704e-05, 3.333762288093567e-05, 3.50000336766243e-05, 3.666244447231293e-05, 3.8324855268001556e-05, 3.9987266063690186e-05, 4.1649676859378815e-05, 4.3312087655067444e-05, 4.497449845075607e-05, 4.66369092464447e-05, 4.829932004213333e-05, 4.996173083782196e-05, 5.162414163351059e-05, 5.328655242919922e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 10.0, 4.0, 8.0, 18.0, 17.0, 26.0, 16.0, 42.0, 47.0, 72.0, 88.0, 134.0, 164.0, 246.0, 407.0, 620.0, 1077.0, 2237.0, 5223.0, 16291.0, 65378.0, 608807.0, 280475.0, 46171.0, 12397.0, 4134.0, 1828.0, 919.0, 548.0, 356.0, 237.0, 137.0, 109.0, 68.0, 59.0, 49.0, 31.0, 29.0, 21.0, 13.0, 14.0, 9.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04962158203125, -0.048065185546875, -0.0465087890625, -0.044952392578125, -0.04339599609375, -0.041839599609375, -0.040283203125, -0.038726806640625, -0.03717041015625, -0.035614013671875, -0.0340576171875, -0.032501220703125, -0.03094482421875, -0.029388427734375, -0.02783203125, -0.026275634765625, -0.02471923828125, -0.023162841796875, -0.0216064453125, -0.020050048828125, -0.01849365234375, -0.016937255859375, -0.015380859375, -0.013824462890625, -0.01226806640625, -0.010711669921875, -0.0091552734375, -0.007598876953125, -0.00604248046875, -0.004486083984375, -0.0029296875, -0.001373291015625, 0.00018310546875, 0.001739501953125, 0.0032958984375, 0.004852294921875, 0.00640869140625, 0.007965087890625, 0.009521484375, 0.011077880859375, 0.01263427734375, 0.014190673828125, 0.0157470703125, 0.017303466796875, 0.01885986328125, 0.020416259765625, 0.02197265625, 0.023529052734375, 0.02508544921875, 0.026641845703125, 0.0281982421875, 0.029754638671875, 0.03131103515625, 0.032867431640625, 0.034423828125, 0.035980224609375, 0.03753662109375, 0.039093017578125, 0.0406494140625, 0.042205810546875, 0.04376220703125, 0.045318603515625, 0.046875, 0.048431396484375, 0.04998779296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 0.0, 4.0, 2.0, 3.0, 7.0, 7.0, 7.0, 4.0, 11.0, 17.0, 16.0, 22.0, 16.0, 20.0, 32.0, 43.0, 42.0, 48.0, 80.0, 106.0, 81.0, 71.0, 65.0, 58.0, 42.0, 29.0, 28.0, 17.0, 21.0, 20.0, 12.0, 12.0, 12.0, 5.0, 6.0, 10.0, 7.0, 2.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03961181640625, -0.03842878341674805, -0.037245750427246094, -0.03606271743774414, -0.03487968444824219, -0.033696651458740234, -0.03251361846923828, -0.03133058547973633, -0.030147552490234375, -0.028964519500732422, -0.02778148651123047, -0.026598453521728516, -0.025415420532226562, -0.02423238754272461, -0.023049354553222656, -0.021866321563720703, -0.02068328857421875, -0.019500255584716797, -0.018317222595214844, -0.01713418960571289, -0.015951156616210938, -0.014768123626708984, -0.013585090637207031, -0.012402057647705078, -0.011219024658203125, -0.010035991668701172, -0.008852958679199219, -0.007669925689697266, -0.0064868927001953125, -0.005303859710693359, -0.004120826721191406, -0.002937793731689453, -0.0017547607421875, -0.0005717277526855469, 0.0006113052368164062, 0.0017943382263183594, 0.0029773712158203125, 0.004160404205322266, 0.005343437194824219, 0.006526470184326172, 0.007709503173828125, 0.008892536163330078, 0.010075569152832031, 0.011258602142333984, 0.012441635131835938, 0.01362466812133789, 0.014807701110839844, 0.015990734100341797, 0.01717376708984375, 0.018356800079345703, 0.019539833068847656, 0.02072286605834961, 0.021905899047851562, 0.023088932037353516, 0.02427196502685547, 0.025454998016357422, 0.026638031005859375, 0.027821063995361328, 0.02900409698486328, 0.030187129974365234, 0.03137016296386719, 0.03255319595336914, 0.033736228942871094, 0.03491926193237305, 0.036102294921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 19.0, 37.0, 116.0, 262.0, 336.0, 143.0, 40.0, 12.0, 9.0, 3.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.093743920326233, -1.0464215278625488, -0.99909907579422, -0.9517766237258911, -0.904454231262207, -0.857131838798523, -0.8098093867301941, -0.7624869346618652, -0.7151645421981812, -0.6678421497344971, -0.6205196976661682, -0.5731972455978394, -0.5258748531341553, -0.4785524308681488, -0.43123000860214233, -0.38390758633613586, -0.3365851640701294, -0.2892627418041229, -0.24194031953811646, -0.19461789727210999, -0.14729547500610352, -0.09997305274009705, -0.052650630474090576, -0.0053282082080841064, 0.04199421405792236, 0.08931663632392883, 0.1366390585899353, 0.18396148085594177, 0.23128390312194824, 0.2786063253879547, 0.3259287476539612, 0.37325116991996765, 0.4205735921859741, 0.4678960144519806, 0.5152184367179871, 0.5625408887863159, 0.60986328125, 0.6571856737136841, 0.7045081257820129, 0.7518305778503418, 0.7991529703140259, 0.84647536277771, 0.8937978148460388, 0.9411202669143677, 0.9884426593780518, 1.0357650518417358, 1.08308744430542, 1.1304099559783936, 1.1777323484420776, 1.2250547409057617, 1.2723772525787354, 1.3196996450424194, 1.3670220375061035, 1.4143444299697876, 1.4616668224334717, 1.5089893341064453, 1.5563117265701294, 1.6036341190338135, 1.650956630706787, 1.6982790231704712, 1.7456014156341553, 1.7929238080978394, 1.8402462005615234, 1.887568712234497, 1.9348911046981812]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 8.0, 5.0, 9.0, 10.0, 15.0, 16.0, 14.0, 15.0, 18.0, 16.0, 21.0, 28.0, 27.0, 43.0, 30.0, 31.0, 62.0, 69.0, 84.0, 74.0, 57.0, 47.0, 40.0, 42.0, 37.0, 30.0, 27.0, 22.0, 19.0, 11.0, 16.0, 12.0, 4.0, 8.0, 8.0, 4.0, 3.0, 7.0, 4.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.9035405516624451, -0.8794444799423218, -0.8553484678268433, -0.83125239610672, -0.8071563243865967, -0.7830602526664734, -0.7589642405509949, -0.7348681688308716, -0.7107720971107483, -0.686676025390625, -0.6625800132751465, -0.6384839415550232, -0.6143878698348999, -0.5902917981147766, -0.5661957859992981, -0.5420997142791748, -0.5180037021636963, -0.4939076602458954, -0.4698115885257721, -0.4457155466079712, -0.4216194748878479, -0.397523432970047, -0.3734273910522461, -0.3493313193321228, -0.3252352476119995, -0.3011392056941986, -0.2770431339740753, -0.2529470920562744, -0.22885102033615112, -0.20475497841835022, -0.18065892159938812, -0.15656286478042603, -0.13246679306030273, -0.10837073624134064, -0.08427467942237854, -0.06017863005399704, -0.03608257323503494, -0.011986516416072845, 0.012109532952308655, 0.03620558977127075, 0.06030164659023285, 0.08439770340919495, 0.10849376022815704, 0.13258981704711914, 0.15668585896492004, 0.18078193068504333, 0.20487797260284424, 0.22897402942180634, 0.25307008624076843, 0.27716612815856934, 0.3012621998786926, 0.32535824179649353, 0.3494543135166168, 0.3735503554344177, 0.397646427154541, 0.4217424690723419, 0.4458385109901428, 0.4699345529079437, 0.494030624628067, 0.5181266665458679, 0.5422227382659912, 0.5663188099861145, 0.590414822101593, 0.6145108938217163, 0.6386069655418396]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 9.0, 16.0, 19.0, 40.0, 60.0, 109.0, 185.0, 277.0, 597.0, 1349.0, 3661.0, 14816.0, 125981.0, 2428574.0, 1530216.0, 71970.0, 11290.0, 2867.0, 1103.0, 485.0, 253.0, 133.0, 86.0, 44.0, 31.0, 32.0, 14.0, 14.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0809326171875, -0.07831287384033203, -0.07569313049316406, -0.0730733871459961, -0.07045364379882812, -0.06783390045166016, -0.06521415710449219, -0.06259441375732422, -0.05997467041015625, -0.05735492706298828, -0.05473518371582031, -0.052115440368652344, -0.049495697021484375, -0.046875953674316406, -0.04425621032714844, -0.04163646697998047, -0.0390167236328125, -0.03639698028564453, -0.03377723693847656, -0.031157493591308594, -0.028537750244140625, -0.025918006896972656, -0.023298263549804688, -0.02067852020263672, -0.01805877685546875, -0.015439033508300781, -0.012819290161132812, -0.010199546813964844, -0.007579803466796875, -0.004960060119628906, -0.0023403167724609375, 0.00027942657470703125, 0.002899169921875, 0.005518913269042969, 0.008138656616210938, 0.010758399963378906, 0.013378143310546875, 0.015997886657714844, 0.018617630004882812, 0.02123737335205078, 0.02385711669921875, 0.02647686004638672, 0.029096603393554688, 0.031716346740722656, 0.034336090087890625, 0.036955833435058594, 0.03957557678222656, 0.04219532012939453, 0.0448150634765625, 0.04743480682373047, 0.05005455017089844, 0.052674293518066406, 0.055294036865234375, 0.057913780212402344, 0.06053352355957031, 0.06315326690673828, 0.06577301025390625, 0.06839275360107422, 0.07101249694824219, 0.07363224029541016, 0.07625198364257812, 0.0788717269897461, 0.08149147033691406, 0.08411121368408203, 0.08673095703125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 9.0, 11.0, 15.0, 16.0, 20.0, 26.0, 33.0, 41.0, 52.0, 56.0, 56.0, 74.0, 70.0, 76.0, 73.0, 54.0, 63.0, 44.0, 49.0, 32.0, 41.0, 12.0, 17.0, 15.0, 8.0, 8.0, 9.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.0633544921875, -0.06170082092285156, -0.060047149658203125, -0.05839347839355469, -0.05673980712890625, -0.05508613586425781, -0.053432464599609375, -0.05177879333496094, -0.0501251220703125, -0.04847145080566406, -0.046817779541015625, -0.04516410827636719, -0.04351043701171875, -0.04185676574707031, -0.040203094482421875, -0.03854942321777344, -0.036895751953125, -0.03524208068847656, -0.033588409423828125, -0.03193473815917969, -0.03028106689453125, -0.028627395629882812, -0.026973724365234375, -0.025320053100585938, -0.0236663818359375, -0.022012710571289062, -0.020359039306640625, -0.018705368041992188, -0.01705169677734375, -0.015398025512695312, -0.013744354248046875, -0.012090682983398438, -0.01043701171875, -0.008783340454101562, -0.007129669189453125, -0.0054759979248046875, -0.00382232666015625, -0.0021686553955078125, -0.000514984130859375, 0.0011386871337890625, 0.0027923583984375, 0.0044460296630859375, 0.006099700927734375, 0.0077533721923828125, 0.00940704345703125, 0.011060714721679688, 0.012714385986328125, 0.014368057250976562, 0.016021728515625, 0.017675399780273438, 0.019329071044921875, 0.020982742309570312, 0.02263641357421875, 0.024290084838867188, 0.025943756103515625, 0.027597427368164062, 0.0292510986328125, 0.030904769897460938, 0.032558441162109375, 0.03421211242675781, 0.03586578369140625, 0.03751945495605469, 0.039173126220703125, 0.04082679748535156, 0.04248046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 11.0, 18.0, 26.0, 40.0, 69.0, 145.0, 338.0, 998.0, 5185.0, 1140779.0, 3039155.0, 5605.0, 1039.0, 351.0, 188.0, 126.0, 78.0, 50.0, 33.0, 11.0, 7.0, 6.0, 6.0, 2.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23388671875, -0.22327804565429688, -0.21266937255859375, -0.20206069946289062, -0.1914520263671875, -0.18084335327148438, -0.17023468017578125, -0.15962600708007812, -0.149017333984375, -0.13840866088867188, -0.12779998779296875, -0.11719131469726562, -0.1065826416015625, -0.09597396850585938, -0.08536529541015625, -0.07475662231445312, -0.06414794921875, -0.053539276123046875, -0.04293060302734375, -0.032321929931640625, -0.0217132568359375, -0.011104583740234375, -0.00049591064453125, 0.010112762451171875, 0.020721435546875, 0.031330108642578125, 0.04193878173828125, 0.052547454833984375, 0.0631561279296875, 0.07376480102539062, 0.08437347412109375, 0.09498214721679688, 0.1055908203125, 0.11619949340820312, 0.12680816650390625, 0.13741683959960938, 0.1480255126953125, 0.15863418579101562, 0.16924285888671875, 0.17985153198242188, 0.190460205078125, 0.20106887817382812, 0.21167755126953125, 0.22228622436523438, 0.2328948974609375, 0.24350357055664062, 0.25411224365234375, 0.2647209167480469, 0.27532958984375, 0.2859382629394531, 0.29654693603515625, 0.3071556091308594, 0.3177642822265625, 0.3283729553222656, 0.33898162841796875, 0.3495903015136719, 0.360198974609375, 0.3708076477050781, 0.38141632080078125, 0.3920249938964844, 0.4026336669921875, 0.4132423400878906, 0.42385101318359375, 0.4344596862792969, 0.445068359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 21.0, 35.0, 78.0, 373.0, 1646.0, 1470.0, 305.0, 89.0, 33.0, 10.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152587890625, -0.144073486328125, -0.13555908203125, -0.127044677734375, -0.1185302734375, -0.110015869140625, -0.10150146484375, -0.092987060546875, -0.08447265625, -0.075958251953125, -0.06744384765625, -0.058929443359375, -0.0504150390625, -0.041900634765625, -0.03338623046875, -0.024871826171875, -0.016357421875, -0.007843017578125, 0.00067138671875, 0.009185791015625, 0.0177001953125, 0.026214599609375, 0.03472900390625, 0.043243408203125, 0.0517578125, 0.060272216796875, 0.06878662109375, 0.077301025390625, 0.0858154296875, 0.094329833984375, 0.10284423828125, 0.111358642578125, 0.119873046875, 0.128387451171875, 0.13690185546875, 0.145416259765625, 0.1539306640625, 0.162445068359375, 0.17095947265625, 0.179473876953125, 0.18798828125, 0.196502685546875, 0.20501708984375, 0.213531494140625, 0.2220458984375, 0.230560302734375, 0.23907470703125, 0.247589111328125, 0.256103515625, 0.264617919921875, 0.27313232421875, 0.281646728515625, 0.2901611328125, 0.298675537109375, 0.30718994140625, 0.315704345703125, 0.32421875, 0.332733154296875, 0.34124755859375, 0.349761962890625, 0.3582763671875, 0.366790771484375, 0.37530517578125, 0.383819580078125, 0.392333984375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 4.0, 19.0, 20.0, 94.0, 286.0, 367.0, 137.0, 34.0, 19.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46077299118042, -2.390542507171631, -2.320312261581421, -2.250081777572632, -2.179851531982422, -2.109621047973633, -2.039390802383423, -1.9691603183746338, -1.8989300727844238, -1.8286997079849243, -1.7584693431854248, -1.6882389783859253, -1.6180086135864258, -1.5477782487869263, -1.4775478839874268, -1.4073173999786377, -1.3370870351791382, -1.2668566703796387, -1.1966263055801392, -1.1263959407806396, -1.0561655759811401, -0.9859352111816406, -0.9157047867774963, -0.8454744219779968, -0.7752440571784973, -0.7050136923789978, -0.6347833275794983, -0.564552903175354, -0.4943225681781769, -0.42409220337867737, -0.35386180877685547, -0.28363144397735596, -0.21340107917785645, -0.14317071437835693, -0.07294033467769623, -0.0027099549770355225, 0.06752040982246399, 0.1377507746219635, 0.2079811692237854, 0.2782115340232849, 0.3484418988227844, 0.41867226362228394, 0.48890262842178345, 0.5591330528259277, 0.6293634176254272, 0.6995937824249268, 0.7698241472244263, 0.8400545120239258, 0.9102848768234253, 0.9805152416229248, 1.0507456064224243, 1.1209759712219238, 1.1912063360214233, 1.2614367008209229, 1.331667184829712, 1.4018974304199219, 1.472127914428711, 1.5423582792282104, 1.61258864402771, 1.6828190088272095, 1.753049373626709, 1.8232797384262085, 1.893510103225708, 1.963740587234497, 2.033970832824707]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 5.0, 5.0, 3.0, 10.0, 11.0, 7.0, 7.0, 14.0, 22.0, 24.0, 39.0, 29.0, 37.0, 55.0, 39.0, 43.0, 42.0, 61.0, 59.0, 45.0, 53.0, 46.0, 37.0, 46.0, 32.0, 44.0, 33.0, 26.0, 18.0, 21.0, 22.0, 16.0, 13.0, 5.0, 8.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.49044913053512573, -0.4750463366508484, -0.45964357256889343, -0.4442407786846161, -0.42883798480033875, -0.4134352207183838, -0.39803242683410645, -0.3826296329498291, -0.36722683906555176, -0.3518240451812744, -0.33642128109931946, -0.3210184872150421, -0.30561569333076477, -0.2902129292488098, -0.27481013536453247, -0.2594073414802551, -0.24400457739830017, -0.22860179841518402, -0.21319900453090668, -0.19779622554779053, -0.18239343166351318, -0.16699065268039703, -0.15158787369728088, -0.13618507981300354, -0.12078230082988739, -0.10537951439619064, -0.0899767279624939, -0.07457394897937775, -0.059171162545681, -0.04376837611198425, -0.028365597128868103, -0.012962810695171356, 0.0024399757385253906, 0.017842760309576988, 0.033245544880628586, 0.048648327589035034, 0.06405111402273178, 0.07945390045642853, 0.09485667943954468, 0.11025946587324142, 0.12566225230693817, 0.14106503129005432, 0.15646782517433167, 0.17187060415744781, 0.18727338314056396, 0.2026761770248413, 0.21807895600795746, 0.2334817349910736, 0.24888452887535095, 0.2642873227596283, 0.27969008684158325, 0.2950928807258606, 0.31049567461013794, 0.3258984684944153, 0.34130123257637024, 0.3567040264606476, 0.37210679054260254, 0.3875095844268799, 0.40291234850883484, 0.4183151423931122, 0.4337179362773895, 0.4491207003593445, 0.4645234942436218, 0.47992628812789917, 0.4953290820121765]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 6.0, 6.0, 6.0, 11.0, 18.0, 33.0, 38.0, 45.0, 98.0, 159.0, 268.0, 581.0, 1349.0, 3658.0, 11796.0, 55482.0, 395074.0, 485616.0, 72751.0, 14291.0, 4302.0, 1521.0, 661.0, 306.0, 168.0, 101.0, 64.0, 34.0, 33.0, 20.0, 12.0, 7.0, 7.0, 10.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.09735107421875, -0.09449386596679688, -0.09163665771484375, -0.08877944946289062, -0.0859222412109375, -0.08306503295898438, -0.08020782470703125, -0.07735061645507812, -0.074493408203125, -0.07163619995117188, -0.06877899169921875, -0.06592178344726562, -0.0630645751953125, -0.060207366943359375, -0.05735015869140625, -0.054492950439453125, -0.0516357421875, -0.048778533935546875, -0.04592132568359375, -0.043064117431640625, -0.0402069091796875, -0.037349700927734375, -0.03449249267578125, -0.031635284423828125, -0.028778076171875, -0.025920867919921875, -0.02306365966796875, -0.020206451416015625, -0.0173492431640625, -0.014492034912109375, -0.01163482666015625, -0.008777618408203125, -0.00592041015625, -0.003063201904296875, -0.00020599365234375, 0.002651214599609375, 0.0055084228515625, 0.008365631103515625, 0.01122283935546875, 0.014080047607421875, 0.016937255859375, 0.019794464111328125, 0.02265167236328125, 0.025508880615234375, 0.0283660888671875, 0.031223297119140625, 0.03408050537109375, 0.036937713623046875, 0.039794921875, 0.042652130126953125, 0.04550933837890625, 0.048366546630859375, 0.0512237548828125, 0.054080963134765625, 0.05693817138671875, 0.059795379638671875, 0.062652587890625, 0.06550979614257812, 0.06836700439453125, 0.07122421264648438, 0.0740814208984375, 0.07693862915039062, 0.07979583740234375, 0.08265304565429688, 0.08551025390625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 11.0, 13.0, 19.0, 27.0, 26.0, 31.0, 49.0, 57.0, 56.0, 69.0, 78.0, 75.0, 93.0, 82.0, 57.0, 50.0, 45.0, 30.0, 37.0, 28.0, 19.0, 14.0, 11.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06622314453125, -0.06420040130615234, -0.06217765808105469, -0.06015491485595703, -0.058132171630859375, -0.05610942840576172, -0.05408668518066406, -0.052063941955566406, -0.05004119873046875, -0.048018455505371094, -0.04599571228027344, -0.04397296905517578, -0.041950225830078125, -0.03992748260498047, -0.03790473937988281, -0.035881996154785156, -0.0338592529296875, -0.031836509704589844, -0.029813766479492188, -0.02779102325439453, -0.025768280029296875, -0.02374553680419922, -0.021722793579101562, -0.019700050354003906, -0.01767730712890625, -0.015654563903808594, -0.013631820678710938, -0.011609077453613281, -0.009586334228515625, -0.007563591003417969, -0.0055408477783203125, -0.0035181045532226562, -0.001495361328125, 0.0005273818969726562, 0.0025501251220703125, 0.004572868347167969, 0.006595611572265625, 0.008618354797363281, 0.010641098022460938, 0.012663841247558594, 0.01468658447265625, 0.016709327697753906, 0.018732070922851562, 0.02075481414794922, 0.022777557373046875, 0.02480030059814453, 0.026823043823242188, 0.028845787048339844, 0.0308685302734375, 0.032891273498535156, 0.03491401672363281, 0.03693675994873047, 0.038959503173828125, 0.04098224639892578, 0.04300498962402344, 0.045027732849121094, 0.04705047607421875, 0.049073219299316406, 0.05109596252441406, 0.05311870574951172, 0.055141448974609375, 0.05716419219970703, 0.05918693542480469, 0.061209678649902344, 0.063232421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 11.0, 9.0, 9.0, 25.0, 22.0, 34.0, 58.0, 112.0, 150.0, 256.0, 500.0, 1053.0, 2466.0, 8309.0, 59077.0, 799689.0, 156066.0, 14435.0, 3425.0, 1350.0, 625.0, 292.0, 195.0, 116.0, 72.0, 47.0, 34.0, 19.0, 16.0, 14.0, 8.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1546630859375, -0.14992904663085938, -0.14519500732421875, -0.14046096801757812, -0.1357269287109375, -0.13099288940429688, -0.12625885009765625, -0.12152481079101562, -0.116790771484375, -0.11205673217773438, -0.10732269287109375, -0.10258865356445312, -0.0978546142578125, -0.09312057495117188, -0.08838653564453125, -0.08365249633789062, -0.07891845703125, -0.07418441772460938, -0.06945037841796875, -0.06471633911132812, -0.0599822998046875, -0.055248260498046875, -0.05051422119140625, -0.045780181884765625, -0.041046142578125, -0.036312103271484375, -0.03157806396484375, -0.026844024658203125, -0.0221099853515625, -0.017375946044921875, -0.01264190673828125, -0.007907867431640625, -0.003173828125, 0.001560211181640625, 0.00629425048828125, 0.011028289794921875, 0.0157623291015625, 0.020496368408203125, 0.02523040771484375, 0.029964447021484375, 0.034698486328125, 0.039432525634765625, 0.04416656494140625, 0.048900604248046875, 0.0536346435546875, 0.058368682861328125, 0.06310272216796875, 0.06783676147460938, 0.07257080078125, 0.07730484008789062, 0.08203887939453125, 0.08677291870117188, 0.0915069580078125, 0.09624099731445312, 0.10097503662109375, 0.10570907592773438, 0.110443115234375, 0.11517715454101562, 0.11991119384765625, 0.12464523315429688, 0.1293792724609375, 0.13411331176757812, 0.13884735107421875, 0.14358139038085938, 0.1483154296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 2.0, 9.0, 11.0, 8.0, 11.0, 13.0, 13.0, 25.0, 24.0, 30.0, 50.0, 35.0, 43.0, 62.0, 58.0, 70.0, 64.0, 62.0, 59.0, 52.0, 52.0, 36.0, 43.0, 25.0, 33.0, 24.0, 22.0, 11.0, 11.0, 6.0, 9.0, 8.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2135009765625, -0.20691680908203125, -0.2003326416015625, -0.19374847412109375, -0.187164306640625, -0.18058013916015625, -0.1739959716796875, -0.16741180419921875, -0.16082763671875, -0.15424346923828125, -0.1476593017578125, -0.14107513427734375, -0.134490966796875, -0.12790679931640625, -0.1213226318359375, -0.11473846435546875, -0.108154296875, -0.10157012939453125, -0.0949859619140625, -0.08840179443359375, -0.081817626953125, -0.07523345947265625, -0.0686492919921875, -0.06206512451171875, -0.05548095703125, -0.04889678955078125, -0.0423126220703125, -0.03572845458984375, -0.029144287109375, -0.02256011962890625, -0.0159759521484375, -0.00939178466796875, -0.0028076171875, 0.00377655029296875, 0.0103607177734375, 0.01694488525390625, 0.023529052734375, 0.03011322021484375, 0.0366973876953125, 0.04328155517578125, 0.04986572265625, 0.05644989013671875, 0.0630340576171875, 0.06961822509765625, 0.076202392578125, 0.08278656005859375, 0.0893707275390625, 0.09595489501953125, 0.1025390625, 0.10912322998046875, 0.1157073974609375, 0.12229156494140625, 0.128875732421875, 0.13545989990234375, 0.1420440673828125, 0.14862823486328125, 0.15521240234375, 0.16179656982421875, 0.1683807373046875, 0.17496490478515625, 0.181549072265625, 0.18813323974609375, 0.1947174072265625, 0.20130157470703125, 0.2078857421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 12.0, 18.0, 30.0, 41.0, 84.0, 150.0, 288.0, 666.0, 1479.0, 3880.0, 12314.0, 64888.0, 748894.0, 182436.0, 23181.0, 6200.0, 2167.0, 920.0, 424.0, 208.0, 106.0, 53.0, 43.0, 28.0, 12.0, 7.0, 3.0, 4.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.050384521484375, -0.04849863052368164, -0.04661273956298828, -0.04472684860229492, -0.04284095764160156, -0.0409550666809082, -0.039069175720214844, -0.037183284759521484, -0.035297393798828125, -0.033411502838134766, -0.031525611877441406, -0.029639720916748047, -0.027753829956054688, -0.025867938995361328, -0.02398204803466797, -0.02209615707397461, -0.02021026611328125, -0.01832437515258789, -0.01643848419189453, -0.014552593231201172, -0.012666702270507812, -0.010780811309814453, -0.008894920349121094, -0.007009029388427734, -0.005123138427734375, -0.0032372474670410156, -0.0013513565063476562, 0.0005345344543457031, 0.0024204254150390625, 0.004306316375732422, 0.006192207336425781, 0.00807809829711914, 0.0099639892578125, 0.01184988021850586, 0.013735771179199219, 0.015621662139892578, 0.017507553100585938, 0.019393444061279297, 0.021279335021972656, 0.023165225982666016, 0.025051116943359375, 0.026937007904052734, 0.028822898864746094, 0.030708789825439453, 0.03259468078613281, 0.03448057174682617, 0.03636646270751953, 0.03825235366821289, 0.04013824462890625, 0.04202413558959961, 0.04391002655029297, 0.04579591751098633, 0.04768180847167969, 0.04956769943237305, 0.051453590393066406, 0.053339481353759766, 0.055225372314453125, 0.057111263275146484, 0.058997154235839844, 0.0608830451965332, 0.06276893615722656, 0.06465482711791992, 0.06654071807861328, 0.06842660903930664, 0.0703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 3.0, 12.0, 16.0, 25.0, 27.0, 35.0, 45.0, 70.0, 86.0, 89.0, 108.0, 83.0, 77.0, 66.0, 52.0, 54.0, 37.0, 28.0, 14.0, 17.0, 7.0, 12.0, 7.0, 4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8848648071289062e-05, -2.7623027563095093e-05, -2.6397407054901123e-05, -2.5171786546707153e-05, -2.3946166038513184e-05, -2.2720545530319214e-05, -2.1494925022125244e-05, -2.0269304513931274e-05, -1.9043684005737305e-05, -1.7818063497543335e-05, -1.6592442989349365e-05, -1.5366822481155396e-05, -1.4141201972961426e-05, -1.2915581464767456e-05, -1.1689960956573486e-05, -1.0464340448379517e-05, -9.238719940185547e-06, -8.013099431991577e-06, -6.787478923797607e-06, -5.561858415603638e-06, -4.336237907409668e-06, -3.1106173992156982e-06, -1.8849968910217285e-06, -6.593763828277588e-07, 5.662441253662109e-07, 1.7918646335601807e-06, 3.0174851417541504e-06, 4.24310564994812e-06, 5.46872615814209e-06, 6.6943466663360596e-06, 7.91996717453003e-06, 9.145587682723999e-06, 1.0371208190917969e-05, 1.1596828699111938e-05, 1.2822449207305908e-05, 1.4048069715499878e-05, 1.5273690223693848e-05, 1.6499310731887817e-05, 1.7724931240081787e-05, 1.8950551748275757e-05, 2.0176172256469727e-05, 2.1401792764663696e-05, 2.2627413272857666e-05, 2.3853033781051636e-05, 2.5078654289245605e-05, 2.6304274797439575e-05, 2.7529895305633545e-05, 2.8755515813827515e-05, 2.9981136322021484e-05, 3.1206756830215454e-05, 3.2432377338409424e-05, 3.3657997846603394e-05, 3.488361835479736e-05, 3.610923886299133e-05, 3.73348593711853e-05, 3.856047987937927e-05, 3.978610038757324e-05, 4.101172089576721e-05, 4.223734140396118e-05, 4.346296191215515e-05, 4.468858242034912e-05, 4.591420292854309e-05, 4.713982343673706e-05, 4.836544394493103e-05, 4.9591064453125e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 10.0, 18.0, 39.0, 54.0, 134.0, 333.0, 880.0, 2944.0, 13729.0, 128670.0, 823040.0, 66370.0, 9100.0, 2054.0, 670.0, 248.0, 115.0, 60.0, 37.0, 18.0, 4.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0704345703125, -0.06803703308105469, -0.06563949584960938, -0.06324195861816406, -0.06084442138671875, -0.05844688415527344, -0.056049346923828125, -0.05365180969238281, -0.0512542724609375, -0.04885673522949219, -0.046459197998046875, -0.04406166076660156, -0.04166412353515625, -0.03926658630371094, -0.036869049072265625, -0.03447151184082031, -0.032073974609375, -0.029676437377929688, -0.027278900146484375, -0.024881362915039062, -0.02248382568359375, -0.020086288452148438, -0.017688751220703125, -0.015291213989257812, -0.0128936767578125, -0.010496139526367188, -0.008098602294921875, -0.0057010650634765625, -0.00330352783203125, -0.0009059906005859375, 0.001491546630859375, 0.0038890838623046875, 0.00628662109375, 0.008684158325195312, 0.011081695556640625, 0.013479232788085938, 0.01587677001953125, 0.018274307250976562, 0.020671844482421875, 0.023069381713867188, 0.0254669189453125, 0.027864456176757812, 0.030261993408203125, 0.03265953063964844, 0.03505706787109375, 0.03745460510253906, 0.039852142333984375, 0.04224967956542969, 0.044647216796875, 0.04704475402832031, 0.049442291259765625, 0.05183982849121094, 0.05423736572265625, 0.05663490295410156, 0.059032440185546875, 0.06142997741699219, 0.0638275146484375, 0.06622505187988281, 0.06862258911132812, 0.07102012634277344, 0.07341766357421875, 0.07581520080566406, 0.07821273803710938, 0.08061027526855469, 0.0830078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 8.0, 9.0, 8.0, 17.0, 22.0, 45.0, 64.0, 84.0, 138.0, 149.0, 148.0, 101.0, 57.0, 57.0, 26.0, 23.0, 13.0, 6.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07464599609375, -0.07255744934082031, -0.07046890258789062, -0.06838035583496094, -0.06629180908203125, -0.06420326232910156, -0.062114715576171875, -0.06002616882324219, -0.0579376220703125, -0.05584907531738281, -0.053760528564453125, -0.05167198181152344, -0.04958343505859375, -0.04749488830566406, -0.045406341552734375, -0.04331779479980469, -0.041229248046875, -0.03914070129394531, -0.037052154541015625, -0.03496360778808594, -0.03287506103515625, -0.030786514282226562, -0.028697967529296875, -0.026609420776367188, -0.0245208740234375, -0.022432327270507812, -0.020343780517578125, -0.018255233764648438, -0.01616668701171875, -0.014078140258789062, -0.011989593505859375, -0.009901046752929688, -0.0078125, -0.0057239532470703125, -0.003635406494140625, -0.0015468597412109375, 0.00054168701171875, 0.0026302337646484375, 0.004718780517578125, 0.0068073272705078125, 0.0088958740234375, 0.010984420776367188, 0.013072967529296875, 0.015161514282226562, 0.01725006103515625, 0.019338607788085938, 0.021427154541015625, 0.023515701293945312, 0.025604248046875, 0.027692794799804688, 0.029781341552734375, 0.03186988830566406, 0.03395843505859375, 0.03604698181152344, 0.038135528564453125, 0.04022407531738281, 0.0423126220703125, 0.04440116882324219, 0.046489715576171875, 0.04857826232910156, 0.05066680908203125, 0.05275535583496094, 0.054843902587890625, 0.05693244934082031, 0.05902099609375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 7.0, 5.0, 13.0, 20.0, 57.0, 184.0, 400.0, 204.0, 71.0, 25.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7535669803619385, -1.7015347480773926, -1.6495023965835571, -1.5974701642990112, -1.5454378128051758, -1.4934055805206299, -1.441373348236084, -1.3893409967422485, -1.337308645248413, -1.2852764129638672, -1.2332440614700317, -1.1812118291854858, -1.1291794776916504, -1.0771472454071045, -1.0251150131225586, -0.9730826616287231, -0.9210504293441772, -0.8690181374549866, -0.8169858455657959, -0.76495361328125, -0.7129212617874146, -0.6608890295028687, -0.608856737613678, -0.5568244457244873, -0.5047921538352966, -0.45275986194610596, -0.4007275700569153, -0.348695307970047, -0.2966630160808563, -0.24463072419166565, -0.19259846210479736, -0.1405661702156067, -0.08853387832641602, -0.03650159388780594, 0.015530690550804138, 0.06756296753883362, 0.11959525942802429, 0.17162755131721497, 0.22365981340408325, 0.2756921052932739, 0.3277243971824646, 0.3797566890716553, 0.43178898096084595, 0.48382124304771423, 0.5358535051345825, 0.587885856628418, 0.6399180889129639, 0.6919503808021545, 0.7439826726913452, 0.7960149645805359, 0.8480472564697266, 0.9000794887542725, 0.9521118402481079, 1.0041440725326538, 1.0561764240264893, 1.1082086563110352, 1.160240888595581, 1.212273120880127, 1.2643054723739624, 1.3163377046585083, 1.3683700561523438, 1.4204022884368896, 1.4724345207214355, 1.524466872215271, 1.5764992237091064]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 7.0, 8.0, 7.0, 5.0, 11.0, 6.0, 21.0, 25.0, 16.0, 24.0, 20.0, 29.0, 41.0, 43.0, 40.0, 61.0, 75.0, 97.0, 91.0, 66.0, 38.0, 31.0, 28.0, 28.0, 25.0, 25.0, 19.0, 18.0, 15.0, 13.0, 8.0, 14.0, 10.0, 3.0, 13.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.9341650605201721, -0.9087353944778442, -0.8833057284355164, -0.8578760623931885, -0.8324464559555054, -0.8070167899131775, -0.7815871238708496, -0.7561574578285217, -0.7307277917861938, -0.705298125743866, -0.6798684597015381, -0.654438853263855, -0.6290091872215271, -0.6035795211791992, -0.5781498551368713, -0.5527201890945435, -0.5272905826568604, -0.5018609166145325, -0.476431280374527, -0.4510016143321991, -0.4255719780921936, -0.4001423120498657, -0.37471264600753784, -0.34928297996520996, -0.32385334372520447, -0.2984236776828766, -0.2729940414428711, -0.2475643754005432, -0.22213472425937653, -0.19670507311820984, -0.17127540707588196, -0.14584575593471527, -0.12041610479354858, -0.0949864536523819, -0.06955679506063461, -0.04412713646888733, -0.018697485327720642, 0.006732165813446045, 0.032161831855773926, 0.05759148299694061, 0.0830211341381073, 0.10845078527927399, 0.13388043642044067, 0.15931010246276855, 0.18473975360393524, 0.21016940474510193, 0.2355990707874298, 0.2610287070274353, 0.2864583730697632, 0.31188803911209106, 0.33731767535209656, 0.36274734139442444, 0.38817697763442993, 0.4136066436767578, 0.4390363097190857, 0.4644659757614136, 0.48989561200141907, 0.5153252482414246, 0.5407549142837524, 0.5661845803260803, 0.5916142463684082, 0.6170438528060913, 0.642473578453064, 0.6679031848907471, 0.693332850933075]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 1.0, 4.0, 15.0, 11.0, 14.0, 21.0, 26.0, 53.0, 73.0, 98.0, 139.0, 275.0, 399.0, 716.0, 1356.0, 2883.0, 6704.0, 18750.0, 70382.0, 374234.0, 1803044.0, 1552628.0, 277679.0, 55444.0, 16465.0, 6220.0, 2923.0, 1507.0, 833.0, 501.0, 305.0, 214.0, 104.0, 70.0, 67.0, 38.0, 23.0, 17.0, 14.0, 9.0, 5.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055633544921875, -0.05404090881347656, -0.052448272705078125, -0.05085563659667969, -0.04926300048828125, -0.04767036437988281, -0.046077728271484375, -0.04448509216308594, -0.0428924560546875, -0.04129981994628906, -0.039707183837890625, -0.03811454772949219, -0.03652191162109375, -0.03492927551269531, -0.033336639404296875, -0.03174400329589844, -0.0301513671875, -0.028558731079101562, -0.026966094970703125, -0.025373458862304688, -0.02378082275390625, -0.022188186645507812, -0.020595550537109375, -0.019002914428710938, -0.0174102783203125, -0.015817642211914062, -0.014225006103515625, -0.012632369995117188, -0.01103973388671875, -0.009447097778320312, -0.007854461669921875, -0.0062618255615234375, -0.004669189453125, -0.0030765533447265625, -0.001483917236328125, 0.0001087188720703125, 0.00170135498046875, 0.0032939910888671875, 0.004886627197265625, 0.0064792633056640625, 0.0080718994140625, 0.009664535522460938, 0.011257171630859375, 0.012849807739257812, 0.01444244384765625, 0.016035079956054688, 0.017627716064453125, 0.019220352172851562, 0.02081298828125, 0.022405624389648438, 0.023998260498046875, 0.025590896606445312, 0.02718353271484375, 0.028776168823242188, 0.030368804931640625, 0.03196144104003906, 0.0335540771484375, 0.03514671325683594, 0.036739349365234375, 0.03833198547363281, 0.03992462158203125, 0.04151725769042969, 0.043109893798828125, 0.04470252990722656, 0.046295166015625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 7.0, 5.0, 8.0, 15.0, 10.0, 21.0, 20.0, 28.0, 33.0, 49.0, 40.0, 74.0, 63.0, 67.0, 65.0, 55.0, 86.0, 57.0, 50.0, 44.0, 46.0, 32.0, 33.0, 25.0, 15.0, 19.0, 5.0, 7.0, 5.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067138671875, -0.06526470184326172, -0.06339073181152344, -0.061516761779785156, -0.059642791748046875, -0.057768821716308594, -0.05589485168457031, -0.05402088165283203, -0.05214691162109375, -0.05027294158935547, -0.04839897155761719, -0.046525001525878906, -0.044651031494140625, -0.042777061462402344, -0.04090309143066406, -0.03902912139892578, -0.0371551513671875, -0.03528118133544922, -0.03340721130371094, -0.031533241271972656, -0.029659271240234375, -0.027785301208496094, -0.025911331176757812, -0.02403736114501953, -0.02216339111328125, -0.02028942108154297, -0.018415451049804688, -0.016541481018066406, -0.014667510986328125, -0.012793540954589844, -0.010919570922851562, -0.009045600891113281, -0.007171630859375, -0.005297660827636719, -0.0034236907958984375, -0.0015497207641601562, 0.000324249267578125, 0.0021982192993164062, 0.0040721893310546875, 0.005946159362792969, 0.00782012939453125, 0.009694099426269531, 0.011568069458007812, 0.013442039489746094, 0.015316009521484375, 0.017189979553222656, 0.019063949584960938, 0.02093791961669922, 0.0228118896484375, 0.02468585968017578, 0.026559829711914062, 0.028433799743652344, 0.030307769775390625, 0.032181739807128906, 0.03405570983886719, 0.03592967987060547, 0.03780364990234375, 0.03967761993408203, 0.04155158996582031, 0.043425559997558594, 0.045299530029296875, 0.047173500061035156, 0.04904747009277344, 0.05092144012451172, 0.05279541015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 11.0, 19.0, 34.0, 77.0, 151.0, 367.0, 1459.0, 122610.0, 4065121.0, 3415.0, 572.0, 230.0, 116.0, 50.0, 30.0, 15.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869140625, -0.3936614990234375, -0.378631591796875, -0.3636016845703125, -0.34857177734375, -0.3335418701171875, -0.318511962890625, -0.3034820556640625, -0.2884521484375, -0.2734222412109375, -0.258392333984375, -0.2433624267578125, -0.22833251953125, -0.2133026123046875, -0.198272705078125, -0.1832427978515625, -0.168212890625, -0.1531829833984375, -0.138153076171875, -0.1231231689453125, -0.10809326171875, -0.0930633544921875, -0.078033447265625, -0.0630035400390625, -0.0479736328125, -0.0329437255859375, -0.017913818359375, -0.0028839111328125, 0.01214599609375, 0.0271759033203125, 0.042205810546875, 0.0572357177734375, 0.072265625, 0.0872955322265625, 0.102325439453125, 0.1173553466796875, 0.13238525390625, 0.1474151611328125, 0.162445068359375, 0.1774749755859375, 0.1925048828125, 0.2075347900390625, 0.222564697265625, 0.2375946044921875, 0.25262451171875, 0.2676544189453125, 0.282684326171875, 0.2977142333984375, 0.312744140625, 0.3277740478515625, 0.342803955078125, 0.3578338623046875, 0.37286376953125, 0.3878936767578125, 0.402923583984375, 0.4179534912109375, 0.4329833984375, 0.4480133056640625, 0.463043212890625, 0.4780731201171875, 0.49310302734375, 0.5081329345703125, 0.523162841796875, 0.5381927490234375, 0.55322265625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 27.0, 41.0, 88.0, 181.0, 499.0, 1117.0, 1152.0, 550.0, 212.0, 97.0, 46.0, 21.0, 13.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08795166015625, -0.0820913314819336, -0.07623100280761719, -0.07037067413330078, -0.06451034545898438, -0.05865001678466797, -0.05278968811035156, -0.046929359436035156, -0.04106903076171875, -0.035208702087402344, -0.029348373413085938, -0.02348804473876953, -0.017627716064453125, -0.011767387390136719, -0.0059070587158203125, -4.673004150390625e-05, 0.0058135986328125, 0.011673927307128906, 0.017534255981445312, 0.02339458465576172, 0.029254913330078125, 0.03511524200439453, 0.04097557067871094, 0.046835899353027344, 0.05269622802734375, 0.058556556701660156, 0.06441688537597656, 0.07027721405029297, 0.07613754272460938, 0.08199787139892578, 0.08785820007324219, 0.0937185287475586, 0.099578857421875, 0.1054391860961914, 0.11129951477050781, 0.11715984344482422, 0.12302017211914062, 0.12888050079345703, 0.13474082946777344, 0.14060115814208984, 0.14646148681640625, 0.15232181549072266, 0.15818214416503906, 0.16404247283935547, 0.16990280151367188, 0.17576313018798828, 0.1816234588623047, 0.1874837875366211, 0.1933441162109375, 0.1992044448852539, 0.2050647735595703, 0.21092510223388672, 0.21678543090820312, 0.22264575958251953, 0.22850608825683594, 0.23436641693115234, 0.24022674560546875, 0.24608707427978516, 0.25194740295410156, 0.25780773162841797, 0.2636680603027344, 0.2695283889770508, 0.2753887176513672, 0.2812490463256836, 0.287109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 9.0, 11.0, 24.0, 88.0, 140.0, 230.0, 236.0, 109.0, 72.0, 31.0, 21.0, 11.0, 5.0, 3.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5425498485565186, -1.500517725944519, -1.4584856033325195, -1.4164533615112305, -1.374421238899231, -1.3323891162872314, -1.2903568744659424, -1.2483247518539429, -1.2062926292419434, -1.1642605066299438, -1.1222283840179443, -1.0801961421966553, -1.0381640195846558, -0.9961318969726562, -0.954099714756012, -0.9120675325393677, -0.8700354099273682, -0.8280032873153687, -0.7859711050987244, -0.7439389228820801, -0.7019068002700806, -0.659874677658081, -0.6178424954414368, -0.5758103132247925, -0.533778190612793, -0.49174603819847107, -0.44971388578414917, -0.40768173336982727, -0.36564958095550537, -0.32361742854118347, -0.2815852761268616, -0.23955312371253967, -0.19752085208892822, -0.15548869967460632, -0.11345654726028442, -0.07142439484596252, -0.029392242431640625, 0.012639909982681274, 0.054672062397003174, 0.09670421481132507, 0.13873636722564697, 0.18076851963996887, 0.22280067205429077, 0.26483282446861267, 0.30686497688293457, 0.34889712929725647, 0.39092928171157837, 0.43296143412590027, 0.47499358654022217, 0.5170257091522217, 0.559057891368866, 0.6010900735855103, 0.6431221961975098, 0.6851543188095093, 0.7271865010261536, 0.7692186832427979, 0.8112508058547974, 0.8532829284667969, 0.8953151106834412, 0.9373472929000854, 0.979379415512085, 1.0214115381240845, 1.063443660736084, 1.105475902557373, 1.1475080251693726]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 4.0, 11.0, 5.0, 11.0, 16.0, 23.0, 19.0, 20.0, 28.0, 39.0, 36.0, 34.0, 35.0, 41.0, 41.0, 43.0, 37.0, 53.0, 41.0, 55.0, 38.0, 39.0, 39.0, 40.0, 37.0, 35.0, 28.0, 29.0, 20.0, 29.0, 12.0, 13.0, 9.0, 9.0, 6.0, 8.0, 2.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5444459319114685, -0.5280500650405884, -0.511654257774353, -0.4952584207057953, -0.47886258363723755, -0.4624667465686798, -0.44607090950012207, -0.42967507243156433, -0.4132792353630066, -0.39688339829444885, -0.3804875612258911, -0.3640917241573334, -0.34769588708877563, -0.3313000500202179, -0.31490421295166016, -0.2985083758831024, -0.2821125388145447, -0.26571670174598694, -0.2493208646774292, -0.23292502760887146, -0.21652919054031372, -0.20013335347175598, -0.18373751640319824, -0.1673416793346405, -0.15094584226608276, -0.13455000519752502, -0.11815416812896729, -0.10175833106040955, -0.0853624939918518, -0.06896665692329407, -0.05257081985473633, -0.03617498278617859, -0.019779086112976074, -0.003383249044418335, 0.013012588024139404, 0.029408425092697144, 0.04580426216125488, 0.06220009922981262, 0.07859593629837036, 0.0949917733669281, 0.11138761043548584, 0.12778344750404358, 0.14417928457260132, 0.16057512164115906, 0.1769709587097168, 0.19336679577827454, 0.20976263284683228, 0.22615846991539001, 0.24255430698394775, 0.2589501440525055, 0.27534598112106323, 0.29174181818962097, 0.3081376552581787, 0.32453349232673645, 0.3409293293952942, 0.35732516646385193, 0.37372100353240967, 0.3901168406009674, 0.40651267766952515, 0.4229085147380829, 0.4393043518066406, 0.45570018887519836, 0.4720960259437561, 0.48849186301231384, 0.5048877000808716]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 12.0, 17.0, 15.0, 26.0, 53.0, 83.0, 161.0, 341.0, 777.0, 1869.0, 5025.0, 17155.0, 94435.0, 627418.0, 253148.0, 34467.0, 8409.0, 2875.0, 1186.0, 475.0, 263.0, 121.0, 81.0, 54.0, 29.0, 8.0, 14.0, 15.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11810302734375, -0.11488723754882812, -0.11167144775390625, -0.10845565795898438, -0.1052398681640625, -0.10202407836914062, -0.09880828857421875, -0.09559249877929688, -0.092376708984375, -0.08916091918945312, -0.08594512939453125, -0.08272933959960938, -0.0795135498046875, -0.07629776000976562, -0.07308197021484375, -0.06986618041992188, -0.066650390625, -0.06343460083007812, -0.06021881103515625, -0.057003021240234375, -0.0537872314453125, -0.050571441650390625, -0.04735565185546875, -0.044139862060546875, -0.040924072265625, -0.037708282470703125, -0.03449249267578125, -0.031276702880859375, -0.0280609130859375, -0.024845123291015625, -0.02162933349609375, -0.018413543701171875, -0.01519775390625, -0.011981964111328125, -0.00876617431640625, -0.005550384521484375, -0.0023345947265625, 0.000881195068359375, 0.00409698486328125, 0.007312774658203125, 0.010528564453125, 0.013744354248046875, 0.01696014404296875, 0.020175933837890625, 0.0233917236328125, 0.026607513427734375, 0.02982330322265625, 0.033039093017578125, 0.0362548828125, 0.039470672607421875, 0.04268646240234375, 0.045902252197265625, 0.0491180419921875, 0.052333831787109375, 0.05554962158203125, 0.058765411376953125, 0.061981201171875, 0.06519699096679688, 0.06841278076171875, 0.07162857055664062, 0.0748443603515625, 0.07806015014648438, 0.08127593994140625, 0.08449172973632812, 0.08770751953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 10.0, 11.0, 12.0, 16.0, 20.0, 27.0, 32.0, 34.0, 48.0, 46.0, 39.0, 53.0, 52.0, 51.0, 63.0, 54.0, 43.0, 44.0, 53.0, 42.0, 43.0, 34.0, 30.0, 27.0, 21.0, 17.0, 14.0, 16.0, 9.0, 7.0, 5.0, 4.0, 6.0, 1.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.059173583984375, -0.05750751495361328, -0.05584144592285156, -0.054175376892089844, -0.052509307861328125, -0.050843238830566406, -0.04917716979980469, -0.04751110076904297, -0.04584503173828125, -0.04417896270751953, -0.04251289367675781, -0.040846824645996094, -0.039180755615234375, -0.037514686584472656, -0.03584861755371094, -0.03418254852294922, -0.0325164794921875, -0.03085041046142578, -0.029184341430664062, -0.027518272399902344, -0.025852203369140625, -0.024186134338378906, -0.022520065307617188, -0.02085399627685547, -0.01918792724609375, -0.01752185821533203, -0.015855789184570312, -0.014189720153808594, -0.012523651123046875, -0.010857582092285156, -0.009191513061523438, -0.007525444030761719, -0.005859375, -0.004193305969238281, -0.0025272369384765625, -0.0008611679077148438, 0.000804901123046875, 0.0024709701538085938, 0.0041370391845703125, 0.005803108215332031, 0.00746917724609375, 0.009135246276855469, 0.010801315307617188, 0.012467384338378906, 0.014133453369140625, 0.015799522399902344, 0.017465591430664062, 0.01913166046142578, 0.0207977294921875, 0.02246379852294922, 0.024129867553710938, 0.025795936584472656, 0.027462005615234375, 0.029128074645996094, 0.030794143676757812, 0.03246021270751953, 0.03412628173828125, 0.03579235076904297, 0.03745841979980469, 0.039124488830566406, 0.040790557861328125, 0.042456626892089844, 0.04412269592285156, 0.04578876495361328, 0.047454833984375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 3.0, 4.0, 8.0, 10.0, 9.0, 11.0, 15.0, 35.0, 44.0, 65.0, 86.0, 131.0, 193.0, 303.0, 526.0, 983.0, 2336.0, 7420.0, 46037.0, 829583.0, 140314.0, 13767.0, 3582.0, 1329.0, 670.0, 377.0, 220.0, 158.0, 105.0, 70.0, 48.0, 40.0, 16.0, 17.0, 11.0, 7.0, 5.0, 5.0, 1.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.174560546875, -0.16938018798828125, -0.1641998291015625, -0.15901947021484375, -0.153839111328125, -0.14865875244140625, -0.1434783935546875, -0.13829803466796875, -0.13311767578125, -0.12793731689453125, -0.1227569580078125, -0.11757659912109375, -0.112396240234375, -0.10721588134765625, -0.1020355224609375, -0.09685516357421875, -0.0916748046875, -0.08649444580078125, -0.0813140869140625, -0.07613372802734375, -0.070953369140625, -0.06577301025390625, -0.0605926513671875, -0.05541229248046875, -0.05023193359375, -0.04505157470703125, -0.0398712158203125, -0.03469085693359375, -0.029510498046875, -0.02433013916015625, -0.0191497802734375, -0.01396942138671875, -0.0087890625, -0.00360870361328125, 0.0015716552734375, 0.00675201416015625, 0.011932373046875, 0.01711273193359375, 0.0222930908203125, 0.02747344970703125, 0.03265380859375, 0.03783416748046875, 0.0430145263671875, 0.04819488525390625, 0.053375244140625, 0.05855560302734375, 0.0637359619140625, 0.06891632080078125, 0.0740966796875, 0.07927703857421875, 0.0844573974609375, 0.08963775634765625, 0.094818115234375, 0.09999847412109375, 0.1051788330078125, 0.11035919189453125, 0.11553955078125, 0.12071990966796875, 0.1259002685546875, 0.13108062744140625, 0.136260986328125, 0.14144134521484375, 0.1466217041015625, 0.15180206298828125, 0.156982421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 15.0, 5.0, 13.0, 22.0, 25.0, 24.0, 23.0, 32.0, 46.0, 38.0, 61.0, 54.0, 63.0, 64.0, 78.0, 71.0, 55.0, 50.0, 47.0, 40.0, 26.0, 19.0, 32.0, 12.0, 14.0, 10.0, 11.0, 11.0, 6.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17625045776367188, -0.16939544677734375, -0.16254043579101562, -0.1556854248046875, -0.14883041381835938, -0.14197540283203125, -0.13512039184570312, -0.128265380859375, -0.12141036987304688, -0.11455535888671875, -0.10770034790039062, -0.1008453369140625, -0.09399032592773438, -0.08713531494140625, -0.08028030395507812, -0.07342529296875, -0.06657028198242188, -0.05971527099609375, -0.052860260009765625, -0.0460052490234375, -0.039150238037109375, -0.03229522705078125, -0.025440216064453125, -0.018585205078125, -0.011730194091796875, -0.00487518310546875, 0.001979827880859375, 0.0088348388671875, 0.015689849853515625, 0.02254486083984375, 0.029399871826171875, 0.0362548828125, 0.043109893798828125, 0.04996490478515625, 0.056819915771484375, 0.0636749267578125, 0.07052993774414062, 0.07738494873046875, 0.08423995971679688, 0.091094970703125, 0.09794998168945312, 0.10480499267578125, 0.11166000366210938, 0.1185150146484375, 0.12537002563476562, 0.13222503662109375, 0.13908004760742188, 0.14593505859375, 0.15279006958007812, 0.15964508056640625, 0.16650009155273438, 0.1733551025390625, 0.18021011352539062, 0.18706512451171875, 0.19392013549804688, 0.200775146484375, 0.20763015747070312, 0.21448516845703125, 0.22134017944335938, 0.2281951904296875, 0.23505020141601562, 0.24190521240234375, 0.24876022338867188, 0.255615234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 10.0, 7.0, 10.0, 12.0, 14.0, 22.0, 24.0, 53.0, 74.0, 102.0, 172.0, 316.0, 739.0, 1846.0, 5807.0, 24712.0, 293906.0, 679594.0, 30550.0, 6665.0, 2146.0, 794.0, 384.0, 209.0, 115.0, 76.0, 46.0, 42.0, 20.0, 16.0, 17.0, 12.0, 11.0, 10.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.081298828125, -0.07876300811767578, -0.07622718811035156, -0.07369136810302734, -0.07115554809570312, -0.0686197280883789, -0.06608390808105469, -0.06354808807373047, -0.06101226806640625, -0.05847644805908203, -0.05594062805175781, -0.053404808044433594, -0.050868988037109375, -0.048333168029785156, -0.04579734802246094, -0.04326152801513672, -0.0407257080078125, -0.03818988800048828, -0.03565406799316406, -0.033118247985839844, -0.030582427978515625, -0.028046607971191406, -0.025510787963867188, -0.02297496795654297, -0.02043914794921875, -0.01790332794189453, -0.015367507934570312, -0.012831687927246094, -0.010295867919921875, -0.007760047912597656, -0.0052242279052734375, -0.0026884078979492188, -0.000152587890625, 0.0023832321166992188, 0.0049190521240234375, 0.007454872131347656, 0.009990692138671875, 0.012526512145996094, 0.015062332153320312, 0.01759815216064453, 0.02013397216796875, 0.02266979217529297, 0.025205612182617188, 0.027741432189941406, 0.030277252197265625, 0.032813072204589844, 0.03534889221191406, 0.03788471221923828, 0.0404205322265625, 0.04295635223388672, 0.04549217224121094, 0.048027992248535156, 0.050563812255859375, 0.053099632263183594, 0.05563545227050781, 0.05817127227783203, 0.06070709228515625, 0.06324291229248047, 0.06577873229980469, 0.0683145523071289, 0.07085037231445312, 0.07338619232177734, 0.07592201232910156, 0.07845783233642578, 0.08099365234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 5.0, 9.0, 7.0, 9.0, 10.0, 17.0, 24.0, 22.0, 27.0, 43.0, 49.0, 54.0, 81.0, 78.0, 75.0, 73.0, 67.0, 65.0, 49.0, 50.0, 28.0, 28.0, 20.0, 24.0, 16.0, 12.0, 9.0, 9.0, 2.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-3.6656856536865234e-05, -3.5686418414115906e-05, -3.471598029136658e-05, -3.374554216861725e-05, -3.277510404586792e-05, -3.180466592311859e-05, -3.083422780036926e-05, -2.9863789677619934e-05, -2.8893351554870605e-05, -2.7922913432121277e-05, -2.6952475309371948e-05, -2.598203718662262e-05, -2.501159906387329e-05, -2.4041160941123962e-05, -2.3070722818374634e-05, -2.2100284695625305e-05, -2.1129846572875977e-05, -2.0159408450126648e-05, -1.918897032737732e-05, -1.821853220462799e-05, -1.7248094081878662e-05, -1.6277655959129333e-05, -1.5307217836380005e-05, -1.4336779713630676e-05, -1.3366341590881348e-05, -1.2395903468132019e-05, -1.142546534538269e-05, -1.0455027222633362e-05, -9.484589099884033e-06, -8.514150977134705e-06, -7.543712854385376e-06, -6.573274731636047e-06, -5.602836608886719e-06, -4.63239848613739e-06, -3.6619603633880615e-06, -2.691522240638733e-06, -1.7210841178894043e-06, -7.506459951400757e-07, 2.1979212760925293e-07, 1.1902302503585815e-06, 2.16066837310791e-06, 3.1311064958572388e-06, 4.101544618606567e-06, 5.071982741355896e-06, 6.042420864105225e-06, 7.012858986854553e-06, 7.983297109603882e-06, 8.95373523235321e-06, 9.924173355102539e-06, 1.0894611477851868e-05, 1.1865049600601196e-05, 1.2835487723350525e-05, 1.3805925846099854e-05, 1.4776363968849182e-05, 1.574680209159851e-05, 1.671724021434784e-05, 1.7687678337097168e-05, 1.8658116459846497e-05, 1.9628554582595825e-05, 2.0598992705345154e-05, 2.1569430828094482e-05, 2.253986895084381e-05, 2.351030707359314e-05, 2.4480745196342468e-05, 2.5451183319091797e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 7.0, 12.0, 14.0, 19.0, 24.0, 32.0, 65.0, 97.0, 139.0, 224.0, 415.0, 781.0, 1782.0, 4492.0, 14899.0, 71736.0, 792352.0, 128948.0, 21868.0, 6229.0, 2255.0, 956.0, 499.0, 232.0, 155.0, 91.0, 67.0, 53.0, 24.0, 22.0, 17.0, 11.0, 5.0, 1.0, 5.0, 1.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056793212890625, -0.05466127395629883, -0.052529335021972656, -0.050397396087646484, -0.04826545715332031, -0.04613351821899414, -0.04400157928466797, -0.0418696403503418, -0.039737701416015625, -0.03760576248168945, -0.03547382354736328, -0.03334188461303711, -0.031209945678710938, -0.029078006744384766, -0.026946067810058594, -0.024814128875732422, -0.02268218994140625, -0.020550251007080078, -0.018418312072753906, -0.016286373138427734, -0.014154434204101562, -0.01202249526977539, -0.009890556335449219, -0.007758617401123047, -0.005626678466796875, -0.003494739532470703, -0.0013628005981445312, 0.0007691383361816406, 0.0029010772705078125, 0.005033016204833984, 0.007164955139160156, 0.009296894073486328, 0.0114288330078125, 0.013560771942138672, 0.015692710876464844, 0.017824649810791016, 0.019956588745117188, 0.02208852767944336, 0.02422046661376953, 0.026352405548095703, 0.028484344482421875, 0.030616283416748047, 0.03274822235107422, 0.03488016128540039, 0.03701210021972656, 0.039144039154052734, 0.041275978088378906, 0.04340791702270508, 0.04553985595703125, 0.04767179489135742, 0.049803733825683594, 0.051935672760009766, 0.05406761169433594, 0.05619955062866211, 0.05833148956298828, 0.06046342849731445, 0.06259536743164062, 0.0647273063659668, 0.06685924530029297, 0.06899118423461914, 0.07112312316894531, 0.07325506210327148, 0.07538700103759766, 0.07751893997192383, 0.07965087890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 11.0, 9.0, 11.0, 19.0, 21.0, 29.0, 50.0, 81.0, 124.0, 188.0, 131.0, 93.0, 57.0, 50.0, 32.0, 19.0, 19.0, 14.0, 4.0, 6.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06732177734375, -0.06537199020385742, -0.06342220306396484, -0.061472415924072266, -0.05952262878417969, -0.05757284164428711, -0.05562305450439453, -0.05367326736450195, -0.051723480224609375, -0.0497736930847168, -0.04782390594482422, -0.04587411880493164, -0.04392433166503906, -0.041974544525146484, -0.040024757385253906, -0.03807497024536133, -0.03612518310546875, -0.03417539596557617, -0.032225608825683594, -0.030275821685791016, -0.028326034545898438, -0.02637624740600586, -0.02442646026611328, -0.022476673126220703, -0.020526885986328125, -0.018577098846435547, -0.01662731170654297, -0.01467752456665039, -0.012727737426757812, -0.010777950286865234, -0.008828163146972656, -0.006878376007080078, -0.0049285888671875, -0.002978801727294922, -0.0010290145874023438, 0.0009207725524902344, 0.0028705596923828125, 0.004820346832275391, 0.006770133972167969, 0.008719921112060547, 0.010669708251953125, 0.012619495391845703, 0.014569282531738281, 0.01651906967163086, 0.018468856811523438, 0.020418643951416016, 0.022368431091308594, 0.024318218231201172, 0.02626800537109375, 0.028217792510986328, 0.030167579650878906, 0.032117366790771484, 0.03406715393066406, 0.03601694107055664, 0.03796672821044922, 0.0399165153503418, 0.041866302490234375, 0.04381608963012695, 0.04576587677001953, 0.04771566390991211, 0.04966545104980469, 0.051615238189697266, 0.053565025329589844, 0.05551481246948242, 0.057464599609375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 46.0, 210.0, 583.0, 106.0, 26.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5598280429840088, -1.4586185216903687, -1.357408881187439, -1.2561993598937988, -1.1549897193908691, -1.053780198097229, -0.9525706768035889, -0.851361095905304, -0.750151515007019, -0.6489419341087341, -0.5477323532104492, -0.4465228319168091, -0.34531325101852417, -0.24410367012023926, -0.14289414882659912, -0.04168456792831421, 0.0595250129699707, 0.16073457896709442, 0.26194414496421814, 0.36315369606018066, 0.4643632769584656, 0.5655728578567505, 0.6667823791503906, 0.7679919600486755, 0.8692015409469604, 0.9704111218452454, 1.0716207027435303, 1.1728302240371704, 1.2740397453308105, 1.3752493858337402, 1.4764589071273804, 1.5776684284210205, 1.678877830505371, 1.7800873517990112, 1.881296992301941, 1.982506513595581, 2.0837161540985107, 2.1849255561828613, 2.286135196685791, 2.3873448371887207, 2.4885544776916504, 2.58976411819458, 2.6909735202789307, 2.7921831607818604, 2.89339280128479, 2.9946022033691406, 3.0958118438720703, 3.197021484375, 3.2982308864593506, 3.3994405269622803, 3.500649929046631, 3.6018595695495605, 3.7030692100524902, 3.80427885055542, 3.9054882526397705, 4.006697654724121, 4.107907295227051, 4.2091169357299805, 4.31032657623291, 4.41153621673584, 4.512745380401611, 4.613955020904541, 4.715164661407471, 4.8163743019104, 4.91758394241333]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 7.0, 11.0, 5.0, 13.0, 15.0, 9.0, 12.0, 22.0, 24.0, 30.0, 28.0, 23.0, 33.0, 37.0, 47.0, 67.0, 96.0, 100.0, 57.0, 40.0, 27.0, 29.0, 35.0, 22.0, 25.0, 26.0, 21.0, 13.0, 14.0, 11.0, 15.0, 6.0, 12.0, 6.0, 9.0, 8.0, 3.0, 4.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6319724321365356, -0.6116079092025757, -0.5912433862686157, -0.5708789229393005, -0.5505144000053406, -0.5301498770713806, -0.5097853541374207, -0.4894208312034607, -0.4690563380718231, -0.44869181513786316, -0.4283273220062256, -0.4079627990722656, -0.38759827613830566, -0.3672337830066681, -0.34686926007270813, -0.32650476694107056, -0.3061402440071106, -0.28577572107315063, -0.26541122794151306, -0.2450467050075531, -0.22468219697475433, -0.20431768894195557, -0.1839531660079956, -0.16358865797519684, -0.14322414994239807, -0.1228596419095993, -0.10249512642621994, -0.08213061094284058, -0.06176610291004181, -0.04140159487724304, -0.021037079393863678, -0.000672563910484314, 0.01969200372695923, 0.040056515485048294, 0.06042102724313736, 0.08078554272651672, 0.10115005075931549, 0.12151455879211426, 0.14187908172607422, 0.16224358975887299, 0.18260809779167175, 0.20297260582447052, 0.2233371138572693, 0.24370163679122925, 0.2640661597251892, 0.2844306528568268, 0.30479517579078674, 0.3251596689224243, 0.3455241918563843, 0.36588871479034424, 0.3862532079219818, 0.4066177308559418, 0.42698222398757935, 0.4473467469215393, 0.46771126985549927, 0.48807579278945923, 0.5084402561187744, 0.5288047790527344, 0.5491693019866943, 0.5695337653160095, 0.5898982882499695, 0.6102628111839294, 0.6306273341178894, 0.6509918570518494, 0.6713563799858093]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 11.0, 10.0, 10.0, 25.0, 23.0, 43.0, 55.0, 116.0, 146.0, 270.0, 439.0, 710.0, 1337.0, 2650.0, 5773.0, 14960.0, 53136.0, 268229.0, 1352792.0, 1888248.0, 474993.0, 90092.0, 23957.0, 8738.0, 3640.0, 1693.0, 1007.0, 489.0, 257.0, 165.0, 100.0, 60.0, 24.0, 21.0, 25.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044219970703125, -0.04252958297729492, -0.040839195251464844, -0.039148807525634766, -0.03745841979980469, -0.03576803207397461, -0.03407764434814453, -0.03238725662231445, -0.030696868896484375, -0.029006481170654297, -0.02731609344482422, -0.02562570571899414, -0.023935317993164062, -0.022244930267333984, -0.020554542541503906, -0.018864154815673828, -0.01717376708984375, -0.015483379364013672, -0.013792991638183594, -0.012102603912353516, -0.010412216186523438, -0.00872182846069336, -0.007031440734863281, -0.005341053009033203, -0.003650665283203125, -0.001960277557373047, -0.00026988983154296875, 0.0014204978942871094, 0.0031108856201171875, 0.004801273345947266, 0.006491661071777344, 0.008182048797607422, 0.0098724365234375, 0.011562824249267578, 0.013253211975097656, 0.014943599700927734, 0.016633987426757812, 0.01832437515258789, 0.02001476287841797, 0.021705150604248047, 0.023395538330078125, 0.025085926055908203, 0.02677631378173828, 0.02846670150756836, 0.030157089233398438, 0.031847476959228516, 0.033537864685058594, 0.03522825241088867, 0.03691864013671875, 0.03860902786254883, 0.040299415588378906, 0.041989803314208984, 0.04368019104003906, 0.04537057876586914, 0.04706096649169922, 0.0487513542175293, 0.050441741943359375, 0.05213212966918945, 0.05382251739501953, 0.05551290512084961, 0.05720329284667969, 0.058893680572509766, 0.060584068298339844, 0.06227445602416992, 0.06396484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 7.0, 11.0, 12.0, 20.0, 17.0, 24.0, 26.0, 37.0, 30.0, 50.0, 46.0, 46.0, 59.0, 47.0, 52.0, 44.0, 62.0, 51.0, 48.0, 48.0, 44.0, 35.0, 40.0, 33.0, 20.0, 24.0, 11.0, 20.0, 12.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06549072265625, -0.06374740600585938, -0.06200408935546875, -0.060260772705078125, -0.0585174560546875, -0.056774139404296875, -0.05503082275390625, -0.053287506103515625, -0.051544189453125, -0.049800872802734375, -0.04805755615234375, -0.046314239501953125, -0.0445709228515625, -0.042827606201171875, -0.04108428955078125, -0.039340972900390625, -0.03759765625, -0.035854339599609375, -0.03411102294921875, -0.032367706298828125, -0.0306243896484375, -0.028881072998046875, -0.02713775634765625, -0.025394439697265625, -0.023651123046875, -0.021907806396484375, -0.02016448974609375, -0.018421173095703125, -0.0166778564453125, -0.014934539794921875, -0.01319122314453125, -0.011447906494140625, -0.00970458984375, -0.007961273193359375, -0.00621795654296875, -0.004474639892578125, -0.0027313232421875, -0.000988006591796875, 0.00075531005859375, 0.002498626708984375, 0.004241943359375, 0.005985260009765625, 0.00772857666015625, 0.009471893310546875, 0.0112152099609375, 0.012958526611328125, 0.01470184326171875, 0.016445159912109375, 0.0181884765625, 0.019931793212890625, 0.02167510986328125, 0.023418426513671875, 0.0251617431640625, 0.026905059814453125, 0.02864837646484375, 0.030391693115234375, 0.032135009765625, 0.033878326416015625, 0.03562164306640625, 0.037364959716796875, 0.0391082763671875, 0.040851593017578125, 0.04259490966796875, 0.044338226318359375, 0.04608154296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 6.0, 16.0, 18.0, 16.0, 34.0, 59.0, 75.0, 106.0, 156.0, 292.0, 575.0, 1333.0, 5867.0, 80586.0, 3985617.0, 110135.0, 6542.0, 1447.0, 595.0, 301.0, 144.0, 117.0, 56.0, 46.0, 31.0, 30.0, 12.0, 15.0, 10.0, 10.0, 3.0, 5.0, 5.0, 0.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2275390625, -0.22008705139160156, -0.21263504028320312, -0.2051830291748047, -0.19773101806640625, -0.1902790069580078, -0.18282699584960938, -0.17537498474121094, -0.1679229736328125, -0.16047096252441406, -0.15301895141601562, -0.1455669403076172, -0.13811492919921875, -0.1306629180908203, -0.12321090698242188, -0.11575889587402344, -0.108306884765625, -0.10085487365722656, -0.09340286254882812, -0.08595085144042969, -0.07849884033203125, -0.07104682922363281, -0.06359481811523438, -0.05614280700683594, -0.0486907958984375, -0.04123878479003906, -0.033786773681640625, -0.026334762573242188, -0.01888275146484375, -0.011430740356445312, -0.003978729248046875, 0.0034732818603515625, 0.01092529296875, 0.018377304077148438, 0.025829315185546875, 0.03328132629394531, 0.04073333740234375, 0.04818534851074219, 0.055637359619140625, 0.06308937072753906, 0.0705413818359375, 0.07799339294433594, 0.08544540405273438, 0.09289741516113281, 0.10034942626953125, 0.10780143737792969, 0.11525344848632812, 0.12270545959472656, 0.130157470703125, 0.13760948181152344, 0.14506149291992188, 0.1525135040283203, 0.15996551513671875, 0.1674175262451172, 0.17486953735351562, 0.18232154846191406, 0.1897735595703125, 0.19722557067871094, 0.20467758178710938, 0.2121295928955078, 0.21958160400390625, 0.2270336151123047, 0.23448562622070312, 0.24193763732910156, 0.2493896484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 7.0, 5.0, 2.0, 11.0, 19.0, 25.0, 34.0, 50.0, 102.0, 185.0, 329.0, 650.0, 868.0, 758.0, 416.0, 233.0, 136.0, 92.0, 51.0, 31.0, 18.0, 18.0, 9.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1767578125, -0.1721782684326172, -0.16759872436523438, -0.16301918029785156, -0.15843963623046875, -0.15386009216308594, -0.14928054809570312, -0.1447010040283203, -0.1401214599609375, -0.1355419158935547, -0.13096237182617188, -0.12638282775878906, -0.12180328369140625, -0.11722373962402344, -0.11264419555664062, -0.10806465148925781, -0.103485107421875, -0.09890556335449219, -0.09432601928710938, -0.08974647521972656, -0.08516693115234375, -0.08058738708496094, -0.07600784301757812, -0.07142829895019531, -0.0668487548828125, -0.06226921081542969, -0.057689666748046875, -0.05311012268066406, -0.04853057861328125, -0.04395103454589844, -0.039371490478515625, -0.03479194641113281, -0.03021240234375, -0.025632858276367188, -0.021053314208984375, -0.016473770141601562, -0.01189422607421875, -0.0073146820068359375, -0.002735137939453125, 0.0018444061279296875, 0.0064239501953125, 0.011003494262695312, 0.015583038330078125, 0.020162582397460938, 0.02474212646484375, 0.029321670532226562, 0.033901214599609375, 0.03848075866699219, 0.043060302734375, 0.04763984680175781, 0.052219390869140625, 0.05679893493652344, 0.06137847900390625, 0.06595802307128906, 0.07053756713867188, 0.07511711120605469, 0.0796966552734375, 0.08427619934082031, 0.08885574340820312, 0.09343528747558594, 0.09801483154296875, 0.10259437561035156, 0.10717391967773438, 0.11175346374511719, 0.1163330078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 17.0, 20.0, 50.0, 114.0, 245.0, 258.0, 164.0, 58.0, 33.0, 12.0, 9.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2218151092529297, -1.166082739830017, -1.110350489616394, -1.0546181201934814, -0.9988858103752136, -0.9431535005569458, -0.8874211311340332, -0.8316888213157654, -0.7759565114974976, -0.7202242016792297, -0.6644918322563171, -0.6087595224380493, -0.5530272126197815, -0.4972948729991913, -0.4415625333786011, -0.38583022356033325, -0.33009785413742065, -0.27436551451683044, -0.21863320469856262, -0.1629008650779724, -0.1071685403585434, -0.05143621563911438, 0.00429612398147583, 0.06002843379974365, 0.11576077342033386, 0.17149309813976288, 0.2272254228591919, 0.2829577624797821, 0.3386901021003723, 0.39442241191864014, 0.45015475153923035, 0.5058870315551758, 0.5616194009780884, 0.6173517107963562, 0.6730840802192688, 0.7288163900375366, 0.7845486998558044, 0.8402810096740723, 0.8960133790969849, 0.9517456889152527, 1.0074779987335205, 1.063210368156433, 1.1189426183700562, 1.1746749877929688, 1.2304073572158813, 1.2861396074295044, 1.341871976852417, 1.39760422706604, 1.4533367156982422, 1.5090690851211548, 1.5648013353347778, 1.6205337047576904, 1.676266074180603, 1.731998324394226, 1.7877306938171387, 1.8434629440307617, 1.8991953134536743, 1.954927682876587, 2.01065993309021, 2.066392421722412, 2.122124671936035, 2.177856922149658, 2.2335891723632812, 2.2893216609954834, 2.3450539112091064]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 14.0, 19.0, 20.0, 32.0, 38.0, 43.0, 48.0, 42.0, 55.0, 38.0, 41.0, 62.0, 47.0, 57.0, 33.0, 58.0, 60.0, 32.0, 47.0, 28.0, 34.0, 33.0, 24.0, 18.0, 21.0, 15.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7813282608985901, -0.7614042162895203, -0.7414801716804504, -0.7215561270713806, -0.701632022857666, -0.6817079782485962, -0.6617839336395264, -0.6418598890304565, -0.6219358444213867, -0.6020117998123169, -0.5820877552032471, -0.5621637105941772, -0.5422396659851074, -0.5223155617713928, -0.502391517162323, -0.4824674725532532, -0.46254342794418335, -0.4426193833351135, -0.4226953387260437, -0.4027712643146515, -0.38284721970558167, -0.36292317509651184, -0.34299910068511963, -0.3230750560760498, -0.30315101146698, -0.28322696685791016, -0.26330292224884033, -0.24337884783744812, -0.2234548032283783, -0.20353075861930847, -0.18360669910907745, -0.16368263959884644, -0.1437585949897766, -0.12383454293012619, -0.10391049087047577, -0.08398643881082535, -0.06406238675117493, -0.044138334691524506, -0.024214282631874084, -0.004290223121643066, 0.015633821487426758, 0.03555787354707718, 0.0554819256067276, 0.07540597766637802, 0.09533002972602844, 0.11525408178567886, 0.13517813384532928, 0.1551021933555603, 0.17502623796463013, 0.19495028257369995, 0.21487434208393097, 0.234798401594162, 0.2547224462032318, 0.27464649081230164, 0.29457056522369385, 0.31449460983276367, 0.3344186544418335, 0.3543426990509033, 0.37426674365997314, 0.39419081807136536, 0.4141148626804352, 0.434038907289505, 0.4539629817008972, 0.47388702630996704, 0.49381107091903687]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 7.0, 8.0, 8.0, 10.0, 11.0, 32.0, 34.0, 65.0, 104.0, 126.0, 215.0, 346.0, 553.0, 971.0, 1691.0, 3242.0, 6276.0, 13563.0, 33221.0, 98906.0, 351617.0, 369613.0, 105162.0, 34720.0, 14168.0, 6501.0, 3238.0, 1649.0, 968.0, 547.0, 355.0, 210.0, 134.0, 104.0, 56.0, 34.0, 27.0, 22.0, 9.0, 12.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.07183837890625, -0.06972694396972656, -0.06761550903320312, -0.06550407409667969, -0.06339263916015625, -0.06128120422363281, -0.059169769287109375, -0.05705833435058594, -0.0549468994140625, -0.05283546447753906, -0.050724029541015625, -0.04861259460449219, -0.04650115966796875, -0.04438972473144531, -0.042278289794921875, -0.04016685485839844, -0.038055419921875, -0.03594398498535156, -0.033832550048828125, -0.03172111511230469, -0.02960968017578125, -0.027498245239257812, -0.025386810302734375, -0.023275375366210938, -0.0211639404296875, -0.019052505493164062, -0.016941070556640625, -0.014829635620117188, -0.01271820068359375, -0.010606765747070312, -0.008495330810546875, -0.0063838958740234375, -0.0042724609375, -0.0021610260009765625, -4.9591064453125e-05, 0.0020618438720703125, 0.00417327880859375, 0.0062847137451171875, 0.008396148681640625, 0.010507583618164062, 0.0126190185546875, 0.014730453491210938, 0.016841888427734375, 0.018953323364257812, 0.02106475830078125, 0.023176193237304688, 0.025287628173828125, 0.027399063110351562, 0.029510498046875, 0.03162193298339844, 0.033733367919921875, 0.03584480285644531, 0.03795623779296875, 0.04006767272949219, 0.042179107666015625, 0.04429054260253906, 0.0464019775390625, 0.04851341247558594, 0.050624847412109375, 0.05273628234863281, 0.05484771728515625, 0.05695915222167969, 0.059070587158203125, 0.06118202209472656, 0.06329345703125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 4.0, 8.0, 14.0, 8.0, 18.0, 28.0, 29.0, 29.0, 30.0, 43.0, 38.0, 45.0, 53.0, 62.0, 60.0, 61.0, 57.0, 66.0, 53.0, 54.0, 40.0, 32.0, 24.0, 34.0, 26.0, 19.0, 8.0, 13.0, 12.0, 7.0, 7.0, 7.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.07147216796875, -0.06948709487915039, -0.06750202178955078, -0.06551694869995117, -0.06353187561035156, -0.06154680252075195, -0.059561729431152344, -0.057576656341552734, -0.055591583251953125, -0.053606510162353516, -0.051621437072753906, -0.0496363639831543, -0.04765129089355469, -0.04566621780395508, -0.04368114471435547, -0.04169607162475586, -0.03971099853515625, -0.03772592544555664, -0.03574085235595703, -0.03375577926635742, -0.03177070617675781, -0.029785633087158203, -0.027800559997558594, -0.025815486907958984, -0.023830413818359375, -0.021845340728759766, -0.019860267639160156, -0.017875194549560547, -0.015890121459960938, -0.013905048370361328, -0.011919975280761719, -0.00993490219116211, -0.0079498291015625, -0.005964756011962891, -0.003979682922363281, -0.001994609832763672, -9.5367431640625e-06, 0.001975536346435547, 0.003960609436035156, 0.005945682525634766, 0.007930755615234375, 0.009915828704833984, 0.011900901794433594, 0.013885974884033203, 0.015871047973632812, 0.017856121063232422, 0.01984119415283203, 0.02182626724243164, 0.02381134033203125, 0.02579641342163086, 0.02778148651123047, 0.029766559600830078, 0.03175163269042969, 0.0337367057800293, 0.035721778869628906, 0.037706851959228516, 0.039691925048828125, 0.041676998138427734, 0.043662071228027344, 0.04564714431762695, 0.04763221740722656, 0.04961729049682617, 0.05160236358642578, 0.05358743667602539, 0.055572509765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 11.0, 8.0, 12.0, 12.0, 29.0, 33.0, 47.0, 59.0, 74.0, 74.0, 143.0, 174.0, 251.0, 361.0, 628.0, 1183.0, 2612.0, 8682.0, 59931.0, 867790.0, 89294.0, 10852.0, 3020.0, 1231.0, 607.0, 390.0, 265.0, 221.0, 141.0, 103.0, 82.0, 52.0, 46.0, 28.0, 29.0, 15.0, 10.0, 9.0, 9.0, 7.0, 5.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.171142578125, -0.16572189331054688, -0.16030120849609375, -0.15488052368164062, -0.1494598388671875, -0.14403915405273438, -0.13861846923828125, -0.13319778442382812, -0.127777099609375, -0.12235641479492188, -0.11693572998046875, -0.11151504516601562, -0.1060943603515625, -0.10067367553710938, -0.09525299072265625, -0.08983230590820312, -0.08441162109375, -0.07899093627929688, -0.07357025146484375, -0.06814956665039062, -0.0627288818359375, -0.057308197021484375, -0.05188751220703125, -0.046466827392578125, -0.041046142578125, -0.035625457763671875, -0.03020477294921875, -0.024784088134765625, -0.0193634033203125, -0.013942718505859375, -0.00852203369140625, -0.003101348876953125, 0.0023193359375, 0.007740020751953125, 0.01316070556640625, 0.018581390380859375, 0.0240020751953125, 0.029422760009765625, 0.03484344482421875, 0.040264129638671875, 0.045684814453125, 0.051105499267578125, 0.05652618408203125, 0.061946868896484375, 0.0673675537109375, 0.07278823852539062, 0.07820892333984375, 0.08362960815429688, 0.08905029296875, 0.09447097778320312, 0.09989166259765625, 0.10531234741210938, 0.1107330322265625, 0.11615371704101562, 0.12157440185546875, 0.12699508666992188, 0.132415771484375, 0.13783645629882812, 0.14325714111328125, 0.14867782592773438, 0.1540985107421875, 0.15951919555664062, 0.16493988037109375, 0.17036056518554688, 0.17578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 2.0, 9.0, 5.0, 9.0, 15.0, 9.0, 14.0, 18.0, 18.0, 21.0, 25.0, 50.0, 41.0, 45.0, 55.0, 58.0, 49.0, 57.0, 62.0, 73.0, 55.0, 59.0, 41.0, 35.0, 29.0, 30.0, 11.0, 17.0, 12.0, 14.0, 8.0, 11.0, 8.0, 14.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1951904296875, -0.18813133239746094, -0.18107223510742188, -0.1740131378173828, -0.16695404052734375, -0.1598949432373047, -0.15283584594726562, -0.14577674865722656, -0.1387176513671875, -0.13165855407714844, -0.12459945678710938, -0.11754035949707031, -0.11048126220703125, -0.10342216491699219, -0.09636306762695312, -0.08930397033691406, -0.082244873046875, -0.07518577575683594, -0.06812667846679688, -0.06106758117675781, -0.05400848388671875, -0.04694938659667969, -0.039890289306640625, -0.03283119201660156, -0.0257720947265625, -0.018712997436523438, -0.011653900146484375, -0.0045948028564453125, 0.00246429443359375, 0.009523391723632812, 0.016582489013671875, 0.023641586303710938, 0.03070068359375, 0.03775978088378906, 0.044818878173828125, 0.05187797546386719, 0.05893707275390625, 0.06599617004394531, 0.07305526733398438, 0.08011436462402344, 0.0871734619140625, 0.09423255920410156, 0.10129165649414062, 0.10835075378417969, 0.11540985107421875, 0.12246894836425781, 0.12952804565429688, 0.13658714294433594, 0.143646240234375, 0.15070533752441406, 0.15776443481445312, 0.1648235321044922, 0.17188262939453125, 0.1789417266845703, 0.18600082397460938, 0.19305992126464844, 0.2001190185546875, 0.20717811584472656, 0.21423721313476562, 0.2212963104248047, 0.22835540771484375, 0.2354145050048828, 0.24247360229492188, 0.24953269958496094, 0.256591796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 4.0, 8.0, 4.0, 15.0, 14.0, 11.0, 17.0, 37.0, 31.0, 70.0, 92.0, 141.0, 220.0, 416.0, 988.0, 2419.0, 7965.0, 35409.0, 774167.0, 196458.0, 21234.0, 5339.0, 1782.0, 751.0, 362.0, 197.0, 102.0, 75.0, 52.0, 33.0, 29.0, 18.0, 15.0, 18.0, 8.0, 12.0, 5.0, 10.0, 3.0, 6.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.067626953125, -0.06543445587158203, -0.06324195861816406, -0.061049461364746094, -0.058856964111328125, -0.056664466857910156, -0.05447196960449219, -0.05227947235107422, -0.05008697509765625, -0.04789447784423828, -0.04570198059082031, -0.043509483337402344, -0.041316986083984375, -0.039124488830566406, -0.03693199157714844, -0.03473949432373047, -0.0325469970703125, -0.03035449981689453, -0.028162002563476562, -0.025969505310058594, -0.023777008056640625, -0.021584510803222656, -0.019392013549804688, -0.01719951629638672, -0.01500701904296875, -0.012814521789550781, -0.010622024536132812, -0.008429527282714844, -0.006237030029296875, -0.004044532775878906, -0.0018520355224609375, 0.00034046173095703125, 0.002532958984375, 0.004725456237792969, 0.0069179534912109375, 0.009110450744628906, 0.011302947998046875, 0.013495445251464844, 0.015687942504882812, 0.01788043975830078, 0.02007293701171875, 0.02226543426513672, 0.024457931518554688, 0.026650428771972656, 0.028842926025390625, 0.031035423278808594, 0.03322792053222656, 0.03542041778564453, 0.0376129150390625, 0.03980541229248047, 0.04199790954589844, 0.044190406799316406, 0.046382904052734375, 0.048575401306152344, 0.05076789855957031, 0.05296039581298828, 0.05515289306640625, 0.05734539031982422, 0.05953788757324219, 0.061730384826660156, 0.06392288208007812, 0.0661153793334961, 0.06830787658691406, 0.07050037384033203, 0.07269287109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 7.0, 5.0, 12.0, 8.0, 21.0, 15.0, 24.0, 29.0, 42.0, 49.0, 65.0, 82.0, 107.0, 111.0, 91.0, 72.0, 63.0, 60.0, 26.0, 21.0, 12.0, 11.0, 8.0, 11.0, 6.0, 10.0, 5.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.500150680541992e-05, -4.357285797595978e-05, -4.2144209146499634e-05, -4.071556031703949e-05, -3.9286911487579346e-05, -3.78582626581192e-05, -3.642961382865906e-05, -3.5000964999198914e-05, -3.357231616973877e-05, -3.2143667340278625e-05, -3.071501851081848e-05, -2.9286369681358337e-05, -2.7857720851898193e-05, -2.642907202243805e-05, -2.5000423192977905e-05, -2.357177436351776e-05, -2.2143125534057617e-05, -2.0714476704597473e-05, -1.928582787513733e-05, -1.7857179045677185e-05, -1.642853021621704e-05, -1.4999881386756897e-05, -1.3571232557296753e-05, -1.2142583727836609e-05, -1.0713934898376465e-05, -9.28528606891632e-06, -7.856637239456177e-06, -6.427988409996033e-06, -4.999339580535889e-06, -3.5706907510757446e-06, -2.1420419216156006e-06, -7.133930921554565e-07, 7.152557373046875e-07, 2.1439045667648315e-06, 3.5725533962249756e-06, 5.00120222568512e-06, 6.429851055145264e-06, 7.858499884605408e-06, 9.287148714065552e-06, 1.0715797543525696e-05, 1.214444637298584e-05, 1.3573095202445984e-05, 1.5001744031906128e-05, 1.6430392861366272e-05, 1.7859041690826416e-05, 1.928769052028656e-05, 2.0716339349746704e-05, 2.2144988179206848e-05, 2.3573637008666992e-05, 2.5002285838127136e-05, 2.643093466758728e-05, 2.7859583497047424e-05, 2.928823232650757e-05, 3.071688115596771e-05, 3.2145529985427856e-05, 3.3574178814888e-05, 3.5002827644348145e-05, 3.643147647380829e-05, 3.786012530326843e-05, 3.928877413272858e-05, 4.071742296218872e-05, 4.2146071791648865e-05, 4.357472062110901e-05, 4.500336945056915e-05, 4.64320182800293e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 7.0, 4.0, 6.0, 12.0, 13.0, 22.0, 28.0, 47.0, 76.0, 77.0, 159.0, 252.0, 457.0, 1013.0, 2538.0, 8850.0, 48388.0, 801033.0, 159195.0, 18782.0, 4548.0, 1512.0, 645.0, 331.0, 194.0, 132.0, 71.0, 59.0, 24.0, 28.0, 14.0, 11.0, 7.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07965087890625, -0.0774831771850586, -0.07531547546386719, -0.07314777374267578, -0.07098007202148438, -0.06881237030029297, -0.06664466857910156, -0.06447696685791016, -0.06230926513671875, -0.060141563415527344, -0.05797386169433594, -0.05580615997314453, -0.053638458251953125, -0.05147075653076172, -0.04930305480957031, -0.047135353088378906, -0.0449676513671875, -0.042799949645996094, -0.04063224792480469, -0.03846454620361328, -0.036296844482421875, -0.03412914276123047, -0.03196144104003906, -0.029793739318847656, -0.02762603759765625, -0.025458335876464844, -0.023290634155273438, -0.02112293243408203, -0.018955230712890625, -0.01678752899169922, -0.014619827270507812, -0.012452125549316406, -0.010284423828125, -0.008116722106933594, -0.0059490203857421875, -0.0037813186645507812, -0.001613616943359375, 0.0005540847778320312, 0.0027217864990234375, 0.004889488220214844, 0.00705718994140625, 0.009224891662597656, 0.011392593383789062, 0.013560295104980469, 0.015727996826171875, 0.01789569854736328, 0.020063400268554688, 0.022231101989746094, 0.0243988037109375, 0.026566505432128906, 0.028734207153320312, 0.03090190887451172, 0.033069610595703125, 0.03523731231689453, 0.03740501403808594, 0.039572715759277344, 0.04174041748046875, 0.043908119201660156, 0.04607582092285156, 0.04824352264404297, 0.050411224365234375, 0.05257892608642578, 0.05474662780761719, 0.056914329528808594, 0.05908203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 10.0, 6.0, 8.0, 14.0, 19.0, 16.0, 16.0, 42.0, 45.0, 58.0, 72.0, 90.0, 101.0, 121.0, 74.0, 73.0, 41.0, 36.0, 25.0, 18.0, 14.0, 13.0, 11.0, 9.0, 6.0, 8.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04156494140625, -0.04021120071411133, -0.038857460021972656, -0.037503719329833984, -0.03614997863769531, -0.03479623794555664, -0.03344249725341797, -0.0320887565612793, -0.030735015869140625, -0.029381275177001953, -0.02802753448486328, -0.02667379379272461, -0.025320053100585938, -0.023966312408447266, -0.022612571716308594, -0.021258831024169922, -0.01990509033203125, -0.018551349639892578, -0.017197608947753906, -0.015843868255615234, -0.014490127563476562, -0.01313638687133789, -0.011782646179199219, -0.010428905487060547, -0.009075164794921875, -0.007721424102783203, -0.006367683410644531, -0.005013942718505859, -0.0036602020263671875, -0.0023064613342285156, -0.0009527206420898438, 0.0004010200500488281, 0.0017547607421875, 0.003108501434326172, 0.004462242126464844, 0.005815982818603516, 0.0071697235107421875, 0.00852346420288086, 0.009877204895019531, 0.011230945587158203, 0.012584686279296875, 0.013938426971435547, 0.015292167663574219, 0.01664590835571289, 0.017999649047851562, 0.019353389739990234, 0.020707130432128906, 0.022060871124267578, 0.02341461181640625, 0.024768352508544922, 0.026122093200683594, 0.027475833892822266, 0.028829574584960938, 0.03018331527709961, 0.03153705596923828, 0.03289079666137695, 0.034244537353515625, 0.0355982780456543, 0.03695201873779297, 0.03830575942993164, 0.03965950012207031, 0.041013240814208984, 0.042366981506347656, 0.04372072219848633, 0.045074462890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 2.0, 11.0, 13.0, 53.0, 158.0, 520.0, 166.0, 43.0, 19.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9451993703842163, -1.8719384670257568, -1.798677682876587, -1.7254167795181274, -1.652155876159668, -1.578895092010498, -1.5056341886520386, -1.432373285293579, -1.3591125011444092, -1.2858515977859497, -1.2125908136367798, -1.1393299102783203, -1.0660690069198608, -0.9928081631660461, -0.9195473194122314, -0.846286416053772, -0.7730255126953125, -0.6997646689414978, -0.6265037655830383, -0.5532429218292236, -0.47998204827308655, -0.40672117471694946, -0.33346033096313477, -0.2601994276046753, -0.1869385838508606, -0.11367771774530411, -0.04041685163974762, 0.03284400701522827, 0.10610488057136536, 0.17936575412750244, 0.25262659788131714, 0.3258875012397766, 0.39914846420288086, 0.47240933775901794, 0.545670211315155, 0.6189310550689697, 0.6921919584274292, 0.7654528021812439, 0.8387136459350586, 0.9119745492935181, 0.9852353930473328, 1.0584962368011475, 1.131757140159607, 1.2050180435180664, 1.2782788276672363, 1.3515397310256958, 1.4248006343841553, 1.4980614185333252, 1.5713223218917847, 1.6445832252502441, 1.717844009399414, 1.7911049127578735, 1.864365816116333, 1.937626600265503, 2.010887622833252, 2.084148406982422, 2.157409191131592, 2.2306699752807617, 2.3039309978485107, 2.3771917819976807, 2.4504525661468506, 2.5237135887145996, 2.5969743728637695, 2.6702351570129395, 2.7434961795806885]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 8.0, 3.0, 7.0, 6.0, 17.0, 9.0, 23.0, 20.0, 27.0, 31.0, 43.0, 32.0, 45.0, 53.0, 125.0, 159.0, 74.0, 44.0, 29.0, 38.0, 25.0, 30.0, 31.0, 13.0, 15.0, 10.0, 15.0, 6.0, 14.0, 7.0, 11.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8998326659202576, -0.8709866404533386, -0.8421406149864197, -0.8132945895195007, -0.7844486236572266, -0.7556025981903076, -0.7267565727233887, -0.6979105472564697, -0.6690645217895508, -0.6402184963226318, -0.6113724708557129, -0.582526445388794, -0.553680419921875, -0.524834394454956, -0.4959884285926819, -0.46714240312576294, -0.438296377658844, -0.40945035219192505, -0.3806043267250061, -0.35175833106040955, -0.3229123055934906, -0.29406628012657166, -0.2652202844619751, -0.23637425899505615, -0.2075282335281372, -0.17868220806121826, -0.1498361974954605, -0.12099017947912216, -0.09214416146278381, -0.06329813599586487, -0.03445212543010712, -0.005606114864349365, 0.02323991060256958, 0.05208592861890793, 0.08093194663524628, 0.10977796465158463, 0.13862398266792297, 0.16747000813484192, 0.19631601870059967, 0.22516202926635742, 0.25400805473327637, 0.2828540802001953, 0.31170010566711426, 0.3405461013317108, 0.36939212679862976, 0.3982381522655487, 0.42708414793014526, 0.4559301733970642, 0.48477619886398315, 0.5136222243309021, 0.542468249797821, 0.57131427526474, 0.6001602411270142, 0.6290062665939331, 0.657852292060852, 0.686698317527771, 0.7155443429946899, 0.7443903684616089, 0.7732363939285278, 0.8020824193954468, 0.8309284448623657, 0.8597744703292847, 0.8886204361915588, 0.9174664616584778, 0.9463124871253967]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 11.0, 11.0, 22.0, 37.0, 83.0, 131.0, 228.0, 458.0, 867.0, 2013.0, 5077.0, 16346.0, 88497.0, 1024152.0, 2611933.0, 387484.0, 41976.0, 9054.0, 3099.0, 1317.0, 635.0, 363.0, 217.0, 103.0, 76.0, 34.0, 23.0, 8.0, 9.0, 8.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08258056640625, -0.07851314544677734, -0.07444572448730469, -0.07037830352783203, -0.06631088256835938, -0.06224346160888672, -0.05817604064941406, -0.054108619689941406, -0.05004119873046875, -0.045973777770996094, -0.04190635681152344, -0.03783893585205078, -0.033771514892578125, -0.02970409393310547, -0.025636672973632812, -0.021569252014160156, -0.0175018310546875, -0.013434410095214844, -0.009366989135742188, -0.005299568176269531, -0.001232147216796875, 0.0028352737426757812, 0.0069026947021484375, 0.010970115661621094, 0.01503753662109375, 0.019104957580566406, 0.023172378540039062, 0.02723979949951172, 0.031307220458984375, 0.03537464141845703, 0.03944206237792969, 0.043509483337402344, 0.047576904296875, 0.051644325256347656, 0.05571174621582031, 0.05977916717529297, 0.06384658813476562, 0.06791400909423828, 0.07198143005371094, 0.0760488510131836, 0.08011627197265625, 0.0841836929321289, 0.08825111389160156, 0.09231853485107422, 0.09638595581054688, 0.10045337677001953, 0.10452079772949219, 0.10858821868896484, 0.1126556396484375, 0.11672306060791016, 0.12079048156738281, 0.12485790252685547, 0.12892532348632812, 0.13299274444580078, 0.13706016540527344, 0.1411275863647461, 0.14519500732421875, 0.1492624282836914, 0.15332984924316406, 0.15739727020263672, 0.16146469116210938, 0.16553211212158203, 0.1695995330810547, 0.17366695404052734, 0.177734375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 8.0, 9.0, 10.0, 20.0, 27.0, 28.0, 55.0, 59.0, 65.0, 65.0, 87.0, 81.0, 64.0, 68.0, 84.0, 63.0, 56.0, 49.0, 25.0, 23.0, 19.0, 12.0, 11.0, 7.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0743408203125, -0.07168197631835938, -0.06902313232421875, -0.06636428833007812, -0.0637054443359375, -0.061046600341796875, -0.05838775634765625, -0.055728912353515625, -0.053070068359375, -0.050411224365234375, -0.04775238037109375, -0.045093536376953125, -0.0424346923828125, -0.039775848388671875, -0.03711700439453125, -0.034458160400390625, -0.03179931640625, -0.029140472412109375, -0.02648162841796875, -0.023822784423828125, -0.0211639404296875, -0.018505096435546875, -0.01584625244140625, -0.013187408447265625, -0.010528564453125, -0.007869720458984375, -0.00521087646484375, -0.002552032470703125, 0.0001068115234375, 0.002765655517578125, 0.00542449951171875, 0.008083343505859375, 0.0107421875, 0.013401031494140625, 0.01605987548828125, 0.018718719482421875, 0.0213775634765625, 0.024036407470703125, 0.02669525146484375, 0.029354095458984375, 0.032012939453125, 0.034671783447265625, 0.03733062744140625, 0.039989471435546875, 0.0426483154296875, 0.045307159423828125, 0.04796600341796875, 0.050624847412109375, 0.05328369140625, 0.055942535400390625, 0.05860137939453125, 0.061260223388671875, 0.0639190673828125, 0.06657791137695312, 0.06923675537109375, 0.07189559936523438, 0.074554443359375, 0.07721328735351562, 0.07987213134765625, 0.08253097534179688, 0.0851898193359375, 0.08784866333007812, 0.09050750732421875, 0.09316635131835938, 0.0958251953125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 6.0, 14.0, 43.0, 108.0, 361.0, 2020.0, 4175521.0, 15254.0, 685.0, 176.0, 52.0, 16.0, 4.0, 4.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8662109375, -1.809234619140625, -1.75225830078125, -1.695281982421875, -1.6383056640625, -1.581329345703125, -1.52435302734375, -1.467376708984375, -1.410400390625, -1.353424072265625, -1.29644775390625, -1.239471435546875, -1.1824951171875, -1.125518798828125, -1.06854248046875, -1.011566162109375, -0.95458984375, -0.897613525390625, -0.84063720703125, -0.783660888671875, -0.7266845703125, -0.669708251953125, -0.61273193359375, -0.555755615234375, -0.498779296875, -0.441802978515625, -0.38482666015625, -0.327850341796875, -0.2708740234375, -0.213897705078125, -0.15692138671875, -0.099945068359375, -0.04296875, 0.014007568359375, 0.07098388671875, 0.127960205078125, 0.1849365234375, 0.241912841796875, 0.29888916015625, 0.355865478515625, 0.412841796875, 0.469818115234375, 0.52679443359375, 0.583770751953125, 0.6407470703125, 0.697723388671875, 0.75469970703125, 0.811676025390625, 0.86865234375, 0.925628662109375, 0.98260498046875, 1.039581298828125, 1.0965576171875, 1.153533935546875, 1.21051025390625, 1.267486572265625, 1.324462890625, 1.381439208984375, 1.43841552734375, 1.495391845703125, 1.5523681640625, 1.609344482421875, 1.66632080078125, 1.723297119140625, 1.7802734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 10.0, 27.0, 85.0, 604.0, 2247.0, 886.0, 172.0, 43.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.162109375, -1.1327667236328125, -1.103424072265625, -1.0740814208984375, -1.04473876953125, -1.0153961181640625, -0.986053466796875, -0.9567108154296875, -0.9273681640625, -0.8980255126953125, -0.868682861328125, -0.8393402099609375, -0.80999755859375, -0.7806549072265625, -0.751312255859375, -0.7219696044921875, -0.692626953125, -0.6632843017578125, -0.633941650390625, -0.6045989990234375, -0.57525634765625, -0.5459136962890625, -0.516571044921875, -0.4872283935546875, -0.4578857421875, -0.4285430908203125, -0.399200439453125, -0.3698577880859375, -0.34051513671875, -0.3111724853515625, -0.281829833984375, -0.2524871826171875, -0.22314453125, -0.1938018798828125, -0.164459228515625, -0.1351165771484375, -0.10577392578125, -0.0764312744140625, -0.047088623046875, -0.0177459716796875, 0.0115966796875, 0.0409393310546875, 0.070281982421875, 0.0996246337890625, 0.12896728515625, 0.1583099365234375, 0.187652587890625, 0.2169952392578125, 0.246337890625, 0.2756805419921875, 0.305023193359375, 0.3343658447265625, 0.36370849609375, 0.3930511474609375, 0.422393798828125, 0.4517364501953125, 0.4810791015625, 0.5104217529296875, 0.539764404296875, 0.5691070556640625, 0.59844970703125, 0.6277923583984375, 0.657135009765625, 0.6864776611328125, 0.7158203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 7.0, 7.0, 16.0, 36.0, 155.0, 471.0, 232.0, 48.0, 18.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.257539749145508, -10.028176307678223, -9.798812866210938, -9.569448471069336, -9.34008502960205, -9.110721588134766, -8.88135814666748, -8.651994705200195, -8.422630310058594, -8.193266868591309, -7.963902950286865, -7.73453950881958, -7.505175590515137, -7.275812149047852, -7.046448707580566, -6.817084789276123, -6.587721824645996, -6.358358383178711, -6.128994464874268, -5.899631023406982, -5.670267105102539, -5.440903663635254, -5.211540222167969, -4.982176303863525, -4.752812385559082, -4.523448944091797, -4.2940850257873535, -4.064721584320068, -3.835357904434204, -3.60599422454834, -3.3766305446624756, -3.1472668647766113, -2.917903423309326, -2.688539743423462, -2.4591760635375977, -2.2298126220703125, -2.0004489421844482, -1.771085262298584, -1.5417215824127197, -1.312358021736145, -1.0829943418502808, -0.8536307215690613, -0.6242671012878418, -0.39490342140197754, -0.16553980112075806, 0.06382381916046143, 0.2931874990463257, 0.5225510597229004, 0.7519147396087646, 0.9812783598899841, 1.2106419801712036, 1.4400056600570679, 1.6693692207336426, 1.8987329006195068, 2.128096580505371, 2.3574600219726562, 2.5868239402770996, 2.816187620162964, 3.045551300048828, 3.2749147415161133, 3.5042784214019775, 3.733642101287842, 3.963005781173706, 4.19236946105957, 4.4217329025268555]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 8.0, 21.0, 15.0, 40.0, 35.0, 53.0, 62.0, 99.0, 108.0, 122.0, 82.0, 86.0, 66.0, 54.0, 46.0, 21.0, 18.0, 9.0, 14.0, 5.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.027252197265625, -2.9368910789489746, -2.846529960632324, -2.756168842315674, -2.6658077239990234, -2.575446605682373, -2.4850854873657227, -2.3947243690490723, -2.304363250732422, -2.2140021324157715, -2.123641014099121, -2.0332798957824707, -1.9429187774658203, -1.85255765914917, -1.7621965408325195, -1.6718354225158691, -1.5814741849899292, -1.4911130666732788, -1.4007519483566284, -1.310390830039978, -1.2200297117233276, -1.1296685934066772, -1.0393073558807373, -0.9489462971687317, -0.8585851788520813, -0.7682240605354309, -0.6778629422187805, -0.5875017642974854, -0.49714067578315735, -0.40677955746650696, -0.3164184093475342, -0.2260572910308838, -0.1356961727142334, -0.04533504694700241, 0.04502607882022858, 0.13538721203804016, 0.22574833035469055, 0.31610944867134094, 0.4064705967903137, 0.4968317151069641, 0.5871928334236145, 0.6775539517402649, 0.7679150700569153, 0.8582762479782104, 0.9486373662948608, 1.0389984846115112, 1.1293596029281616, 1.219720721244812, 1.3100818395614624, 1.4004429578781128, 1.4908040761947632, 1.5811651945114136, 1.671526312828064, 1.7618874311447144, 1.8522486686706543, 1.9426097869873047, 2.032970905303955, 2.1233320236206055, 2.213693141937256, 2.3040542602539062, 2.3944153785705566, 2.484776496887207, 2.5751376152038574, 2.665498733520508, 2.755859851837158]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 7.0, 12.0, 22.0, 18.0, 33.0, 46.0, 60.0, 120.0, 195.0, 361.0, 702.0, 1712.0, 5231.0, 22506.0, 210973.0, 742097.0, 50351.0, 9213.0, 2710.0, 1063.0, 452.0, 254.0, 157.0, 69.0, 59.0, 31.0, 34.0, 21.0, 12.0, 11.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2091064453125, -0.20348739624023438, -0.19786834716796875, -0.19224929809570312, -0.1866302490234375, -0.18101119995117188, -0.17539215087890625, -0.16977310180664062, -0.164154052734375, -0.15853500366210938, -0.15291595458984375, -0.14729690551757812, -0.1416778564453125, -0.13605880737304688, -0.13043975830078125, -0.12482070922851562, -0.11920166015625, -0.11358261108398438, -0.10796356201171875, -0.10234451293945312, -0.0967254638671875, -0.09110641479492188, -0.08548736572265625, -0.07986831665039062, -0.074249267578125, -0.06863021850585938, -0.06301116943359375, -0.057392120361328125, -0.0517730712890625, -0.046154022216796875, -0.04053497314453125, -0.034915924072265625, -0.029296875, -0.023677825927734375, -0.01805877685546875, -0.012439727783203125, -0.0068206787109375, -0.001201629638671875, 0.00441741943359375, 0.010036468505859375, 0.015655517578125, 0.021274566650390625, 0.02689361572265625, 0.032512664794921875, 0.0381317138671875, 0.043750762939453125, 0.04936981201171875, 0.054988861083984375, 0.06060791015625, 0.06622695922851562, 0.07184600830078125, 0.07746505737304688, 0.0830841064453125, 0.08870315551757812, 0.09432220458984375, 0.09994125366210938, 0.105560302734375, 0.11117935180664062, 0.11679840087890625, 0.12241744995117188, 0.1280364990234375, 0.13365554809570312, 0.13927459716796875, 0.14489364624023438, 0.1505126953125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 19.0, 19.0, 31.0, 45.0, 50.0, 85.0, 82.0, 93.0, 95.0, 99.0, 95.0, 55.0, 58.0, 43.0, 38.0, 31.0, 13.0, 12.0, 9.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14208984375, -0.13695526123046875, -0.1318206787109375, -0.12668609619140625, -0.121551513671875, -0.11641693115234375, -0.1112823486328125, -0.10614776611328125, -0.10101318359375, -0.09587860107421875, -0.0907440185546875, -0.08560943603515625, -0.080474853515625, -0.07534027099609375, -0.0702056884765625, -0.06507110595703125, -0.0599365234375, -0.05480194091796875, -0.0496673583984375, -0.04453277587890625, -0.039398193359375, -0.03426361083984375, -0.0291290283203125, -0.02399444580078125, -0.01885986328125, -0.01372528076171875, -0.0085906982421875, -0.00345611572265625, 0.001678466796875, 0.00681304931640625, 0.0119476318359375, 0.01708221435546875, 0.022216796875, 0.02735137939453125, 0.0324859619140625, 0.03762054443359375, 0.042755126953125, 0.04788970947265625, 0.0530242919921875, 0.05815887451171875, 0.06329345703125, 0.06842803955078125, 0.0735626220703125, 0.07869720458984375, 0.083831787109375, 0.08896636962890625, 0.0941009521484375, 0.09923553466796875, 0.1043701171875, 0.10950469970703125, 0.1146392822265625, 0.11977386474609375, 0.124908447265625, 0.13004302978515625, 0.1351776123046875, 0.14031219482421875, 0.14544677734375, 0.15058135986328125, 0.1557159423828125, 0.16085052490234375, 0.165985107421875, 0.17111968994140625, 0.1762542724609375, 0.18138885498046875, 0.1865234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 7.0, 13.0, 15.0, 24.0, 32.0, 61.0, 71.0, 131.0, 189.0, 405.0, 976.0, 3874.0, 66615.0, 956845.0, 15860.0, 2046.0, 657.0, 257.0, 159.0, 98.0, 67.0, 38.0, 25.0, 17.0, 14.0, 14.0, 12.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2939453125, -0.2856178283691406, -0.27729034423828125, -0.2689628601074219, -0.2606353759765625, -0.2523078918457031, -0.24398040771484375, -0.23565292358398438, -0.227325439453125, -0.21899795532226562, -0.21067047119140625, -0.20234298706054688, -0.1940155029296875, -0.18568801879882812, -0.17736053466796875, -0.16903305053710938, -0.16070556640625, -0.15237808227539062, -0.14405059814453125, -0.13572311401367188, -0.1273956298828125, -0.11906814575195312, -0.11074066162109375, -0.10241317749023438, -0.094085693359375, -0.08575820922851562, -0.07743072509765625, -0.06910324096679688, -0.0607757568359375, -0.052448272705078125, -0.04412078857421875, -0.035793304443359375, -0.0274658203125, -0.019138336181640625, -0.01081085205078125, -0.002483367919921875, 0.0058441162109375, 0.014171600341796875, 0.02249908447265625, 0.030826568603515625, 0.039154052734375, 0.047481536865234375, 0.05580902099609375, 0.06413650512695312, 0.0724639892578125, 0.08079147338867188, 0.08911895751953125, 0.09744644165039062, 0.10577392578125, 0.11410140991210938, 0.12242889404296875, 0.13075637817382812, 0.1390838623046875, 0.14741134643554688, 0.15573883056640625, 0.16406631469726562, 0.172393798828125, 0.18072128295898438, 0.18904876708984375, 0.19737625122070312, 0.2057037353515625, 0.21403121948242188, 0.22235870361328125, 0.23068618774414062, 0.239013671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 5.0, 7.0, 6.0, 14.0, 6.0, 6.0, 6.0, 11.0, 19.0, 17.0, 26.0, 19.0, 19.0, 36.0, 37.0, 36.0, 49.0, 54.0, 54.0, 63.0, 58.0, 63.0, 57.0, 47.0, 43.0, 43.0, 31.0, 21.0, 28.0, 18.0, 9.0, 16.0, 8.0, 16.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3125, -0.3025169372558594, -0.29253387451171875, -0.2825508117675781, -0.2725677490234375, -0.2625846862792969, -0.25260162353515625, -0.24261856079101562, -0.232635498046875, -0.22265243530273438, -0.21266937255859375, -0.20268630981445312, -0.1927032470703125, -0.18272018432617188, -0.17273712158203125, -0.16275405883789062, -0.15277099609375, -0.14278793334960938, -0.13280487060546875, -0.12282180786132812, -0.1128387451171875, -0.10285568237304688, -0.09287261962890625, -0.08288955688476562, -0.072906494140625, -0.06292343139648438, -0.05294036865234375, -0.042957305908203125, -0.0329742431640625, -0.022991180419921875, -0.01300811767578125, -0.003025054931640625, 0.0069580078125, 0.016941070556640625, 0.02692413330078125, 0.036907196044921875, 0.0468902587890625, 0.056873321533203125, 0.06685638427734375, 0.07683944702148438, 0.086822509765625, 0.09680557250976562, 0.10678863525390625, 0.11677169799804688, 0.1267547607421875, 0.13673782348632812, 0.14672088623046875, 0.15670394897460938, 0.16668701171875, 0.17667007446289062, 0.18665313720703125, 0.19663619995117188, 0.2066192626953125, 0.21660232543945312, 0.22658538818359375, 0.23656845092773438, 0.246551513671875, 0.2565345764160156, 0.26651763916015625, 0.2765007019042969, 0.2864837646484375, 0.2964668273925781, 0.30644989013671875, 0.3164329528808594, 0.326416015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 4.0, 8.0, 11.0, 12.0, 19.0, 16.0, 32.0, 42.0, 77.0, 119.0, 219.0, 460.0, 1437.0, 6206.0, 127231.0, 899088.0, 10435.0, 1895.0, 620.0, 270.0, 119.0, 70.0, 42.0, 25.0, 24.0, 23.0, 11.0, 8.0, 8.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046173095703125, -0.04453134536743164, -0.04288959503173828, -0.04124784469604492, -0.03960609436035156, -0.0379643440246582, -0.036322593688964844, -0.034680843353271484, -0.033039093017578125, -0.031397342681884766, -0.029755592346191406, -0.028113842010498047, -0.026472091674804688, -0.024830341339111328, -0.02318859100341797, -0.02154684066772461, -0.01990509033203125, -0.01826333999633789, -0.01662158966064453, -0.014979839324951172, -0.013338088989257812, -0.011696338653564453, -0.010054588317871094, -0.008412837982177734, -0.006771087646484375, -0.005129337310791016, -0.0034875869750976562, -0.0018458366394042969, -0.0002040863037109375, 0.0014376640319824219, 0.0030794143676757812, 0.004721164703369141, 0.0063629150390625, 0.00800466537475586, 0.009646415710449219, 0.011288166046142578, 0.012929916381835938, 0.014571666717529297, 0.016213417053222656, 0.017855167388916016, 0.019496917724609375, 0.021138668060302734, 0.022780418395996094, 0.024422168731689453, 0.026063919067382812, 0.027705669403076172, 0.02934741973876953, 0.03098917007446289, 0.03263092041015625, 0.03427267074584961, 0.03591442108154297, 0.03755617141723633, 0.03919792175292969, 0.04083967208862305, 0.042481422424316406, 0.044123172760009766, 0.045764923095703125, 0.047406673431396484, 0.049048423767089844, 0.0506901741027832, 0.05233192443847656, 0.05397367477416992, 0.05561542510986328, 0.05725717544555664, 0.05889892578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 8.0, 12.0, 14.0, 18.0, 25.0, 37.0, 26.0, 64.0, 73.0, 66.0, 89.0, 112.0, 86.0, 82.0, 55.0, 33.0, 36.0, 35.0, 33.0, 13.0, 14.0, 8.0, 8.0, 5.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.1113624572753906e-05, -3.0152499675750732e-05, -2.919137477874756e-05, -2.8230249881744385e-05, -2.726912498474121e-05, -2.6308000087738037e-05, -2.5346875190734863e-05, -2.438575029373169e-05, -2.3424625396728516e-05, -2.2463500499725342e-05, -2.1502375602722168e-05, -2.0541250705718994e-05, -1.958012580871582e-05, -1.8619000911712646e-05, -1.7657876014709473e-05, -1.66967511177063e-05, -1.5735626220703125e-05, -1.4774501323699951e-05, -1.3813376426696777e-05, -1.2852251529693604e-05, -1.189112663269043e-05, -1.0930001735687256e-05, -9.968876838684082e-06, -9.007751941680908e-06, -8.046627044677734e-06, -7.0855021476745605e-06, -6.124377250671387e-06, -5.163252353668213e-06, -4.202127456665039e-06, -3.2410025596618652e-06, -2.2798776626586914e-06, -1.3187527656555176e-06, -3.5762786865234375e-07, 6.034970283508301e-07, 1.564621925354004e-06, 2.5257468223571777e-06, 3.4868717193603516e-06, 4.447996616363525e-06, 5.409121513366699e-06, 6.370246410369873e-06, 7.331371307373047e-06, 8.29249620437622e-06, 9.253621101379395e-06, 1.0214745998382568e-05, 1.1175870895385742e-05, 1.2136995792388916e-05, 1.309812068939209e-05, 1.4059245586395264e-05, 1.5020370483398438e-05, 1.598149538040161e-05, 1.6942620277404785e-05, 1.790374517440796e-05, 1.8864870071411133e-05, 1.9825994968414307e-05, 2.078711986541748e-05, 2.1748244762420654e-05, 2.2709369659423828e-05, 2.3670494556427002e-05, 2.4631619453430176e-05, 2.559274435043335e-05, 2.6553869247436523e-05, 2.7514994144439697e-05, 2.847611904144287e-05, 2.9437243938446045e-05, 3.039836883544922e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 5.0, 20.0, 16.0, 39.0, 58.0, 84.0, 143.0, 276.0, 581.0, 1333.0, 3996.0, 17940.0, 742952.0, 258402.0, 16274.0, 3851.0, 1347.0, 548.0, 277.0, 163.0, 77.0, 47.0, 37.0, 29.0, 14.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034759521484375, -0.03355979919433594, -0.032360076904296875, -0.031160354614257812, -0.02996063232421875, -0.028760910034179688, -0.027561187744140625, -0.026361465454101562, -0.0251617431640625, -0.023962020874023438, -0.022762298583984375, -0.021562576293945312, -0.02036285400390625, -0.019163131713867188, -0.017963409423828125, -0.016763687133789062, -0.01556396484375, -0.014364242553710938, -0.013164520263671875, -0.011964797973632812, -0.01076507568359375, -0.009565353393554688, -0.008365631103515625, -0.0071659088134765625, -0.0059661865234375, -0.0047664642333984375, -0.003566741943359375, -0.0023670196533203125, -0.00116729736328125, 3.24249267578125e-05, 0.001232147216796875, 0.0024318695068359375, 0.003631591796875, 0.0048313140869140625, 0.006031036376953125, 0.0072307586669921875, 0.00843048095703125, 0.009630203247070312, 0.010829925537109375, 0.012029647827148438, 0.0132293701171875, 0.014429092407226562, 0.015628814697265625, 0.016828536987304688, 0.01802825927734375, 0.019227981567382812, 0.020427703857421875, 0.021627426147460938, 0.0228271484375, 0.024026870727539062, 0.025226593017578125, 0.026426315307617188, 0.02762603759765625, 0.028825759887695312, 0.030025482177734375, 0.031225204467773438, 0.0324249267578125, 0.03362464904785156, 0.034824371337890625, 0.03602409362792969, 0.03722381591796875, 0.03842353820800781, 0.039623260498046875, 0.04082298278808594, 0.042022705078125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 11.0, 19.0, 8.0, 24.0, 64.0, 114.0, 172.0, 236.0, 144.0, 73.0, 30.0, 25.0, 15.0, 11.0, 8.0, 10.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04205322265625, -0.04037761688232422, -0.03870201110839844, -0.037026405334472656, -0.035350799560546875, -0.033675193786621094, -0.03199958801269531, -0.03032398223876953, -0.02864837646484375, -0.02697277069091797, -0.025297164916992188, -0.023621559143066406, -0.021945953369140625, -0.020270347595214844, -0.018594741821289062, -0.01691913604736328, -0.0152435302734375, -0.013567924499511719, -0.011892318725585938, -0.010216712951660156, -0.008541107177734375, -0.006865501403808594, -0.0051898956298828125, -0.0035142898559570312, -0.00183868408203125, -0.00016307830810546875, 0.0015125274658203125, 0.0031881332397460938, 0.004863739013671875, 0.006539344787597656, 0.008214950561523438, 0.009890556335449219, 0.011566162109375, 0.013241767883300781, 0.014917373657226562, 0.016592979431152344, 0.018268585205078125, 0.019944190979003906, 0.021619796752929688, 0.02329540252685547, 0.02497100830078125, 0.02664661407470703, 0.028322219848632812, 0.029997825622558594, 0.031673431396484375, 0.033349037170410156, 0.03502464294433594, 0.03670024871826172, 0.0383758544921875, 0.04005146026611328, 0.04172706604003906, 0.043402671813964844, 0.045078277587890625, 0.046753883361816406, 0.04842948913574219, 0.05010509490966797, 0.05178070068359375, 0.05345630645751953, 0.05513191223144531, 0.056807518005371094, 0.058483123779296875, 0.060158729553222656, 0.06183433532714844, 0.06350994110107422, 0.065185546875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 15.0, 19.0, 77.0, 387.0, 392.0, 57.0, 27.0, 9.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.453125476837158, -2.3740053176879883, -2.2948849201202393, -2.2157647609710693, -2.1366443634033203, -2.0575242042541504, -1.978403925895691, -1.8992836475372314, -1.820163369178772, -1.7410430908203125, -1.661922812461853, -1.5828025341033936, -1.5036823749542236, -1.4245619773864746, -1.3454418182373047, -1.2663215398788452, -1.1872012615203857, -1.1080809831619263, -1.0289607048034668, -0.9498404860496521, -0.8707202076911926, -0.7915999293327332, -0.7124797105789185, -0.633359432220459, -0.5542391538619995, -0.47511887550354004, -0.39599862694740295, -0.31687837839126587, -0.2377581000328064, -0.15863782167434692, -0.07951757311820984, -0.0003973245620727539, 0.07872271537780762, 0.1578429788351059, 0.23696324229240417, 0.31608349084854126, 0.39520376920700073, 0.4743240475654602, 0.5534442663192749, 0.6325645446777344, 0.7116848230361938, 0.7908051013946533, 0.8699253797531128, 0.9490455985069275, 1.0281658172607422, 1.1072862148284912, 1.1864063739776611, 1.2655266523361206, 1.34464693069458, 1.4237672090530396, 1.502887487411499, 1.5820077657699585, 1.661128044128418, 1.740248203277588, 1.8193684816360474, 1.8984887599945068, 1.9776090383529663, 2.056729316711426, 2.1358494758605957, 2.2149698734283447, 2.2940900325775146, 2.3732104301452637, 2.4523305892944336, 2.5314507484436035, 2.6105711460113525]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 7.0, 8.0, 6.0, 11.0, 6.0, 13.0, 15.0, 32.0, 26.0, 22.0, 21.0, 32.0, 35.0, 281.0, 210.0, 37.0, 34.0, 22.0, 24.0, 28.0, 27.0, 25.0, 11.0, 9.0, 6.0, 8.0, 11.0, 5.0, 9.0, 6.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4070903062820435, -1.3643126487731934, -1.3215349912643433, -1.2787573337554932, -1.2359797954559326, -1.1932021379470825, -1.1504244804382324, -1.1076468229293823, -1.0648691654205322, -1.0220915079116821, -0.9793139100074768, -0.9365362524986267, -0.8937586545944214, -0.8509809970855713, -0.8082033395767212, -0.7654256820678711, -0.7226481437683105, -0.6798704862594604, -0.6370928883552551, -0.594315230846405, -0.5515376329421997, -0.5087599754333496, -0.4659823179244995, -0.4232046902179718, -0.3804270625114441, -0.3376494348049164, -0.29487180709838867, -0.2520941495895386, -0.20931652188301086, -0.16653889417648315, -0.12376123666763306, -0.08098360896110535, -0.03820610046386719, 0.004571534693241119, 0.047349169850349426, 0.09012681245803833, 0.13290444016456604, 0.17568206787109375, 0.21845972537994385, 0.26123735308647156, 0.30401498079299927, 0.346792608499527, 0.3895702362060547, 0.4323478937149048, 0.4751255214214325, 0.5179031491279602, 0.5606808066368103, 0.6034584045410156, 0.6462360620498657, 0.6890137195587158, 0.7317913174629211, 0.7745689749717712, 0.8173465728759766, 0.8601242303848267, 0.9029018878936768, 0.9456795454025269, 0.9884571433067322, 1.0312347412109375, 1.0740123987197876, 1.1167900562286377, 1.1595677137374878, 1.202345371246338, 1.2451229095458984, 1.2879005670547485, 1.3306782245635986]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 5.0, 6.0, 9.0, 10.0, 18.0, 15.0, 21.0, 34.0, 37.0, 39.0, 58.0, 78.0, 236.0, 151.0, 60.0, 44.0, 36.0, 38.0, 28.0, 21.0, 8.0, 15.0, 9.0, 10.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0867919921875, -0.08281517028808594, -0.07883834838867188, -0.07486152648925781, -0.07088470458984375, -0.06690788269042969, -0.06293106079101562, -0.05895423889160156, -0.0549774169921875, -0.05100059509277344, -0.047023773193359375, -0.04304695129394531, -0.03907012939453125, -0.03509330749511719, -0.031116485595703125, -0.027139663696289062, -0.023162841796875, -0.019186019897460938, -0.015209197998046875, -0.011232376098632812, -0.00725555419921875, -0.0032787322998046875, 0.000698089599609375, 0.0046749114990234375, 0.0086517333984375, 0.012628555297851562, 0.016605377197265625, 0.020582199096679688, 0.02455902099609375, 0.028535842895507812, 0.032512664794921875, 0.03648948669433594, 0.04046630859375, 0.04444313049316406, 0.048419952392578125, 0.05239677429199219, 0.05637359619140625, 0.06035041809082031, 0.06432723999023438, 0.06830406188964844, 0.0722808837890625, 0.07625770568847656, 0.08023452758789062, 0.08421134948730469, 0.08818817138671875, 0.09216499328613281, 0.09614181518554688, 0.10011863708496094, 0.104095458984375, 0.10807228088378906, 0.11204910278320312, 0.11602592468261719, 0.12000274658203125, 0.12397956848144531, 0.12795639038085938, 0.13193321228027344, 0.1359100341796875, 0.13988685607910156, 0.14386367797851562, 0.1478404998779297, 0.15181732177734375, 0.1557941436767578, 0.15977096557617188, 0.16374778747558594, 0.167724609375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 6.0, 6.0, 15.0, 21.0, 29.0, 35.0, 78.0, 101.0, 196.0, 547.0, 2427.0, 66505.0, 8313514.0, 3883.0, 712.0, 246.0, 118.0, 52.0, 34.0, 19.0, 10.0, 2.0, 11.0, 13.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.9664623141288757, -0.9308241605758667, -0.8951859474182129, -0.8595477342605591, -0.82390958070755, -0.788271427154541, -0.7526332139968872, -0.7169950008392334, -0.6813568472862244, -0.6457186937332153, -0.6100804805755615, -0.5744422674179077, -0.5388041138648987, -0.5031659603118896, -0.46752774715423584, -0.4318895637989044, -0.396251380443573, -0.3606131970882416, -0.32497501373291016, -0.28933683037757874, -0.2536986470222473, -0.2180604636669159, -0.18242228031158447, -0.14678409695625305, -0.11114591360092163, -0.07550773024559021, -0.03986954689025879, -0.004231363534927368, 0.03140681982040405, 0.06704500317573547, 0.1026831865310669, 0.13832136988639832, 0.17395949363708496, 0.20959767699241638, 0.2452358603477478, 0.2808740437030792, 0.31651222705841064, 0.35215041041374207, 0.3877885937690735, 0.4234267771244049, 0.45906496047973633, 0.49470314383506775, 0.5303413271903992, 0.5659794807434082, 0.601617693901062, 0.6372559070587158, 0.6728940606117249, 0.7085322141647339, 0.7441704273223877, 0.7798086404800415, 0.8154467940330505, 0.8510849475860596, 0.8867231607437134, 0.9223613739013672, 0.9579995274543762, 0.9936376810073853, 1.029275894165039, 1.0649141073226929, 1.1005523204803467, 1.136190414428711, 1.1718286275863647, 1.2074668407440186, 1.2431049346923828, 1.2787431478500366, 1.3143813610076904]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 2.0, 6.0, 2.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 5.0, 7.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5830186009407043, -0.5527002811431885, -0.5223819613456726, -0.49206364154815674, -0.46174532175064087, -0.431427001953125, -0.40110865235328674, -0.3707903325557709, -0.340472012758255, -0.31015369296073914, -0.27983537316322327, -0.2495170384645462, -0.21919871866703033, -0.18888039886951447, -0.1585620641708374, -0.12824374437332153, -0.09792542457580566, -0.0676071047782898, -0.03728877753019333, -0.006970450282096863, 0.023347869515419006, 0.053666189312934875, 0.08398452401161194, 0.11430284380912781, 0.14462116360664368, 0.17493948340415955, 0.20525780320167542, 0.23557613790035248, 0.26589447259902954, 0.2962127923965454, 0.3265311121940613, 0.35684943199157715, 0.3871678113937378, 0.41748613119125366, 0.44780445098876953, 0.4781227707862854, 0.5084410905838013, 0.5387594103813171, 0.569077730178833, 0.5993961095809937, 0.6297143697738647, 0.6600326895713806, 0.6903510093688965, 0.7206693291664124, 0.7509876489639282, 0.7813059687614441, 0.81162428855896, 0.8419426679611206, 0.8722609877586365, 0.9025793075561523, 0.9328976273536682, 0.9632159471511841, 0.9935342669487, 1.0238525867462158, 1.0541709661483765, 1.0844892263412476, 1.1148076057434082, 1.1451259851455688, 1.17544424533844, 1.2057626247406006, 1.2360808849334717, 1.2663992643356323, 1.2967175245285034, 1.327035903930664, 1.3573541641235352]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 6.0, 7.0, 8.0, 16.0, 9.0, 24.0, 22.0, 26.0, 39.0, 29.0, 48.0, 63.0, 73.0, 71.0, 63.0, 78.0, 64.0, 51.0, 61.0, 40.0, 38.0, 27.0, 22.0, 23.0, 23.0, 10.0, 10.0, 6.0, 6.0, 7.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.05999755859375, -0.05833101272583008, -0.056664466857910156, -0.054997920989990234, -0.05333137512207031, -0.05166482925415039, -0.04999828338623047, -0.04833173751831055, -0.046665191650390625, -0.0449986457824707, -0.04333209991455078, -0.04166555404663086, -0.03999900817871094, -0.038332462310791016, -0.036665916442871094, -0.03499937057495117, -0.03333282470703125, -0.03166627883911133, -0.029999732971191406, -0.028333187103271484, -0.026666641235351562, -0.02500009536743164, -0.02333354949951172, -0.021667003631591797, -0.020000457763671875, -0.018333911895751953, -0.01666736602783203, -0.01500082015991211, -0.013334274291992188, -0.011667728424072266, -0.010001182556152344, -0.008334636688232422, -0.0066680908203125, -0.005001544952392578, -0.0033349990844726562, -0.0016684532165527344, -1.9073486328125e-06, 0.0016646385192871094, 0.0033311843872070312, 0.004997730255126953, 0.006664276123046875, 0.008330821990966797, 0.009997367858886719, 0.01166391372680664, 0.013330459594726562, 0.014997005462646484, 0.016663551330566406, 0.018330097198486328, 0.01999664306640625, 0.021663188934326172, 0.023329734802246094, 0.024996280670166016, 0.026662826538085938, 0.02832937240600586, 0.02999591827392578, 0.0316624641418457, 0.033329010009765625, 0.03499555587768555, 0.03666210174560547, 0.03832864761352539, 0.03999519348144531, 0.041661739349365234, 0.043328285217285156, 0.04499483108520508, 0.046661376953125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 9.0, 8.0, 11.0, 25.0, 28.0, 39.0, 59.0, 92.0, 127.0, 218.0, 272.0, 497.0, 873.0, 1634.0, 3338.0, 7266.0, 18529.0, 54417.0, 161854.0, 175520.0, 61747.0, 21170.0, 8289.0, 3740.0, 1910.0, 957.0, 586.0, 309.0, 223.0, 147.0, 99.0, 68.0, 54.0, 35.0, 19.0, 20.0, 15.0, 11.0, 6.0, 5.0, 8.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.46240234375, -0.4464874267578125, -0.430572509765625, -0.4146575927734375, -0.39874267578125, -0.3828277587890625, -0.366912841796875, -0.3509979248046875, -0.3350830078125, -0.3191680908203125, -0.303253173828125, -0.2873382568359375, -0.27142333984375, -0.2555084228515625, -0.239593505859375, -0.2236785888671875, -0.207763671875, -0.1918487548828125, -0.175933837890625, -0.1600189208984375, -0.14410400390625, -0.1281890869140625, -0.112274169921875, -0.0963592529296875, -0.0804443359375, -0.0645294189453125, -0.048614501953125, -0.0326995849609375, -0.01678466796875, -0.0008697509765625, 0.015045166015625, 0.0309600830078125, 0.046875, 0.0627899169921875, 0.078704833984375, 0.0946197509765625, 0.11053466796875, 0.1264495849609375, 0.142364501953125, 0.1582794189453125, 0.1741943359375, 0.1901092529296875, 0.206024169921875, 0.2219390869140625, 0.23785400390625, 0.2537689208984375, 0.269683837890625, 0.2855987548828125, 0.301513671875, 0.3174285888671875, 0.333343505859375, 0.3492584228515625, 0.36517333984375, 0.3810882568359375, 0.397003173828125, 0.4129180908203125, 0.4288330078125, 0.4447479248046875, 0.460662841796875, 0.4765777587890625, 0.49249267578125, 0.5084075927734375, 0.524322509765625, 0.5402374267578125, 0.55615234375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 13.0, 9.0, 21.0, 28.0, 35.0, 42.0, 46.0, 62.0, 72.0, 79.0, 105.0, 80.0, 68.0, 76.0, 67.0, 43.0, 36.0, 23.0, 19.0, 21.0, 11.0, 7.0, 8.0, 7.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12005615234375, -0.11648178100585938, -0.11290740966796875, -0.10933303833007812, -0.1057586669921875, -0.10218429565429688, -0.09860992431640625, -0.09503555297851562, -0.091461181640625, -0.08788681030273438, -0.08431243896484375, -0.08073806762695312, -0.0771636962890625, -0.07358932495117188, -0.07001495361328125, -0.06644058227539062, -0.0628662109375, -0.059291839599609375, -0.05571746826171875, -0.052143096923828125, -0.0485687255859375, -0.044994354248046875, -0.04141998291015625, -0.037845611572265625, -0.034271240234375, -0.030696868896484375, -0.02712249755859375, -0.023548126220703125, -0.0199737548828125, -0.016399383544921875, -0.01282501220703125, -0.009250640869140625, -0.00567626953125, -0.002101898193359375, 0.00147247314453125, 0.005046844482421875, 0.0086212158203125, 0.012195587158203125, 0.01576995849609375, 0.019344329833984375, 0.022918701171875, 0.026493072509765625, 0.03006744384765625, 0.033641815185546875, 0.0372161865234375, 0.040790557861328125, 0.04436492919921875, 0.047939300537109375, 0.051513671875, 0.055088043212890625, 0.05866241455078125, 0.062236785888671875, 0.0658111572265625, 0.06938552856445312, 0.07295989990234375, 0.07653427124023438, 0.080108642578125, 0.08368301391601562, 0.08725738525390625, 0.09083175659179688, 0.0944061279296875, 0.09798049926757812, 0.10155487060546875, 0.10512924194335938, 0.10870361328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 15.0, 16.0, 21.0, 43.0, 71.0, 89.0, 101.0, 40.0, 27.0, 14.0, 3.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6835649013519287, -0.6624685525894165, -0.6413722634315491, -0.6202759146690369, -0.5991796255111694, -0.5780832767486572, -0.556986927986145, -0.5358905792236328, -0.5147942900657654, -0.49369797110557556, -0.47260165214538574, -0.45150530338287354, -0.4304089844226837, -0.4093126654624939, -0.3882163166999817, -0.36711999773979187, -0.34602367877960205, -0.32492735981941223, -0.3038310408592224, -0.2827346920967102, -0.2616383731365204, -0.24054205417633057, -0.21944572031497955, -0.19834938645362854, -0.17725306749343872, -0.1561567485332489, -0.1350604146718979, -0.11396408826112747, -0.09286776185035706, -0.07177143543958664, -0.05067510902881622, -0.02957877516746521, -0.008482396602630615, 0.012613929808139801, 0.03371025621891022, 0.054806582629680634, 0.07590290904045105, 0.09699923545122147, 0.11809556186199188, 0.1391918957233429, 0.16028821468353271, 0.18138453364372253, 0.20248086750507355, 0.22357720136642456, 0.24467352032661438, 0.2657698392868042, 0.2868661880493164, 0.3079625070095062, 0.32905882596969604, 0.35015514492988586, 0.3712514638900757, 0.3923478126525879, 0.4134441316127777, 0.43454045057296753, 0.45563679933547974, 0.47673311829566956, 0.4978294372558594, 0.5189257860183716, 0.540022075176239, 0.5611184239387512, 0.5822147130966187, 0.6033110618591309, 0.6244074106216431, 0.6455037593841553, 0.6666000485420227]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 3.0, 3.0, 3.0, 5.0, 9.0, 2.0, 10.0, 15.0, 41.0, 57.0, 78.0, 93.0, 59.0, 23.0, 16.0, 12.0, 8.0, 4.0, 7.0, 4.0, 4.0, 2.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4047253131866455, -0.3888840675354004, -0.3730428218841553, -0.35720157623291016, -0.34136033058166504, -0.3255190849304199, -0.3096778094768524, -0.2938365638256073, -0.2779953181743622, -0.26215407252311707, -0.24631282687187195, -0.23047156631946564, -0.21463032066822052, -0.1987890750169754, -0.1829478144645691, -0.16710656881332397, -0.15126532316207886, -0.13542407751083374, -0.11958282440900803, -0.10374157130718231, -0.0879003256559372, -0.07205908000469208, -0.056217826902866364, -0.04037657380104065, -0.024535328149795532, -0.008694078773260117, 0.007147170603275299, 0.022988419979810715, 0.03882966935634613, 0.05467091500759125, 0.07051216810941696, 0.08635342121124268, 0.10219460725784302, 0.11803585290908813, 0.13387709856033325, 0.14971835911273956, 0.16555960476398468, 0.1814008504152298, 0.1972421109676361, 0.21308335661888123, 0.22892460227012634, 0.24476584792137146, 0.2606070935726166, 0.2764483392238617, 0.2922896146774292, 0.3081308603286743, 0.32397210597991943, 0.33981335163116455, 0.35565459728240967, 0.3714958429336548, 0.3873370885848999, 0.403178334236145, 0.41901957988739014, 0.43486082553863525, 0.45070210099220276, 0.4665433466434479, 0.482384592294693, 0.4982258379459381, 0.5140671133995056, 0.5299083590507507, 0.5457496047019958, 0.561590850353241, 0.5774320960044861, 0.5932733416557312, 0.6091145873069763]}, "eval/loss": 4.63620138168335, "eval/wer": 1.0192383974613248, "eval/runtime": 439.1186, "eval/samples_per_second": 6.017, "eval/steps_per_second": 0.754} \ No newline at end of file